mirror of
https://github.com/jointakahe/takahe.git
synced 2024-11-21 23:01:00 +00:00
Add identity pruning, improve post pruning
This commit is contained in:
parent
9fc497f826
commit
74f69a3813
5 changed files with 70 additions and 6 deletions
|
@ -3,6 +3,7 @@ import sys
|
|||
|
||||
from django.conf import settings
|
||||
from django.core.management.base import BaseCommand
|
||||
from django.db.models import Q
|
||||
from django.utils import timezone
|
||||
|
||||
from activities.models import Post
|
||||
|
@ -21,13 +22,21 @@ class Command(BaseCommand):
|
|||
)
|
||||
|
||||
def handle(self, number: int, *args, **options):
|
||||
if not settings.SETUP.REMOTE_PRUNE_HORIZON:
|
||||
print("Pruning has been disabled as REMOTE_PRUNE_HORIZON=0")
|
||||
sys.exit(2)
|
||||
# Find a set of posts that match the initial criteria
|
||||
print(f"Running query to find up to {number} old posts...")
|
||||
posts = Post.objects.filter(
|
||||
local=False,
|
||||
created__lt=timezone.now()
|
||||
- datetime.timedelta(days=settings.SETUP.REMOTE_PRUNE_HORIZON),
|
||||
).exclude(interactions__identity__local=True)[:number]
|
||||
).exclude(
|
||||
Q(interactions__identity__local=True)
|
||||
| Q(visibility=Post.Visibilities.mentioned)
|
||||
)[
|
||||
:number
|
||||
]
|
||||
post_ids_and_uris = dict(posts.values_list("object_uri", "id"))
|
||||
print(f" found {len(post_ids_and_uris)}")
|
||||
|
||||
|
@ -43,9 +52,12 @@ class Command(BaseCommand):
|
|||
|
||||
# Delete them
|
||||
print(f" down to {len(post_ids_and_uris)} to delete")
|
||||
number_deleted, _ = Post.objects.filter(
|
||||
print("Deleting...")
|
||||
number_deleted, deleted = Post.objects.filter(
|
||||
id__in=post_ids_and_uris.values()
|
||||
).delete()
|
||||
print(f"Deleted {number_deleted} posts and dependencies")
|
||||
print("Deleted:")
|
||||
for model, model_deleted in deleted.items():
|
||||
print(f" {model}: {model_deleted}")
|
||||
if number_deleted == 0:
|
||||
sys.exit(1)
|
||||
|
|
|
@ -143,9 +143,9 @@ class Settings(BaseSettings):
|
|||
CACHES_DEFAULT: CacheBackendUrl | None = None
|
||||
|
||||
# How long to wait, in days, until remote posts/profiles are pruned from
|
||||
# our database if nobody local has interacted with them. Must be in rough
|
||||
# multiples of two weeks. Set to zero to disable.
|
||||
REMOTE_PRUNE_HORIZON: int = 0
|
||||
# our database if nobody local has interacted with them.
|
||||
# Set to zero to disable.
|
||||
REMOTE_PRUNE_HORIZON: int = 90
|
||||
|
||||
# Stator tuning
|
||||
STATOR_CONCURRENCY: int = 50
|
||||
|
|
0
users/management/__init__.py
Normal file
0
users/management/__init__.py
Normal file
0
users/management/commands/__init__.py
Normal file
0
users/management/commands/__init__.py
Normal file
52
users/management/commands/pruneidentities.py
Normal file
52
users/management/commands/pruneidentities.py
Normal file
|
@ -0,0 +1,52 @@
|
|||
import sys
|
||||
|
||||
from django.conf import settings
|
||||
from django.core.management.base import BaseCommand
|
||||
from django.db.models import Q
|
||||
from django.utils import timezone
|
||||
|
||||
from users.models import Identity
|
||||
|
||||
|
||||
class Command(BaseCommand):
    """
    Management command that deletes remote identities with no recorded use.

    An identity is a candidate when it is not local, was created longer ago
    than ``settings.SETUP.REMOTE_PRUNE_HORIZON`` days, and matches none of
    the relation checks in ``handle``.

    Exit codes: 2 when pruning is disabled (horizon is zero/unset), 1 when
    the run deleted nothing; otherwise the command returns normally.
    """

    help = "Prunes identities that have no local interaction"

    def add_arguments(self, parser):
        """Register ``--number``/``-n``, the cap on identities pruned per run."""
        parser.add_argument(
            "--number",
            "-n",
            type=int,
            default=1000,
            help="The maximum number of identities to prune at once",
        )

    def handle(self, number: int, *args, **options):
        """
        Find up to ``number`` prunable remote identities and delete them.

        Args:
            number: Maximum number of identities to delete in this run.
            *args: Unused positional arguments.
            **options: Remaining parsed command-line options (unused).

        Raises:
            SystemExit: With code 2 if ``REMOTE_PRUNE_HORIZON`` is falsy,
                or code 1 if nothing was deleted.
        """
        # Function-scope import: this module's import block does not bring
        # in ``datetime``, and it is only needed for the horizon arithmetic.
        import datetime

        horizon_days = settings.SETUP.REMOTE_PRUNE_HORIZON
        if not horizon_days:
            print("Pruning has been disabled as REMOTE_PRUNE_HORIZON=0")
            sys.exit(2)

        # Find a set of identities that match the initial criteria
        print(f"Running query to find up to {number} unused identities...")
        # Only identities older than the configured horizon are eligible;
        # comparing against "now" alone would make freshly created
        # identities prunable immediately and ignore the setting's value.
        created_before = timezone.now() - datetime.timedelta(days=horizon_days)
        identities = Identity.objects.filter(
            local=False,
            created__lt=created_before,
        ).exclude(
            # Keep anything that interacted with a local post, or that has
            # any post, follow or block attached in either direction.
            Q(interactions__post__local=True)
            | Q(posts__isnull=False)
            | Q(outbound_follows__isnull=False)
            | Q(inbound_follows__isnull=False)
            | Q(outbound_blocks__isnull=False)
            | Q(inbound_blocks__isnull=False)
        )[:number]
        # Materialise the ids once so the count printed below and the rows
        # deleted are the same set, and the sliced query is not re-run as a
        # LIMIT subquery inside the ``id__in`` lookup.
        identity_ids = list(identities.values_list("id", flat=True))
        print(f" found {len(identity_ids)}")

        # Delete them
        print("Deleting...")
        # delete() returns (total rows removed, {model label: rows removed})
        number_deleted, deleted = Identity.objects.filter(
            id__in=identity_ids
        ).delete()
        print("Deleted:")
        for model, model_deleted in deleted.items():
            print(f" {model}: {model_deleted}")
        # A non-zero exit tells the caller there was nothing to prune.
        if number_deleted == 0:
            sys.exit(1)
|
Loading…
Reference in a new issue