|
|
|
|
@@ -4,11 +4,13 @@
|
|
|
|
|
# Python
|
|
|
|
|
import datetime
|
|
|
|
|
import logging
|
|
|
|
|
import pytz
|
|
|
|
|
import re
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Django
|
|
|
|
|
from django.core.management.base import BaseCommand, CommandError
|
|
|
|
|
from django.db import transaction
|
|
|
|
|
from django.db import transaction, connection
|
|
|
|
|
from django.utils.timezone import now
|
|
|
|
|
|
|
|
|
|
# AWX
|
|
|
|
|
@@ -18,6 +20,132 @@ from awx.main.signals import disable_activity_stream, disable_computed_fields
|
|
|
|
|
from awx.main.utils.deletion import AWXCollector, pre_delete
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def unified_job_class_to_event_table_name(job_class):
|
|
|
|
|
return f'main_{job_class().event_class.__name__.lower()}'
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def partition_table_name(job_class, dt):
|
|
|
|
|
suffix = dt.replace(microsecond=0, second=0, minute=0).strftime('%Y%m%d_%H')
|
|
|
|
|
|
|
|
|
|
event_tbl_name = unified_job_class_to_event_table_name(job_class)
|
|
|
|
|
event_tbl_name += f'_{suffix}'
|
|
|
|
|
return event_tbl_name
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def partition_name_dt(part_name):
|
|
|
|
|
"""
|
|
|
|
|
part_name examples:
|
|
|
|
|
main_jobevent_20210318_09
|
|
|
|
|
main_projectupdateevent_20210318_11
|
|
|
|
|
main_inventoryupdateevent_20210318_03
|
|
|
|
|
"""
|
|
|
|
|
if '_unpartitioned' in part_name:
|
|
|
|
|
return None
|
|
|
|
|
p = re.compile('([a-z]+)_([a-z]+)_([0-9]+)_([0-9][0-9])')
|
|
|
|
|
m = p.match(part_name)
|
|
|
|
|
if not m:
|
|
|
|
|
return m
|
|
|
|
|
dt_str = f"{m.group(3)}_{m.group(4)}"
|
|
|
|
|
dt = datetime.datetime.strptime(dt_str, '%Y%m%d_%H').replace(tzinfo=pytz.UTC)
|
|
|
|
|
return dt
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def dt_to_partition_name(tbl_name, dt):
|
|
|
|
|
return f"{tbl_name}_{dt.strftime('%Y%m%d_%H')}"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class DeleteMeta:
|
|
|
|
|
def __init__(self, logger, job_class, cutoff, dry_run):
|
|
|
|
|
self.logger = logger
|
|
|
|
|
self.job_class = job_class
|
|
|
|
|
self.cutoff = cutoff
|
|
|
|
|
self.dry_run = dry_run
|
|
|
|
|
|
|
|
|
|
self.jobs_qs = None # Set in by find_jobs_to_delete()
|
|
|
|
|
|
|
|
|
|
self.parts_no_drop = set() # Set in identify_excluded_partitions()
|
|
|
|
|
self.parts_to_drop = set() # Set in find_partitions_to_drop()
|
|
|
|
|
self.jobs_pk_list = [] # Set in find_jobs_to_delete()
|
|
|
|
|
self.jobs_to_delete_count = 0 # Set in find_jobs_to_delete()
|
|
|
|
|
self.jobs_no_delete_count = 0 # Set in find_jobs_to_delete()
|
|
|
|
|
|
|
|
|
|
def find_jobs_to_delete(self):
|
|
|
|
|
self.jobs_qs = self.job_class.objects.filter(created__lt=self.cutoff).values_list('pk', 'status', 'created')
|
|
|
|
|
for pk, status, created in self.jobs_qs:
|
|
|
|
|
if status not in ['pending', 'waiting', 'running']:
|
|
|
|
|
self.jobs_to_delete_count += 1
|
|
|
|
|
self.jobs_pk_list.append(pk)
|
|
|
|
|
self.jobs_no_delete_count = (
|
|
|
|
|
self.job_class.objects.filter(created__gte=self.cutoff) | self.job_class.objects.filter(status__in=['pending', 'waiting', 'running'])
|
|
|
|
|
).count()
|
|
|
|
|
|
|
|
|
|
def identify_excluded_partitions(self):
|
|
|
|
|
|
|
|
|
|
part_drop = {}
|
|
|
|
|
|
|
|
|
|
for pk, status, created in self.jobs_qs:
|
|
|
|
|
|
|
|
|
|
part_key = partition_table_name(self.job_class, created)
|
|
|
|
|
if status in ['pending', 'waiting', 'running']:
|
|
|
|
|
part_drop[part_key] = False
|
|
|
|
|
else:
|
|
|
|
|
part_drop.setdefault(part_key, True)
|
|
|
|
|
|
|
|
|
|
# Note that parts_no_drop _may_ contain the names of partitions that don't exist
|
|
|
|
|
# This can happen when the cleanup of _unpartitioned_* logic leaves behind jobs with status pending, waiting, running. The find_jobs_to_delete() will
|
|
|
|
|
# pick these jobs up.
|
|
|
|
|
self.parts_no_drop = set([k for k, v in part_drop.items() if v is False])
|
|
|
|
|
|
|
|
|
|
def delete_jobs(self):
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
self.job_class.objects.filter(pk__in=self.jobs_pk_list).delete()
|
|
|
|
|
|
|
|
|
|
def find_partitions_to_drop(self):
|
|
|
|
|
tbl_name = unified_job_class_to_event_table_name(self.job_class)
|
|
|
|
|
|
|
|
|
|
with connection.cursor() as cursor:
|
|
|
|
|
query = "SELECT inhrelid::regclass::text AS child FROM pg_catalog.pg_inherits"
|
|
|
|
|
query += f" WHERE inhparent = 'public.{tbl_name}'::regclass"
|
|
|
|
|
query += f" AND TO_TIMESTAMP(LTRIM(inhrelid::regclass::text, '{tbl_name}_'), 'YYYYMMDD_HH24') < '{self.cutoff}'"
|
|
|
|
|
query += " ORDER BY inhrelid::regclass::text"
|
|
|
|
|
|
|
|
|
|
cursor.execute(query)
|
|
|
|
|
partitions_from_db = [r[0] for r in cursor.fetchall()]
|
|
|
|
|
|
|
|
|
|
partitions_dt = [partition_name_dt(p) for p in partitions_from_db if not None]
|
|
|
|
|
partitions_dt = [p for p in partitions_dt if not None]
|
|
|
|
|
|
|
|
|
|
# convert datetime partition back to string partition
|
|
|
|
|
partitions_maybe_drop = set([dt_to_partition_name(tbl_name, dt) for dt in partitions_dt])
|
|
|
|
|
|
|
|
|
|
# Do not drop partition if there is a job that will not be deleted pointing at it
|
|
|
|
|
self.parts_to_drop = partitions_maybe_drop - self.parts_no_drop
|
|
|
|
|
|
|
|
|
|
def drop_partitions(self):
|
|
|
|
|
if len(self.parts_to_drop) > 0:
|
|
|
|
|
parts_to_drop = list(self.parts_to_drop)
|
|
|
|
|
parts_to_drop.sort() # sort it to make reading it easier for humans
|
|
|
|
|
parts_to_drop_str = ','.join(parts_to_drop)
|
|
|
|
|
if self.dry_run:
|
|
|
|
|
self.logger.debug(f"Would drop event partition(s) {parts_to_drop_str}")
|
|
|
|
|
else:
|
|
|
|
|
self.logger.debug(f"Dropping event partition(s) {parts_to_drop_str}")
|
|
|
|
|
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
with connection.cursor() as cursor:
|
|
|
|
|
cursor.execute(f"DROP TABLE {parts_to_drop_str}")
|
|
|
|
|
else:
|
|
|
|
|
self.logger.debug("No event partitions to drop")
|
|
|
|
|
|
|
|
|
|
def delete(self):
|
|
|
|
|
self.find_jobs_to_delete()
|
|
|
|
|
self.identify_excluded_partitions()
|
|
|
|
|
self.find_partitions_to_drop()
|
|
|
|
|
self.drop_partitions()
|
|
|
|
|
self.delete_jobs()
|
|
|
|
|
return (self.jobs_no_delete_count, self.jobs_to_delete_count)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Command(BaseCommand):
|
|
|
|
|
"""
|
|
|
|
|
Management command to cleanup old jobs and project updates.
|
|
|
|
|
@@ -36,6 +164,43 @@ class Command(BaseCommand):
|
|
|
|
|
parser.add_argument('--notifications', dest='only_notifications', action='store_true', default=False, help='Remove notifications')
|
|
|
|
|
parser.add_argument('--workflow-jobs', default=False, action='store_true', dest='only_workflow_jobs', help='Remove workflow jobs')
|
|
|
|
|
|
|
|
|
|
def cleanup(self, job_class):
|
|
|
|
|
delete_meta = DeleteMeta(self.logger, job_class, self.cutoff, self.dry_run)
|
|
|
|
|
skipped, deleted = delete_meta.delete()
|
|
|
|
|
|
|
|
|
|
return (delete_meta.jobs_no_delete_count, delete_meta.jobs_to_delete_count)
|
|
|
|
|
|
|
|
|
|
def cleanup_jobs_partition(self):
|
|
|
|
|
return self.cleanup(Job)
|
|
|
|
|
|
|
|
|
|
def cleanup_ad_hoc_commands_partition(self):
|
|
|
|
|
return self.cleanup(AdHocCommand)
|
|
|
|
|
|
|
|
|
|
def cleanup_project_updates_partition(self):
|
|
|
|
|
return self.cleanup(ProjectUpdate)
|
|
|
|
|
|
|
|
|
|
def cleanup_inventory_updates_partition(self):
|
|
|
|
|
return self.cleanup(InventoryUpdate)
|
|
|
|
|
|
|
|
|
|
def cleanup_management_jobs_partition(self):
|
|
|
|
|
return self.cleanup(SystemJob)
|
|
|
|
|
|
|
|
|
|
def cleanup_workflow_jobs_partition(self):
|
|
|
|
|
delete_meta = DeleteMeta(self.logger, WorkflowJob, self.cutoff, self.dry_run)
|
|
|
|
|
|
|
|
|
|
delete_meta.find_jobs_to_delete()
|
|
|
|
|
delete_meta.delete_jobs()
|
|
|
|
|
return (delete_meta.jobs_no_delete_count, delete_meta.jobs_to_delete_count)
|
|
|
|
|
|
|
|
|
|
def _cascade_delete_job_events(self, model, pk_list):
|
|
|
|
|
if len(pk_list) > 0:
|
|
|
|
|
with connection.cursor() as cursor:
|
|
|
|
|
tblname = unified_job_class_to_event_table_name(model)
|
|
|
|
|
|
|
|
|
|
pk_list_csv = ','.join(map(str, pk_list))
|
|
|
|
|
rel_name = model().event_parent_key
|
|
|
|
|
cursor.execute(f"DELETE FROM _unpartitioned_{tblname} WHERE {rel_name} IN ({pk_list_csv})")
|
|
|
|
|
|
|
|
|
|
def cleanup_jobs(self):
|
|
|
|
|
skipped, deleted = 0, 0
|
|
|
|
|
|
|
|
|
|
@@ -45,12 +210,14 @@ class Command(BaseCommand):
|
|
|
|
|
# get queryset for available jobs to remove
|
|
|
|
|
qs = Job.objects.filter(created__lt=self.cutoff).exclude(status__in=['pending', 'waiting', 'running'])
|
|
|
|
|
# get pk list for the first N (batch_size) objects
|
|
|
|
|
pk_list = qs[0:batch_size].values_list('pk')
|
|
|
|
|
pk_list = qs[0:batch_size].values_list('pk', flat=True)
|
|
|
|
|
# You cannot delete queries with sql LIMIT set, so we must
|
|
|
|
|
# create a new query from this pk_list
|
|
|
|
|
qs_batch = Job.objects.filter(pk__in=pk_list)
|
|
|
|
|
just_deleted = 0
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
self._cascade_delete_job_events(Job, pk_list)
|
|
|
|
|
|
|
|
|
|
del_query = pre_delete(qs_batch)
|
|
|
|
|
collector = AWXCollector(del_query.db)
|
|
|
|
|
collector.collect(del_query)
|
|
|
|
|
@@ -71,6 +238,7 @@ class Command(BaseCommand):
|
|
|
|
|
def cleanup_ad_hoc_commands(self):
|
|
|
|
|
skipped, deleted = 0, 0
|
|
|
|
|
ad_hoc_commands = AdHocCommand.objects.filter(created__lt=self.cutoff)
|
|
|
|
|
pk_list = []
|
|
|
|
|
for ad_hoc_command in ad_hoc_commands.iterator():
|
|
|
|
|
ad_hoc_command_display = '"%s" (%d events)' % (str(ad_hoc_command), ad_hoc_command.ad_hoc_command_events.count())
|
|
|
|
|
if ad_hoc_command.status in ('pending', 'waiting', 'running'):
|
|
|
|
|
@@ -81,15 +249,20 @@ class Command(BaseCommand):
|
|
|
|
|
action_text = 'would delete' if self.dry_run else 'deleting'
|
|
|
|
|
self.logger.info('%s %s', action_text, ad_hoc_command_display)
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
pk_list.append(ad_hoc_command.pk)
|
|
|
|
|
ad_hoc_command.delete()
|
|
|
|
|
deleted += 1
|
|
|
|
|
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
self._cascade_delete_job_events(AdHocCommand, pk_list)
|
|
|
|
|
|
|
|
|
|
skipped += AdHocCommand.objects.filter(created__gte=self.cutoff).count()
|
|
|
|
|
return skipped, deleted
|
|
|
|
|
|
|
|
|
|
def cleanup_project_updates(self):
|
|
|
|
|
skipped, deleted = 0, 0
|
|
|
|
|
project_updates = ProjectUpdate.objects.filter(created__lt=self.cutoff)
|
|
|
|
|
pk_list = []
|
|
|
|
|
for pu in project_updates.iterator():
|
|
|
|
|
pu_display = '"%s" (type %s)' % (str(pu), str(pu.launch_type))
|
|
|
|
|
if pu.status in ('pending', 'waiting', 'running'):
|
|
|
|
|
@@ -104,15 +277,20 @@ class Command(BaseCommand):
|
|
|
|
|
action_text = 'would delete' if self.dry_run else 'deleting'
|
|
|
|
|
self.logger.info('%s %s', action_text, pu_display)
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
pk_list.append(pu.pk)
|
|
|
|
|
pu.delete()
|
|
|
|
|
deleted += 1
|
|
|
|
|
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
self._cascade_delete_job_events(ProjectUpdate, pk_list)
|
|
|
|
|
|
|
|
|
|
skipped += ProjectUpdate.objects.filter(created__gte=self.cutoff).count()
|
|
|
|
|
return skipped, deleted
|
|
|
|
|
|
|
|
|
|
def cleanup_inventory_updates(self):
|
|
|
|
|
skipped, deleted = 0, 0
|
|
|
|
|
inventory_updates = InventoryUpdate.objects.filter(created__lt=self.cutoff)
|
|
|
|
|
pk_list = []
|
|
|
|
|
for iu in inventory_updates.iterator():
|
|
|
|
|
iu_display = '"%s" (source %s)' % (str(iu), str(iu.source))
|
|
|
|
|
if iu.status in ('pending', 'waiting', 'running'):
|
|
|
|
|
@@ -127,15 +305,20 @@ class Command(BaseCommand):
|
|
|
|
|
action_text = 'would delete' if self.dry_run else 'deleting'
|
|
|
|
|
self.logger.info('%s %s', action_text, iu_display)
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
pk_list.append(iu.pk)
|
|
|
|
|
iu.delete()
|
|
|
|
|
deleted += 1
|
|
|
|
|
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
self._cascade_delete_job_events(InventoryUpdate, pk_list)
|
|
|
|
|
|
|
|
|
|
skipped += InventoryUpdate.objects.filter(created__gte=self.cutoff).count()
|
|
|
|
|
return skipped, deleted
|
|
|
|
|
|
|
|
|
|
def cleanup_management_jobs(self):
|
|
|
|
|
skipped, deleted = 0, 0
|
|
|
|
|
system_jobs = SystemJob.objects.filter(created__lt=self.cutoff)
|
|
|
|
|
pk_list = []
|
|
|
|
|
for sj in system_jobs.iterator():
|
|
|
|
|
sj_display = '"%s" (type %s)' % (str(sj), str(sj.job_type))
|
|
|
|
|
if sj.status in ('pending', 'waiting', 'running'):
|
|
|
|
|
@@ -146,9 +329,13 @@ class Command(BaseCommand):
|
|
|
|
|
action_text = 'would delete' if self.dry_run else 'deleting'
|
|
|
|
|
self.logger.info('%s %s', action_text, sj_display)
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
pk_list.append(sj.pk)
|
|
|
|
|
sj.delete()
|
|
|
|
|
deleted += 1
|
|
|
|
|
|
|
|
|
|
if not self.dry_run:
|
|
|
|
|
self._cascade_delete_job_events(SystemJob, pk_list)
|
|
|
|
|
|
|
|
|
|
skipped += SystemJob.objects.filter(created__gte=self.cutoff).count()
|
|
|
|
|
return skipped, deleted
|
|
|
|
|
|
|
|
|
|
@@ -222,6 +409,13 @@ class Command(BaseCommand):
|
|
|
|
|
for m in model_names:
|
|
|
|
|
if m in models_to_cleanup:
|
|
|
|
|
skipped, deleted = getattr(self, 'cleanup_%s' % m)()
|
|
|
|
|
|
|
|
|
|
func = getattr(self, 'cleanup_%s_partition' % m, None)
|
|
|
|
|
if func:
|
|
|
|
|
skipped_partition, deleted_partition = func()
|
|
|
|
|
skipped += skipped_partition
|
|
|
|
|
deleted += deleted_partition
|
|
|
|
|
|
|
|
|
|
if self.dry_run:
|
|
|
|
|
self.logger.log(99, '%s: %d would be deleted, %d would be skipped.', m.replace('_', ' '), deleted, skipped)
|
|
|
|
|
else:
|
|
|
|
|
|