__package__ = 'archivebox.core'

import os
from pathlib import Path

from django.contrib import admin
from django.utils.html import format_html, mark_safe
from django.core.exceptions import ValidationError
from django.urls import reverse, resolve
from django.utils import timezone

from archivebox.config import DATA_DIR
from archivebox.config.common import SERVER_CONFIG
from archivebox.misc.paginators import AccelleratedPaginator
from archivebox.base_models.admin import BaseModelAdmin
from archivebox.hooks import get_extractor_icon

from core.models import ArchiveResult, Snapshot

# NOTE(review): several format_html() templates below have fewer `{}`
# placeholders than positional arguments, which suggests their HTML markup was
# stripped from this copy of the file. The template text is kept exactly as
# found -- confirm against the upstream source before relying on the output.


class ArchiveResultInline(admin.TabularInline):
    """Tabular inline for ArchiveResult rows, parented to a Snapshot."""

    name = 'Archive Results Log'
    model = ArchiveResult
    parent_model = Snapshot
    # fk_name = 'snapshot'
    extra = 0
    sort_fields = ('end_ts', 'extractor', 'output', 'status', 'cmd_version')
    readonly_fields = ('id', 'result_id', 'completed', 'command', 'version')
    fields = ('start_ts', 'end_ts', *readonly_fields, 'extractor', 'cmd', 'cmd_version', 'pwd', 'created_by', 'status', 'retry_at', 'output')
    # exclude = ('id',)
    ordering = ('end_ts',)
    show_change_link = True
    # # classes = ['collapse']

    def get_parent_object_from_request(self, request):
        """Return the parent object addressed by the request URL, or None.

        None is returned when the resolved URL carries no ``object_id``
        kwarg, when no parent row has that primary key, or when the key
        fails validation.
        """
        resolved = resolve(request.path_info)
        # .get() instead of [...]: URLs without an object_id kwarg would
        # otherwise raise an uncaught KeyError.
        object_id = resolved.kwargs.get('object_id')
        if object_id is None:
            return None
        try:
            return self.parent_model.objects.get(pk=object_id)
        except (self.parent_model.DoesNotExist, ValidationError):
            return None

    @admin.display(
        description='Completed',
        ordering='end_ts',
    )
    def completed(self, obj):
        """Render the result's ``end_ts`` as ``YYYY-MM-DD HH:MM:SS``."""
        return format_html('\n\n{}\n\n', obj.end_ts.strftime('%Y-%m-%d %H:%M:%S'))

    def result_id(self, obj):
        """Render a reference to the result's admin change page and short id."""
        return format_html('[{}]', reverse('admin:core_archiveresult_change', args=(obj.id,)), str(obj.id)[:8])

    def command(self, obj):
        """Render the result's command arguments joined by spaces."""
        return format_html('{}', " ".join(obj.cmd or []))

    def version(self, obj):
        """Render the result's ``cmd_version``, or ``-`` when it is empty."""
        return format_html('{}', obj.cmd_version or '-')

    def get_formset(self, request, obj=None, **kwargs):
        """Build the inline formset and pre-fill defaults for new entries.

        When ``obj`` is given, the bookkeeping fields (timestamps, cmd, pwd,
        created_by, cmd_version) are additionally switched to hidden widgets.
        """
        formset = super().get_formset(request, obj, **kwargs)
        base_fields = formset.form.base_fields

        # Prefer the object named in the URL; fall back to the parent object
        # Django passed in, so a failed lookup does not crash below.
        snapshot = self.get_parent_object_from_request(request)
        if snapshot is None:
            snapshot = obj

        # default values for new entries
        base_fields['status'].initial = 'succeeded'
        base_fields['start_ts'].initial = timezone.now()
        base_fields['end_ts'].initial = timezone.now()
        base_fields['cmd_version'].initial = '-'
        if snapshot is not None:
            base_fields['pwd'].initial = str(snapshot.output_dir)
        base_fields['created_by'].initial = request.user
        base_fields['cmd'].initial = '["-"]'
        base_fields['output'].initial = 'Manually recorded cmd output...'

        if obj is not None:
            # hidden values for existing entries and new entries
            for field_name in ('start_ts', 'end_ts', 'cmd', 'pwd', 'created_by', 'cmd_version'):
                field = base_fields[field_name]
                field.widget = field.hidden_widget()

        return formset

    def get_readonly_fields(self, request, obj=None):
        """Return the readonly fields when ``obj`` is given, else an empty list."""
        if obj is not None:
            return self.readonly_fields
        return []


class ArchiveResultAdmin(BaseModelAdmin):
    """Admin list/detail configuration for ArchiveResult."""

    list_display = ('id', 'created_by', 'created_at', 'snapshot_info', 'tags_str', 'status', 'extractor_with_icon', 'cmd_str', 'output_str')
    sort_fields = ('id', 'created_by', 'created_at', 'extractor', 'status')
    readonly_fields = ('cmd_str', 'snapshot_info', 'tags_str', 'created_at', 'modified_at', 'output_summary', 'extractor_with_icon')
    search_fields = ('id', 'snapshot__url', 'extractor', 'output', 'cmd_version', 'cmd', 'snapshot__timestamp')
    fields = ('snapshot', 'extractor', 'status', 'retry_at', 'start_ts', 'end_ts', 'created_by', 'pwd', 'cmd_version', 'cmd', 'output', *readonly_fields)
    autocomplete_fields = ['snapshot']

    list_filter = ('status', 'extractor', 'start_ts', 'cmd_version')
    ordering = ['-start_ts']
    list_per_page = SERVER_CONFIG.SNAPSHOTS_PER_PAGE

    paginator = AccelleratedPaginator
    save_on_top = True

    actions = ['delete_selected']

    class Meta:
        verbose_name = 'Archive Result'
        verbose_name_plural = 'Archive Results'

    def change_view(self, request, object_id, form_url="", extra_context=None):
        """Remember the current request on the admin, then render the change view."""
        self.request = request
        return super().change_view(request, object_id, form_url, extra_context)

    @admin.display(
        description='Snapshot Info'
    )
    def snapshot_info(self, result):
        """Render a one-line summary of the snapshot this result belongs to."""
        return format_html(
            '[{}]   {}   {}\n',
            result.snapshot.timestamp,
            str(result.snapshot.id)[:8],
            result.snapshot.bookmarked_at.strftime('%Y-%m-%d %H:%M'),
            result.snapshot.url[:128],
        )

    @admin.display(
        description='Snapshot Tags'
    )
    def tags_str(self, result):
        """Return the tag string of the result's snapshot."""
        return result.snapshot.tags_str()

    @admin.display(description='Extractor', ordering='extractor')
    def extractor_with_icon(self, result):
        """Render the extractor name together with its icon."""
        icon = get_extractor_icon(result.extractor)
        return format_html(
            '{} {}',
            result.extractor,
            icon,
            result.extractor,
        )

    def cmd_str(self, result):
        """Render the command: list items joined by spaces, anything else via str()."""
        return format_html(
            '\n{}\n',
            ' '.join(result.cmd) if isinstance(result.cmd, list) else str(result.cmd),
        )

    def output_str(self, result):
        """Render the result output alongside the path chosen to link to."""
        # Determine output link path - use output if file exists, otherwise link to index
        output_path = result.output if (result.status == 'succeeded' and result.output) else 'index.html'
        return format_html(
            '↗️\n{}\n',
            result.snapshot.timestamp,
            output_path,
            result.output,
        )

    def output_summary(self, result):
        """Render the result output followed by a two-level listing of its files.

        The listing starts at ``<snapshot_dir>/<result.output>`` when that
        path is readable and at the snapshot directory otherwise.
        """
        snapshot_dir = Path(DATA_DIR) / str(result.pwd).split('data/', 1)[-1]
        path_from_output_str = snapshot_dir / (result.output or '')

        # Every piece comes from format_html()/mark_safe(), so joining them
        # and marking the result safe matches the repeated `+=` it replaces.
        pieces = [
            format_html('\n{}\n\n', result.output),
            format_html('See result files ...\n', str(result.snapshot.timestamp)),
            format_html('{}/{}\n\n', str(snapshot_dir), str(result.output)),
        ]

        if os.access(path_from_output_str, os.R_OK):
            root_dir = str(path_from_output_str)
        else:
            root_dir = str(snapshot_dir)

        for root, dirs, files in os.walk(root_dir):
            # Slice the prefix off instead of str.replace(): replace() would
            # also remove later repeats of root_dir inside the path and
            # under-count the depth.
            depth = root[len(root_dir):].count(os.sep) + 1
            if depth > 2:
                continue
            if depth == 2:
                # Nothing below the second level is shown, so stop os.walk
                # from descending further (top-down walks honour in-place
                # edits of `dirs`).
                dirs.clear()
            indent = ' ' * 4 * (depth)
            pieces.append(format_html('{}{}/\n', indent, os.path.basename(root)))
            indentation_str = ' ' * 4 * (depth + 1)
            for filename in sorted(files):
                is_hidden = filename.startswith('.')
                pieces.append(format_html('{}{}\n', int(not is_hidden), indentation_str, filename.strip()))

        pieces.append(mark_safe('\n'))
        return mark_safe(''.join(pieces))


def register_admin(admin_site):
    """Register ArchiveResult with ArchiveResultAdmin on the given admin site."""
    admin_site.register(ArchiveResult, ArchiveResultAdmin)