From 1773146833c4d706afd0c64dde84c65c24eb0c93 Mon Sep 17 00:00:00 2001 From: Nick Sweeting Date: Fri, 19 Jan 2024 03:43:36 -0800 Subject: [PATCH] include more output file locations when considering whether snapshot.is_archived --- archivebox/index/schema.py | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/archivebox/index/schema.py b/archivebox/index/schema.py index 85972993..0a9b39c5 100644 --- a/archivebox/index/schema.py +++ b/archivebox/index/schema.py @@ -379,11 +379,15 @@ class Link: output_paths = ( domain(self.url), + 'output.html', 'output.pdf', 'screenshot.png', - 'output.html', + 'singlefile.html', + 'readability/content.html', + 'mercury/content.html', + 'htmltotext.txt', 'media', - 'singlefile.html' + 'git', ) return any(