1
0
mirror of https://github.com/pirate/ArchiveBox.git synced 2025-08-22 22:25:24 +02:00

Add exception handling for indexable content reader

This commit is contained in:
jdcaballerov
2020-11-24 09:35:06 -05:00
committed by Nick Sweeting
parent b1d70185ed
commit 5a6b814c79

View File

@@ -97,6 +97,14 @@ def index_links(links: Union[List[Link],None], out_dir: Path=OUTPUT_DIR):
for link in links:
if snap := Snapshot.objects.filter(url=link.url).first():
results = ArchiveResult.objects.indexable().filter(snapshot=snap)
texts = get_indexable_content(results)
log_index_started(link.url)
try:
texts = get_indexable_content(results)
except Exception as err:
stderr()
stderr(
f'[X] An Exception ocurred reading the indexable content={err}:',
color='red',
)
else:
write_search_index(link, texts, out_dir=out_dir)