Mirror of https://github.com/pirate/ArchiveBox.git (synced 2025-08-16 11:35:59 +02:00)
Fix crawl source filenames missing the link's domain
This commit is contained in:
@@ -550,7 +550,7 @@ def add(urls: Union[str, List[str]],
|
|||||||
if new_links and depth == 1:
|
if new_links and depth == 1:
|
||||||
log_crawl_started(new_links)
|
log_crawl_started(new_links)
|
||||||
for new_link in new_links:
|
for new_link in new_links:
|
||||||
downloaded_file = save_file_as_source(new_link.url, filename='{ts}-crawl-{basename}.txt', out_dir=out_dir)
|
downloaded_file = save_file_as_source(new_link.url, filename=f'{new_link.timestamp}-crawl-{new_link.domain}.txt', out_dir=out_dir)
|
||||||
new_links_depth += parse_links_from_source(downloaded_file)
|
new_links_depth += parse_links_from_source(downloaded_file)
|
||||||
|
|
||||||
imported_links = new_links + new_links_depth
|
imported_links = new_links + new_links_depth
|
||||||
|
Reference in New Issue
Block a user