Mirror of https://github.com/pirate/ArchiveBox.git (synced 2025-08-18 20:31:38 +02:00)
ignore robots.txt when using wget
This commit is contained in:
@@ -217,6 +217,7 @@ def fetch_wget(link_dir, link, requisites=FETCH_WGET_REQUISITES, warc=FETCH_WARC
 '--backup-converted',
 '--span-hosts',
 '--no-parent',
+'-e', 'robots=off',
 '--restrict-file-names=unix',
 '--timeout={}'.format(timeout),
 *(() if warc else ('--timestamping',)),
Reference in New Issue
Block a user