ignore robots.txt when using wget

This commit is contained in:
Nick Sweeting 2019-02-06 22:06:28 -08:00
parent 56d382235f
commit e6d5cd4432

View file

@@ -217,6 +217,7 @@ def fetch_wget(link_dir, link, requisites=FETCH_WGET_REQUISITES, warc=FETCH_WARC
'--backup-converted', '--backup-converted',
'--span-hosts', '--span-hosts',
'--no-parent', '--no-parent',
'-e', 'robots=off',
'--restrict-file-names=unix', '--restrict-file-names=unix',
'--timeout={}'.format(timeout), '--timeout={}'.format(timeout),
*(() if warc else ('--timestamping',)), *(() if warc else ('--timestamping',)),