From fbb8823e866a90bf77de57c6529ec5c15f915c78 Mon Sep 17 00:00:00 2001 From: Nick Sweeting Date: Tue, 17 Apr 2018 07:00:15 -0400 Subject: [PATCH] cleanup wget options --- archive_methods.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/archive_methods.py b/archive_methods.py index 003df75f..8049a3d5 100644 --- a/archive_methods.py +++ b/archive_methods.py @@ -183,8 +183,9 @@ def fetch_wget(link_dir, link, requisites=FETCH_WGET_REQUISITES, timeout=TIMEOUT return {'output': html_appended_url(link), 'status': 'skipped'} CMD = [ - *'wget --timestamping --adjust-extension --no-parent'.split(' '), # Docs: https://www.gnu.org/software/wget/manual/wget.html - *(('--page-requisites', '--convert-links') if FETCH_WGET_REQUISITES else ()), + # WGET CLI Docs: https://www.gnu.org/software/wget/manual/wget.html + *'wget -N -E -np -x -H -k -K -S --restrict-file-names=unix'.split(' '), + *(('-p',) if FETCH_WGET_REQUISITES else ()), *(('--user-agent="{}"'.format(WGET_USER_AGENT),) if WGET_USER_AGENT else ()), *((() if CHECK_SSL_VALIDITY else ('--no-check-certificate',))), link['url'],