diff --git a/archivebox/extractors/wget.py b/archivebox/extractors/wget.py index 503c3bad..d7133dcb 100644 --- a/archivebox/extractors/wget.py +++ b/archivebox/extractors/wget.py @@ -136,7 +136,6 @@ def wget_output_path(link: Link) -> Optional[str]: See docs on wget --adjust-extension (-E) """ - if is_static_file(link.url): return without_scheme(without_fragment(link.url)) @@ -174,10 +173,9 @@ def wget_output_path(link: Link) -> Optional[str]: full_path = without_fragment(without_query(path(link.url))).strip('/') search_dir = os.path.join( link.link_dir, - domain(link.url), + domain(link.url).replace(":", "+"), urldecode(full_path), ) - for _ in range(4): if os.path.exists(search_dir): if os.path.isdir(search_dir): diff --git a/tests/mock_server/templates/example.com.html b/tests/mock_server/templates/example.com.html index 8492e858..8469956c 100644 --- a/tests/mock_server/templates/example.com.html +++ b/tests/mock_server/templates/example.com.html @@ -40,9 +40,9 @@
This domain is for use in illustrative examples in documents. You may use this - domain in literature without prior coordination or asking for permission.
+ domain in literature without prior coordination or asking for permission.