2020-07-03 13:54:21 -04:00
|
|
|
|
from archivebox import util
|
|
|
|
|
|
|
|
|
|
def test_download_url_downloads_content():
    """Check that ``util.download_url`` returns the body of a served page.

    Requests the ``example.com.html`` fixture from 127.0.0.1:8080 and
    verifies that the page's known text is present in the result.
    NOTE(review): presumably a local fixture server must already be
    listening on port 8080 -- confirm against the test setup.
    """
    url = "http://127.0.0.1:8080/static/example.com.html"
    text = util.download_url(url)
    assert "Example Domain" in text
|
|
|
|
|
|
|
|
|
|
def test_download_url_gets_encoding_from_body():
    """Check that ``util.download_url`` decodes Japanese text correctly.

    Requests the ``shift_jis.html`` fixture and verifies that two known
    Japanese strings appear intact in the returned text.
    NOTE(review): judging by the URL path, the fixture is presumably
    Shift_JIS encoded and served without a Content-Type header, so the
    encoding has to come from the document body -- confirm against the
    fixture server.
    """
    url = "http://127.0.0.1:8080/static_no_content_type/shift_jis.html"
    text = util.download_url(url)
    # Both strings only match if the body was decoded with the right charset.
    assert "鹿児島のニュース|MBC南日本放送" in text
    assert "掲載された全ての記事・画像等の無断転載、二次利用をお断りいたします" in text
|