feat: Add pytest and initial tests

2024-06-01 18:20:20 +12:00 · 2020-07-03 11:52:57 -05:00 · 2020-07-03 11:52:57 -05:00 · 63fe19e2c2
parent ea93e05c3c
commit 63fe19e2c2
3 changed files with 64 additions and 0 deletions
--- a/setup.py
+++ b/setup.py
@ -65,6 +65,9 @@ setuptools.setup(
            "sphinx-rtd-theme",
            "recommonmark",
        ],
+        "test": [
+            "pytest"
+        ]
        # 'redis': ['redis', 'django-redis'],
        # 'pywb': ['pywb', 'redis'],
    },
--- a/tests/test_init.py
+++ b/tests/test_init.py
@ -0,0 +1,40 @@
+# archivebox init
+# archivebox add
+
+import os
+import subprocess
+from pathlib import Path
+import json
+
+import pytest
+
+@pytest.fixture
+def process(tmp_path):
+    os.chdir(tmp_path)
+    process = subprocess.run(['archivebox', 'init'], capture_output=True)
+    return process
+
+
+def test_init(tmp_path, process):
+    assert "Initializing a new ArchiveBox collection in this folder..." in process.stdout.decode("utf-8")
+    
+def test_update(tmp_path, process):
+    os.chdir(tmp_path)
+    update_process = subprocess.run(['archivebox', 'init'], capture_output=True)
+    assert "Updating existing ArchiveBox collection in this folder" in update_process.stdout.decode("utf-8")
+
+def test_add_link(tmp_path, process):
+    os.chdir(tmp_path)
+    add_process = subprocess.run(['archivebox', 'add', 'http://example.com'], capture_output=True)
+    archived_item_path = list(tmp_path.glob('archive/**/*'))[0]
+
+    assert "index.json" in [x.name for x in archived_item_path.iterdir()]
+
+    with open(archived_item_path / "index.json", "r") as f:
+        output_json = json.load(f)
+    assert "IANA — IANA-managed Reserved Domains" == output_json['history']['title'][0]['output']
+
+    with open(tmp_path / "index.html", "r") as f:
+        output_html = f.read()
+    assert "IANA — IANA-managed Reserved Domains" in output_html
+
--- a/tests/test_util.py
+++ b/tests/test_util.py
@ -0,0 +1,21 @@
+#@enforce_types
+#def download_url(url: str, timeout: int=None) -> str:
+#    """Download the contents of a remote url and return the text"""
+#    from .config import TIMEOUT, CHECK_SSL_VALIDITY, WGET_USER_AGENT
+#    timeout = timeout or TIMEOUT
+#    response = requests.get(
+#        url,
+#        headers={'User-Agent': WGET_USER_AGENT},
+#        verify=CHECK_SSL_VALIDITY,
+#        timeout=timeout,
+#    )
+#    if response.headers.get('Content-Type') == 'application/rss+xml':
+#        # Based on https://github.com/scrapy/w3lib/blob/master/w3lib/encoding.py
+#        _TEMPLATE = r'''%s\s*=\s*["']?\s*%s\s*["']?'''
+#        _XML_ENCODING_RE = _TEMPLATE % ('encoding', r'(?P<xmlcharset>[\w-]+)')
+#        _BODY_ENCODING_PATTERN = r'<\s*(\?xml\s[^>]+%s)' % (_XML_ENCODING_RE)
+#        _BODY_ENCODING_STR_RE = re.compile(_BODY_ENCODING_PATTERN, re.I | re.VERBOSE)
+#        match = _BODY_ENCODING_STR_RE.search(response.text[:1024])
+#        if match:
+#            response.encoding = match.group('xmlcharset')
+#    return response.text