|
1 | 1 | from waybackprov import get_collection, get_crawls, get_depth, deepest_collection, cdx |
2 | 2 |
|
| 3 | + |
def test_coll():
    """Looking up the UMD Archive-It collection returns its title metadata."""
    metadata = get_collection("ArchiveIt-Collection-2410")
    assert metadata["title"] == "University of Maryland"
6 | 8 |
|
def test_get_crawls():
    """Crawl records for mith.umd.edu exist and carry the expected fields."""
    crawls = list(get_crawls("https://mith.umd.edu"))
    assert len(crawls) > 0
    first = crawls[0]
    # every crawl record must have a truthy value for each of these keys
    for field in ("timestamp", "url", "status", "collections"):
        assert first[field]
    assert len(first["collections"]) > 0
| 17 | + |
15 | 18 |
|
def test_depth():
    """Known collections report their documented nesting depth."""
    expected_depths = {
        "ArchiveIt-Collection-2410": 4,
        "wikipediaoutlinks00003": 3,
    }
    for coll_id, depth in expected_depths.items():
        assert get_depth(coll_id) == depth
19 | 23 |
|
def test_deepest_collection():
    """deepest_collection picks the most deeply nested collection id."""
    candidates = [
        "ArchiveIt-Partner-408",
        "archiveitdigitalcollection",
        "web",
        "archiveitpartners",
        "ArchiveIt-Collection-2410",
    ]
    deepest = deepest_collection(candidates)
    assert deepest == "ArchiveIt-Collection-2410"
| 33 | + |
29 | 34 |
|
def test_loop():
    # Weirdly, some collections can contain themselves when there is a loop,
    # e.g. coll1 ∃ coll2 and coll2 ∃ coll1 — depth must still terminate.
    depth = get_depth("ArchiveIt-Partner-1140")
    assert depth == 3
34 | 40 |
|
def test_prefix():
    """Prefix queries filtered by a status-id regex yield crawl records.

    The regex is a raw string so the digit class is not interpreted as an
    (invalid) string escape sequence, which raises a SyntaxWarning on
    modern Python.
    """
    crawls = get_crawls(
        "https://twitter.com/Guccifer_2", prefix=True, match=r"/status/\d+$"
    )
    crawl = next(crawls)
    assert crawl["url"]
39 | 48 |
|
def test_cdx():
    """cdx() returns the known count of matching URLs for 2016-2018."""
    urls = cdx(
        "https://twitter.com/Guccifer_2",
        match=r"/status/\d+$",  # raw string: avoid invalid \d escape sequence
        start_year=2016,
        end_year=2018,
    )
    assert len(list(urls)) == 132
43 | 57 |
|
| 58 | + |
def test_missing():
    """A URL the Wayback Machine never crawled yields no crawl records."""
    missing_url = "https://twitter.com/slavresistance/status/1016697918970105857/"
    crawls = list(get_crawls(missing_url))
    assert len(crawls) == 0
0 commit comments