Further tidy-ups, also adds some ytdlp utils to 'utils'

2026-06-12 05:08:28 +03:00 · 2025-01-20 16:17:57 +01:00
parent befc92deb4
commit fd2e7f973b
6 changed files with 123 additions and 58 deletions
--- a/tests/archivers/test_archiver_base.py
+++ b/tests/archivers/test_archiver_base.py
@@ -3,17 +3,17 @@ import pytest
 from auto_archiver.core import Metadata
 from auto_archiver.core import Step
 from auto_archiver.core.metadata import Metadata
-
+from auto_archiver.archivers.archiver import Archiver
 class TestArchiverBase(object):

-    archiver_class = None
-    config = None
+    archiver_class: str = None
+    config: dict = None

    @pytest.fixture(autouse=True)
    def setup_archiver(self):
        assert self.archiver_class is not None, "self.archiver_class must be set on the subclass"
        assert self.config is not None, "self.config must be a dict set on the subclass"
-        self.archiver = self.archiver_class({self.archiver_class.name: self.config})
+        self.archiver: Archiver = self.archiver_class({self.archiver_class.name: self.config})
    
    def assertValidResponseMetadata(self, test_response: Metadata, title: str, timestamp: str, status: str = ""):
        assert test_response is not False
--- a/tests/archivers/test_generic_archiver.py
+++ b/tests/archivers/test_generic_archiver.py
@@ -46,6 +46,23 @@ class TestGenericArchiver(TestArchiverBase):
        result = self.archiver.download(item)
        assert result.get_url() == "https://www.tiktok.com/@funnycats0ftiktok/video/7345101300750748970"

+    @pytest.mark.download
+    @pytest.mark.parametrize("url", [
+        "https://bsky.app/profile/colborne.bsky.social/post/3lcxcpgt6j42l",
+        "twitter.com/bellingcat/status/123",
+        "https://www.youtube.com/watch?v=1"
+    ])
+    def test_download_nonexistend_media(self, make_item, url):
+        """
+        Test to make sure that the extractor doesn't break on non-existend posts/media
+
+        It should return 'False'
+        """
+        item = make_item(url)
+        result = self.archiver.download(item)
+        assert not result
+
+
    @pytest.mark.download
    def test_youtube_download(self, make_item):
        # url https://www.youtube.com/watch?v=5qap5aO4i9A
@@ -60,14 +77,13 @@ class TestGenericArchiver(TestArchiverBase):

    @pytest.mark.download
    def test_bluesky_download_multiple_images(self, make_item):
-        item = make_item("https://bsky.app/profile/colborne.bsky.social/post/3lec2bqjc5s2y")
+        item = make_item("https://bsky.app/profile/bellingcat.com/post/3lffjoxcu7k2w")
        result = self.archiver.download(item)
        assert result is not False

-    @pytest.mark.skip("ytdlp supports bluesky, but there's currently no way to extract info from pages without videos")
    @pytest.mark.download
    def test_bluesky_download_single_image(self, make_item):
-        item = make_item("https://bsky.app/profile/colborne.bsky.social/post/3lcxcpgt6j42l")
+        item = make_item("https://bsky.app/profile/bellingcat.com/post/3lfn3hbcxgc2q")
        result = self.archiver.download(item)
        assert result is not False
    
@@ -82,6 +98,39 @@ class TestGenericArchiver(TestArchiverBase):
        item = make_item("https://bsky.app/profile/bellingcat.com/post/3le2l4gsxlk2i")
        result = self.archiver.download(item)
        assert result is not False
+    
+    @pytest.mark.download
+    def test_truthsocial_download_video(self, make_item):
+        item = make_item("https://truthsocial.com/@DaynaTrueman/posts/110602446619561579")
+        result = self.archiver.download(item)
+        assert len(result.media) == 1
+        assert result is not False
+
+    @pytest.mark.download
+    def test_truthsocial_download_no_media(self, make_item):
+        item = make_item("https://truthsocial.com/@bbcnewa/posts/109598702184774628")
+        result = self.archiver.download(item)
+        assert result is not False
+    
+    @pytest.mark.download
+    def test_truthsocial_download_poll(self, make_item):
+        item = make_item("https://truthsocial.com/@CNN_US/posts/113724326568555098")
+        result = self.archiver.download(item)
+        assert result is not False
+    
+    @pytest.mark.download
+    def test_truthsocial_download_single_image(self, make_item):
+        item = make_item("https://truthsocial.com/@mariabartiromo/posts/113861116433335006")
+        result = self.archiver.download(item)
+        assert len(result.media) == 1
+        assert result is not False
+
+    @pytest.mark.skip("Currently failing, multiple images are not being downloaded - this is due to an issue with ytdlp extractor")
+    @pytest.mark.download
+    def test_truthsocial_download_multiple_images(self, make_item):
+        item = make_item("https://truthsocial.com/@trrth/posts/113861302149349135")
+        result = self.archiver.download(item)
+        assert len(result.media) == 3

    @pytest.mark.download
    def test_twitter_download_nonexistend_tweet(self, make_item):