Implemented deferred media archiving for all scrapers and added tests for it. Refactored the archiving methods of the Instagram and Gettr scrapers so that they can use the default archiving method.

This commit is contained in:
Tristan Lee
2022-04-01 01:30:49 -05:00
parent 16aad4ef2c
commit 282f33eff3
26 changed files with 417 additions and 261 deletions

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import BitchuteScraper
@pytest.mark.unarchived
def test_scrape_bitchute_channel_no_media(controller, channel_kwargs):
    """Scrape the Bitchute test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['bitchute']``, registers a
    ``BitchuteScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    bitchute_channel = Channel(**channel_kwargs['bitchute'])
    controller.register_scraper(scraper=BitchuteScraper())
    controller.scrape_channels(
        channels=[bitchute_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_bitchute_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_bitchute_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import GabScraper
@pytest.mark.unarchived
def test_scrape_gab_channel_no_media(controller, channel_kwargs):
    """Scrape the Gab test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['gab']``, registers a
    ``GabScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    gab_channel = Channel(**channel_kwargs['gab'])
    controller.register_scraper(scraper=GabScraper())
    controller.scrape_channels(
        channels=[gab_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_gab_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_gab_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import GettrScraper
@pytest.mark.unarchived
def test_scrape_gettr_channel_no_media(controller, channel_kwargs):
    """Scrape the Gettr test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['gettr']``, registers a
    ``GettrScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    gettr_channel = Channel(**channel_kwargs['gettr'])
    controller.register_scraper(scraper=GettrScraper())
    controller.scrape_channels(
        channels=[gettr_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_gettr_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_gettr_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import InstagramScraper
@pytest.mark.unarchived
def test_scrape_instagram_channel_no_media(controller, channel_kwargs):
    """Scrape the Instagram test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['instagram']``, registers an
    ``InstagramScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    instagram_channel = Channel(**channel_kwargs['instagram'])
    controller.register_scraper(scraper=InstagramScraper())
    controller.scrape_channels(
        channels=[instagram_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_instagram_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_instagram_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import OdyseeScraper
@pytest.mark.unarchived
def test_scrape_odysee_channel_no_media(controller, channel_kwargs):
    """Scrape the Odysee test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['odysee']``, registers an
    ``OdyseeScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    odysee_channel = Channel(**channel_kwargs['odysee'])
    controller.register_scraper(scraper=OdyseeScraper())
    controller.scrape_channels(
        channels=[odysee_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_odysee_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_odysee_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import RumbleScraper
@pytest.mark.unarchived
def test_scrape_rumble_channel_no_media(controller, channel_kwargs):
    """Scrape the Rumble test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['rumble']``, registers a
    ``RumbleScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    rumble_channel = Channel(**channel_kwargs['rumble'])
    controller.register_scraper(scraper=RumbleScraper())
    controller.scrape_channels(
        channels=[rumble_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_rumble_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_rumble_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import TelegramSnscrapeScraper
@pytest.mark.unarchived
def test_scrape_telegram_snscrape_channel_no_media(controller, channel_kwargs):
    """Scrape the Telegram test channel via snscrape with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['telegram']``, registers a
    ``TelegramSnscrapeScraper`` on the controller, and scrapes that single
    channel without archiving media during the scrape.
    """
    telegram_channel = Channel(**channel_kwargs['telegram'])
    controller.register_scraper(scraper=TelegramSnscrapeScraper())
    controller.scrape_channels(
        channels=[telegram_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_telegram_snscrape_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_telegram_snscrape_channel(controller, channel_kwargs):

View File

@@ -3,6 +3,7 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import TelegramTelethonScraper
@pytest.mark.unarchived
def test_scrape_telegram_telethon_channel_no_media(controller, channel_kwargs):
controller.remove_all_scrapers()
@@ -10,6 +11,12 @@ def test_scrape_telegram_telethon_channel_no_media(controller, channel_kwargs):
controller.register_scraper(scraper = TelegramTelethonScraper())
controller.scrape_channels(channels = channels, archive_media = False)
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_telegram_telethon_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_telegram_telethon_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import TwitterScraper
@pytest.mark.unarchived
def test_scrape_twitter_channel_no_media(controller, channel_kwargs):
    """Scrape the Twitter test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['twitter']``, registers a
    ``TwitterScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    twitter_channel = Channel(**channel_kwargs['twitter'])
    controller.register_scraper(scraper=TwitterScraper())
    controller.scrape_channels(
        channels=[twitter_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_twitter_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_twitter_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import VkontakteScraper
@pytest.mark.unarchived
def test_scrape_vkontakte_channel_no_media(controller, channel_kwargs):
    """Scrape the Vkontakte test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['vkontakte']``, registers a
    ``VkontakteScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    vkontakte_channel = Channel(**channel_kwargs['vkontakte'])
    controller.register_scraper(scraper=VkontakteScraper())
    controller.scrape_channels(
        channels=[vkontakte_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_vkontakte_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_vkontakte_channel(controller, channel_kwargs):

View File

@@ -3,12 +3,19 @@ import pytest
from cisticola.base import Channel
from cisticola.scraper import YoutubeScraper
@pytest.mark.unarchived
def test_scrape_youtube_channel_no_media(controller, channel_kwargs):
    """Scrape the YouTube test channel with ``archive_media=False``.

    Builds a ``Channel`` from ``channel_kwargs['youtube']``, registers a
    ``YoutubeScraper`` on the controller, and scrapes that single channel
    without archiving media during the scrape.
    """
    youtube_channel = Channel(**channel_kwargs['youtube'])
    controller.register_scraper(scraper=YoutubeScraper())
    controller.scrape_channels(
        channels=[youtube_channel],
        archive_media=False,
    )
@pytest.mark.media
@pytest.mark.unarchived
def test_scrape_youtube_channel_unarchived_media(controller):
    """Run the controller's deferred media-archiving pass.

    NOTE(review): presumably relies on posts stored by an earlier
    ``archive_media=False`` scrape on the same controller -- confirm
    against the fixture's scope.
    """
    controller.archive_unarchived_media()
@pytest.mark.media
def test_scrape_youtube_channel(controller, channel_kwargs):