Use user id for TwitterScraper

2026-06-13 05:48:33 +03:00 · 2022-02-24 20:24:03 +01:00
parent d159c09aa4
commit 456d592792
1 changed files with 2 additions and 12 deletions
--- a/cisticola/scraper/twitter.py
+++ b/cisticola/scraper/twitter.py
@@ -10,18 +10,8 @@ class TwitterScraper(cisticola.scraper.base.Scraper):
    """An implementation of a Scraper for Twitter, using snscrape library"""
    __version__ = "TwitterScraper 0.0.1"
    # TODO snscrape should be able to scrape from user ID alone, but there is
    # currently a bug/other issue, so it is extracting the username from URL
    def get_username_from_url(url):
        """Extract the Twitter username from a profile URL.

        Called through the class (``TwitterScraper.get_username_from_url(url)``),
        so it takes no ``self`` argument.

        Args:
            url: URL string expected to look like ``.../twitter.com/<username>``.

        Returns:
            The text that follows the first ``twitter.com/`` when it contains
            no further ``/``. ``None`` when the URL does not contain
            ``twitter.com/`` at all, or when that text contains a ``/``
            (for example a trailing slash or a deeper path).
        """
        pieces = url.split("twitter.com/")
        # A URL without the marker splits into a single piece; report it as
        # "no username" instead of letting pieces[1] raise IndexError.
        if len(pieces) < 2:
            return None

        username = pieces[1]
        # Anything with a path separator is not a bare profile URL.
        if "/" in username:
            return None
        return username
    def get_posts(self, channel: cisticola.base.Channel, since: cisticola.base.ScraperResult = None) -> List[cisticola.base.ScraperResult]:
-        scraper = snscrape.modules.twitter.TwitterProfileScraper(
+        scraper = snscrape.modules.twitter.TwitterProfileScraper(channel.platform_id)
            TwitterScraper.get_username_from_url(channel.url))
        first = True
@@ -66,5 +56,5 @@ class TwitterScraper(cisticola.scraper.base.Scraper):
                archived_urls=archived_urls)
    def can_handle(self, channel):
-        if channel.platform == "Twitter" and TwitterScraper.get_username_from_url(channel.url) is not None:
+        if channel.platform == "Twitter" and channel.platform_id:
            return True