From 628074d6fc9ceb406a08b92f22c99015cbde8a5f Mon Sep 17 00:00:00 2001
From: JustAnotherArchivist
Date: Mon, 1 Jul 2019 01:35:00 +0000
Subject: [PATCH] Print contents when ignoring a link-less entry

---
 snscrape/modules/facebook.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/snscrape/modules/facebook.py b/snscrape/modules/facebook.py
index 938dd57..5ac2961 100644
--- a/snscrape/modules/facebook.py
+++ b/snscrape/modules/facebook.py
@@ -84,7 +84,7 @@ class FacebookCommonScraper(snscrape.base.Scraper):
 			entryA = entry.find('a', class_ = '_5pcq') # There can be more than one, e.g. when a post is shared by another user, but the first one is always the one of this entry.
 			mediaSetA = entry.find('a', class_ = '_17z-')
 			if not mediaSetA and not entryA:
-				logger.warning(f'Ignoring link-less entry after {cleanUrl}')
+				logger.warning(f'Ignoring link-less entry after {cleanUrl}: {entry.text!r}')
 				continue
 			if mediaSetA and (not entryA or entryA['href'] == '#'):
 				href = mediaSetA['href']