From 67ac960221779557f31844f266411b9a14a82eff Mon Sep 17 00:00:00 2001 From: Martin Rotter Date: Tue, 18 Oct 2022 06:40:45 +0200 Subject: [PATCH] fix full site scraper! --- resources/scripts/scrapers/scrape-full-articles.py | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/resources/scripts/scrapers/scrape-full-articles.py b/resources/scripts/scrapers/scrape-full-articles.py index 466530c1e..102ca6993 100644 --- a/resources/scripts/scrapers/scrape-full-articles.py +++ b/resources/scripts/scrapers/scrape-full-articles.py @@ -44,9 +44,14 @@ def process_article(article, is_rss, is_atom): if is_rss: article.find("description").text = scraped_article elif is_atom: - article.find("atom:content", atom_ns).text = scraped_article - except: - pass + at_con = article.find("atom:content", atom_ns) + + if at_con is None: + article.find("atom:summary", atom_ns).text = scraped_article + else: + at_con.text = scraped_article + except Exception as e: + print(e) def main():