From 8c58681f1e1c6db42812197afeb93cdf3d2749e3 Mon Sep 17 00:00:00 2001 From: vas3k Date: Fri, 24 Jan 2020 16:05:00 +0100 Subject: [PATCH] Skip items without links --- scripts/update.py | 11 ++++++----- 1 file changed, 6 insertions(+), 5 deletions(-) diff --git a/scripts/update.py b/scripts/update.py index 9fbe505..86f6217 100644 --- a/scripts/update.py +++ b/scripts/update.py @@ -111,10 +111,11 @@ def refresh_feed(item): feed = feedparser.parse(item['rss']) for entry in feed.entries[:DEFAULT_ENTRIES_LIMIT]: entry_title = parse_title(entry) - if not entry_title: + entry_link = entry.get("link") + if not entry_title or not entry_link: continue - print(f"- article: '{entry_title}' {entry.link}") + print(f"- article: '{entry_title}' {entry_link}") conditions = item.get("conditions") if conditions: @@ -126,10 +127,10 @@ def refresh_feed(item): article, is_created = Article.objects.get_or_create( board_id=item["board_id"], feed_id=item["id"], - uniq_id=entry.get("id") or entry.get("guid") or entry.link, + uniq_id=entry.get("id") or entry.get("guid") or entry_link, defaults=dict( - url=entry.link[:2000], - domain=parse_domain(entry.link)[:256], + url=entry_link[:2000], + domain=parse_domain(entry_link)[:256], created_at=parse_datetime(entry), updated_at=datetime.utcnow(), title=entry_title[:256],