Don’t parse old articles

This commit is contained in:
vas3k
2020-09-26 12:04:33 +02:00
parent 48ede21d96
commit f33ba7da46

View File

@@ -143,9 +143,14 @@ def fetch_rss(item, rss):
if conditions:
is_valid = check_conditions(conditions, entry)
if not is_valid:
print(f"Condition {conditions} does not match. Skipped")
print(f"- condition {conditions} does not match. Skipped")
continue
created_at = parse_datetime(entry)
if created_at <= datetime.utcnow() - DELETE_OLD_ARTICLES_DELTA:
print(f"- article is too old. Skipped")
continue
article, is_created = Article.objects.get_or_create(
board_id=item["board_id"],
feed_id=item["id"],
@@ -153,7 +158,7 @@ def fetch_rss(item, rss):
defaults=dict(
url=entry_link[:2000],
domain=parse_domain(entry_link)[:256],
created_at=parse_datetime(entry),
created_at=created_at,
updated_at=datetime.utcnow(),
title=entry_title[:256],
image=str(parse_rss_image(entry) or "")[:512],