Add ‘remove_hashtags’ filter

This commit is contained in:
vas3k
2022-03-29 19:11:38 +02:00
parent 32b2b2bf03
commit 1c53cccdcb
2 changed files with 18 additions and 4 deletions

View File

@@ -646,18 +646,19 @@ boards:
url: https://t.me/howtoberlin
rss: https://infomate.club/parsing/telegram/howtoberlin?only=text
icon: https://i.vas3k.ru/cfd6db4e48b2abc24a24883e6933720b4482376a3a69fd2961489933c74a314b.jpg
is_parsable: false
- name: "Berlin.de Events"
url: https://www.berlin.de/en/events/
rss: https://www.berlin.de/en/events/rubric.rss
icon: https://i.vas3k.ru/fjc.png
- name: "Comedy in English"
url: https://comedyinenglish.de/full-calendar/
rss: http://fetchrss.com/rss/5e1485a98a93f87e1f8b45685e15a6ea8a93f86d5d8b4567.xml
icon: https://i.vas3k.ru/flr.jpg
- name: "Eventbrite"
url: https://www.eventbrite.com/d/germany--berlin/all-events/
rss: http://fetchrss.com/rss/6242ddaac45b4250ef751de26242ddebad9ae2191c2b8af2.xml
icon: https://i.vas3k.ru/91ed89e5c03aed45b7fdddbcaee1a859821f5c62ff9bb8e58af68c91ede6c496.png
- name: "Comedy in English"
url: https://comedyinenglish.de/full-calendar/
rss: http://fetchrss.com/rss/5e1485a98a93f87e1f8b45685e15a6ea8a93f86d5d8b4567.xml
icon: https://i.vas3k.ru/flr.jpg
- name: "Детский Берлин"
url: https://kinderberlin.com/
rss: https://kinderberlin.com/feed/
@@ -674,6 +675,8 @@ boards:
- name: "Канал Воздух над Берлином"
url: https://t.me/alleinvater
rss: https://infomate.club/parsing/telegram/alleinvater?only=text
filters:
- remove_hashtags
is_parsable: false
- name: "Канал Travelclever"
url: https://t.me/travelclever

View File

@@ -1,3 +1,6 @@
import re
def echomsk_title_fix(entry):
title = entry.get("title")
if len(title) > 20 and title[17] == ":":
@@ -16,8 +19,16 @@ def databrew_podcast_clean_title(entry):
entry["title"] = title.replace('Data Brew ', '').replace(' Episode ', 'E')
return entry
def remove_hashtags(entry):
    """Strip hashtags from the entry's title.

    A hashtag is a ``#`` immediately followed by one or more word
    characters (letters, digits or underscore in any script).

    Args:
        entry: Feed entry mapping; only its ``"title"`` key is read and
            rewritten.

    Returns:
        The same ``entry`` object. ``"title"`` is rewritten in place when it
        holds a non-empty string; otherwise the entry is returned untouched.
    """
    title = entry.get("title")
    if not title:
        # A missing/None title would make re.sub() raise TypeError, and an
        # empty one has nothing to strip.
        return entry

    # For str patterns \w is Unicode-aware, so non-Latin hashtags
    # (e.g. Cyrillic ones) are removed as well as ASCII ones.
    entry["title"] = re.sub(r"#\w+", "", title)
    return entry
# Registry of entry filters, keyed by filter name. Each value is a function
# that takes a feed entry and returns it (possibly with a rewritten title).
# NOTE(review): the keys appear to be the names listed under a feed's
# `filters:` option in the boards config — confirm against the caller.
FILTERS = {
"echomsk_title_fix": echomsk_title_fix,
"moscow_python_podcast_clean_title": moscow_python_podcast_clean_title,
"databrew_podcast_clean_title": databrew_podcast_clean_title,
"remove_hashtags": remove_hashtags,
}