Skip to content

Commit 266f2f6

Browse files
committed
filter URLs including /podcast/
1 parent dec0f8b commit 266f2f6

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

src/fundus/publishers/be/__init__.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,7 @@
11
from fundus.publishers.base_objects import Publisher, PublisherGroup
22
from fundus.publishers.be.nieuwsblad import NieuwsbladParser
33
from fundus.publishers.be.politico_eu import PoliticoEuParser
4+
from fundus.scraping.filter import regex_filter
45
from fundus.scraping.url import NewsMap, RSSFeed, Sitemap
56

67

@@ -28,4 +29,5 @@ class BE(metaclass=PublisherGroup):
2829
Sitemap("https://www.politico.eu/sitemap.xml", languages={"en"}),
2930
NewsMap("https://www.politico.eu/news-sitemap.xml", languages={"en"}),
3031
],
32+
url_filter=regex_filter("/podcast/"),
3133
)

0 commit comments

Comments
 (0)