From e3a128de6b0ebba15427a11107773a1ee3244094 Mon Sep 17 00:00:00 2001 From: MuslemRahimi Date: Mon, 28 Oct 2024 15:18:45 +0100 Subject: [PATCH] update news cron job --- app/cron_company_news.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/app/cron_company_news.py b/app/cron_company_news.py index ccec947..49bb66a 100644 --- a/app/cron_company_news.py +++ b/app/cron_company_news.py @@ -30,7 +30,7 @@ async def filter_and_deduplicate(data, excluded_domains=None, deduplicate_key='t Filter out items with specified domains in their URL and remove duplicates based on a specified key. """ if excluded_domains is None: - excluded_domains = ['prnewswire.com', 'globenewswire.com', 'accesswire.com'] + excluded_domains = ['prnewswire.com', 'globenewswire.com', 'accesswire.com', 'youtube.com'] seen_keys = set() filtered_data = [] for item in data: