From 513310abba5e78a7394f026d9d5583d37d811ab0 Mon Sep 17 00:00:00 2001
From: Celes Renata
Date: Thu, 16 Apr 2026 18:09:50 +0000
Subject: [PATCH] =?UTF-8?q?fix:=20stop=20tagging=20all=20macro=5Fnews=20ar?=
 =?UTF-8?q?ticles=20as=20macro=5Fevent=20=E2=80=94=20default=20to=20articl?=
 =?UTF-8?q?e,=20let=20extractor=20reclassify.=20Also=20reduced=20fetch=20l?=
 =?UTF-8?q?imit=20to=2020=20and=20cadence=20to=2030min?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 services/shared/metadata.py | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/services/shared/metadata.py b/services/shared/metadata.py
index ac15db3..46c3c01 100644
--- a/services/shared/metadata.py
+++ b/services/shared/metadata.py
@@ -209,12 +209,17 @@ async def persist_broker_event(
 
 
 def _resolve_document_type(source_type: str) -> str:
-    """Map source_type to a document_type value."""
+    """Map source_type to a document_type value.
+
+    Note: macro_news articles default to 'article' — the extractor
+    reclassifies them as 'macro_event' only if the content is truly
+    about macro/global events (not company-specific news).
+    """
     mapping = {
         "news_api": "article",
         "filings_api": "filing",
         "web_scrape": "press_release",
-        "macro_news": "macro_event",
+        "macro_news": "article",
     }
     return mapping.get(source_type, "article")
 