Skip to content
Open
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 3 additions & 1 deletion api/_rss-allowed-domains.js
Original file line number Diff line number Diff line change
Expand Up @@ -323,5 +323,7 @@ export default [
"rss.libsyn.com",
"feeds.megaphone.fm",
"rss.art19.com",
"idp.nature.com"
"idp.nature.com",
"www.pap.pl",
"wiadomosci.onet.pl",
];
4 changes: 3 additions & 1 deletion scripts/shared/rss-allowed-domains.json
Original file line number Diff line number Diff line change
Expand Up @@ -320,5 +320,7 @@
"rss.libsyn.com",
"feeds.megaphone.fm",
"rss.art19.com",
"idp.nature.com"
"idp.nature.com",
"www.pap.pl",
"wiadomosci.onet.pl"
]
14 changes: 10 additions & 4 deletions scripts/shared/source-tiers.json
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@
"The National": 2,
"Yonhap News": 2,
"Chosun Ilbo": 2,
"El País": 2,
"El Pa\u00eds": 2,
"El Mundo": 2,
"BBC Mundo": 2,
"Brasil Paralelo": 2,
Expand All @@ -71,7 +71,7 @@
"HVG": 2,
"444.hu": 2,
"24.hu": 2,
"Híradó": 2,
"H\u00edrad\u00f3": 2,
"Portfolio.hu": 2,
"ATV": 2,
"BBC Russian": 2,
Expand Down Expand Up @@ -217,7 +217,7 @@
"Entrackr (India)": 3,
"India Tech News": 3,
"Taiwan Tech News": 3,
"La Silla Vacía": 3,
"La Silla Vac\u00eda": 3,
"LATAM Tech News": 3,
"Startups.co (LATAM)": 3,
"Contxto (LATAM)": 3,
Expand Down Expand Up @@ -262,5 +262,11 @@
"ArXiv AI": 4,
"AI News": 4,
"Layoffs News": 4,
"GloNewswire (Taiwan)": 4
"GloNewswire (Taiwan)": 4,
"PAP": 1,
"Gazeta Wyborcza": 1,
"Polityka": 2,
"Onet": 2,
"OKO.press": 2,
"TVP Info": 2
}
11 changes: 11 additions & 0 deletions server/worldmonitor/news/v1/_feeds.ts
Original file line number Diff line number Diff line change
Expand Up @@ -55,6 +55,17 @@ export const VARIANT_FEEDS: Record<string, Record<string, ServerFeed[]>> = {
{ name: 'Híradó', url: gnLocale('site:hirado.hu when:2d', 'hu', 'HU', 'HU:hu'), lang: 'hu' },
{ name: 'Portfolio.hu', url: 'https://portfolio.hu/rss/all.xml', lang: 'hu' },
{ name: 'ATV', url: 'https://www.atv.hu/rss', lang: 'hu' },
// Polish (PL) existing feeds — server parity
{ name: 'TVN24', url: 'https://tvn24.pl/swiat.xml', lang: 'pl' },
{ name: 'Polsat News', url: 'https://www.polsatnews.pl/rss/wszystkie.xml', lang: 'pl' },
{ name: 'Rzeczpospolita', url: 'https://www.rp.pl/rss_main', lang: 'pl' },
// Polish (PL) additions
{ name: 'PAP', url: 'https://www.pap.pl/rss.xml', lang: 'pl' },
{ name: 'Gazeta Wyborcza', url: gnLocale('site:wyborcza.pl when:2d', 'pl', 'PL', 'PL:pl'), lang: 'pl' },
{ name: 'Polityka', url: gnLocale('site:polityka.pl when:2d', 'pl', 'PL', 'PL:pl'), lang: 'pl' },
{ name: 'Onet', url: 'https://wiadomosci.onet.pl/rss/index.xml', lang: 'pl' },
{ name: 'OKO.press', url: gnLocale('site:oko.press when:2d', 'pl', 'PL', 'PL:pl'), lang: 'pl' },
{ name: 'TVP Info', url: gnLocale('site:tvp.info when:2d', 'pl', 'PL', 'PL:pl'), lang: 'pl' },
],
middleeast: [
{ name: 'BBC Middle East', url: 'https://feeds.bbci.co.uk/news/world/middle_east/rss.xml' },
Expand Down
4 changes: 3 additions & 1 deletion shared/rss-allowed-domains.json
Original file line number Diff line number Diff line change
Expand Up @@ -320,5 +320,7 @@
"rss.libsyn.com",
"feeds.megaphone.fm",
"rss.art19.com",
"idp.nature.com"
"idp.nature.com",
"www.pap.pl",
"wiadomosci.onet.pl"
]
14 changes: 10 additions & 4 deletions shared/source-tiers.json
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@
"The National": 2,
"Yonhap News": 2,
"Chosun Ilbo": 2,
"El País": 2,
"El Pa\u00eds": 2,
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

P2 Unintentional Unicode escape conversion on existing entries

Three pre-existing entries with accented characters — El País, Híradó, and La Silla Vacía — were rewritten from their native UTF-8 form to JSON Unicode escapes (\u00ed for í, \u00f3 for ó). The same change appears in scripts/shared/source-tiers.json. Both representations parse identically, but the diff noise suggests this was a side effect of the editor or tool used to append the new entries. If any code does string-literal comparison against the raw JSON bytes rather than the parsed value, this would silently break those checks.

"El Mundo": 2,
"BBC Mundo": 2,
"Brasil Paralelo": 2,
Expand All @@ -71,7 +71,7 @@
"HVG": 2,
"444.hu": 2,
"24.hu": 2,
"Híradó": 2,
"H\u00edrad\u00f3": 2,
"Portfolio.hu": 2,
"ATV": 2,
"BBC Russian": 2,
Expand Down Expand Up @@ -217,7 +217,7 @@
"Entrackr (India)": 3,
"India Tech News": 3,
"Taiwan Tech News": 3,
"La Silla Vacía": 3,
"La Silla Vac\u00eda": 3,
"LATAM Tech News": 3,
"Startups.co (LATAM)": 3,
"Contxto (LATAM)": 3,
Expand Down Expand Up @@ -262,5 +262,11 @@
"ArXiv AI": 4,
"AI News": 4,
"Layoffs News": 4,
"GloNewswire (Taiwan)": 4
"GloNewswire (Taiwan)": 4,
"PAP": 1,
"Gazeta Wyborcza": 1,
"Polityka": 2,
"Onet": 2,
"OKO.press": 2,
"TVP Info": 2
}
9 changes: 9 additions & 0 deletions src/config/feeds.ts
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,8 @@ export const SOURCE_TYPES: Record<string, SourceType> = {
'Telex': 'mainstream', 'Index.hu': 'mainstream', 'HVG': 'mainstream',
'444.hu': 'mainstream', '24.hu': 'mainstream', 'Híradó': 'mainstream',
'ATV': 'mainstream', 'Portfolio.hu': 'market',
// Polish (PL) additions
'PAP': 'wire', 'Gazeta Wyborcza': 'mainstream', 'Polityka': 'mainstream', 'Onet': 'mainstream', 'OKO.press': 'intel', 'TVP Info': 'mainstream',
Comment on lines +55 to +56
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

P2 Pre-existing TVN24, Polsat News, Rzeczpospolita still absent from SOURCE_TYPES

The server-parity fix adds these three feeds to _feeds.ts, but they remain missing from SOURCE_TYPES in this file. getSourceType() falls back to 'other' for any key not found in the map (line 103), so the analysis worker classifies all three as 'other' rather than 'mainstream'. Since this PR explicitly touches the Polish source set and SOURCE_TYPES, it's a natural place to close this gap alongside the six new entries.

'SVT Nyheter': 'mainstream', 'Dagens Nyheter': 'mainstream', 'Svenska Dagbladet': 'mainstream',
// Brazilian Addition
'Brasil Paralelo': 'mainstream',
Expand Down Expand Up @@ -278,6 +280,13 @@ const FULL_FEEDS: Record<string, Feed[]> = {
{ name: 'in.gr', url: rss('https://www.in.gr/feed/'), lang: 'el' },
{ name: 'iefimerida', url: rss('https://www.iefimerida.gr/rss.xml'), lang: 'el' },
{ name: 'Proto Thema', url: rss('https://news.google.com/rss/search?q=site:protothema.gr+when:2d&hl=el&gl=GR&ceid=GR:el'), lang: 'el' },
// Polish (PL) additions
{ name: 'PAP', url: rss('https://www.pap.pl/rss.xml'), lang: 'pl' },
{ name: 'Gazeta Wyborcza', url: rss('https://news.google.com/rss/search?q=site:wyborcza.pl+when:2d&hl=pl&gl=PL&ceid=PL:pl'), lang: 'pl' },
{ name: 'Polityka', url: rss('https://news.google.com/rss/search?q=site:polityka.pl+when:2d&hl=pl&gl=PL&ceid=PL:pl'), lang: 'pl' },
{ name: 'Onet', url: rss('https://wiadomosci.onet.pl/rss/index.xml'), lang: 'pl' },
{ name: 'OKO.press', url: rss('https://news.google.com/rss/search?q=site:oko.press+when:2d&hl=pl&gl=PL&ceid=PL:pl'), lang: 'pl' },
{ name: 'TVP Info', url: rss('https://news.google.com/rss/search?q=site:tvp.info+when:2d&hl=pl&gl=PL&ceid=PL:pl'), lang: 'pl' },
// Russia & Ukraine (independent sources)
{ name: 'BBC Russian', url: rss('https://feeds.bbci.co.uk/russian/rss.xml'), lang: 'ru' },
{ name: 'Meduza', url: rss('https://meduza.io/rss/all'), lang: 'ru' },
Expand Down
2 changes: 2 additions & 0 deletions vite.config.ts
Original file line number Diff line number Diff line change
Expand Up @@ -577,6 +577,8 @@ const RSS_PROXY_ALLOWED_DOMAINS = new Set([
'abcnews.go.com', 'abcnews.com', 'www.corriere.it', 'www.rt.com', 'www.alarabiya.net', 'tuoitrenews.vn',
'www.yonhapnewstv.co.kr', 'www.chosun.com', 'rss.libsyn.com', 'feeds.megaphone.fm', 'rss.art19.com',
'idp.nature.com',
'www.pap.pl',
'wiadomosci.onet.pl',
]);

function rssProxyPlugin(): Plugin {
Expand Down
Loading