From 1a7a5d1e4e4174167924e3eabd9bb24fb73a10b5 Mon Sep 17 00:00:00 2001 From: The Policybot Lab <74462173+policybot2020@users.noreply.github.com> Date: Fri, 15 Nov 2024 16:46:05 -0500 Subject: [PATCH 1/2] Update config.yaml --- config.yaml | 117 +++++++++++++++++++++++++++++++++++++++++++++++++--- 1 file changed, 112 insertions(+), 5 deletions(-) diff --git a/config.yaml b/config.yaml index 6dbf6e0..9b9cdf5 100644 --- a/config.yaml +++ b/config.yaml @@ -1,18 +1,123 @@ # RSS sources sources: - Source_1: + Source_0: url: "http://rss.cnn.com/rss/edition_world.rss" name: "CNN" # not used description: "Edition World" # not used category: "Example 1" # not used id: 1 + + Source_1: + url: "https://rss.nytimes.com/services/xml/rss/nyt/World.xml" + name: "New York Times" + description: "World News" + category: "International" + id: 1 + Source_2: - url: "http://feeds.bbci.co.uk/news/world/rss.xml" - name: "BBC" - description: "News World" - category: "Example 2" + url: "https://moxie.foxnews.com/google-publisher/world.xml" + name: "Fox News" + description: "World News" + category: "International" id: 2 + Source_3: + url: "http://feeds.bbci.co.uk/news/world/rss.xml" + name: "BBC News" + description: "World News" + category: "International" + id: 3 + + Source_4: + url: "https://www.theguardian.com/world/rss" + name: "The Guardian" + description: "World News" + category: "International" + id: 4 + + Source_5: + url: "https://www.aljazeera.com/xml/rss/all.xml" + name: "Al Jazeera" + description: "All News" + category: "International" + id: 5 + + Source_6: + url: "https://timesofindia.indiatimes.com/rssfeeds/296589292.cms" + name: "Times of India" + description: "World News" + category: "International" + id: 6 + + Source_7: + url: "https://www.rt.com/rss/" + name: "RT" + description: "All News" + category: "International" + id: 7 + + Source_8: + url: "https://rss.dw.com/xml/rss-en-all" + name: "DW News" + description: "All News" + category: "International" + id: 8 + + Source_9: + url: "https://en.mehrnews.com/rss/tp/561" + name: "Mehr News" + description: "Top Stories" + category: "International" + id: 9 + + Source_10: + url: "http://www.chinadaily.com.cn/rss/world_rss.xml" + name: "China Daily" + description: "World News" + category: "International" + id: 10 + + Source_11: + url: "https://www.scmp.com/rss/91/feed" + name: "South China Morning Post" + description: "World News" + category: "International" + id: 11 + + Source_12: + url: "https://www.telesurenglish.net/pages/rss.html" + name: "Telesur" + description: "World News" + category: "International" + id: 12 + + Source_13: + url: "https://www.france24.com/en/rss" + name: "France 24" + description: "Top Stories" + category: "International" + id: 13 + + Source_14: + url: "https://www.news24.com/World/Rss" + name: "News24" + description: "World News" + category: "International" + id: 14 + + Source_15: + url: "https://www.sowetanlive.co.za/rss/?section=news" + name: "Sowetan" + description: "News" + category: "International" + id: 15 + + Source_16: + url: "https://punchng.com/feed/" + name: "The Punch" + description: "All News" + category: "International" + id: 16 # Mapping for all columns of the target table on the database # Add columns as needed @@ -21,6 +126,7 @@ dbMapping: source_id: "source_id" # generated here source: "source" title: "title" + author:"author" link: "link" text: "text" timestamp_feed_updated: "ts_last_feed_updated" @@ -32,6 +138,7 @@ rssMapping: source_id: "source_id" # generated here source: "feed_title" title: "item_title" + author:"author" link: "item_link" text: "item_text" timestamp_feed_updated: "feed_last_build_date" From 0b51f6491323168696182527f1a3b3e728833d79 Mon Sep 17 00:00:00 2001 From: SarahWagner Date: Fri, 22 Nov 2024 19:04:19 +0100 Subject: [PATCH 2/2] fix config --- config.yaml | 70 ++++++++++++++++++++++++++--------------------------- 1 file changed, 35 insertions(+), 35 deletions(-) diff --git a/config.yaml b/config.yaml index 9b9cdf5..fdc2495 100644 --- a/config.yaml +++ b/config.yaml @@ -1,123 +1,123 @@ # RSS sources sources: - Source_0: + Source_1: url: "http://rss.cnn.com/rss/edition_world.rss" name: "CNN" # not used description: "Edition World" # not used category: "Example 1" # not used id: 1 - Source_1: + Source_2: url: "https://rss.nytimes.com/services/xml/rss/nyt/World.xml" name: "New York Times" description: "World News" category: "International" - id: 1 + id: 2 - Source_2: + Source_3: url: "https://moxie.foxnews.com/google-publisher/world.xml" name: "Fox News" description: "World News" category: "International" - id: 2 + id: 3 - Source_3: + Source_4: url: "http://feeds.bbci.co.uk/news/world/rss.xml" name: "BBC News" description: "World News" category: "International" - id: 3 + id: 4 - Source_4: + Source_5: url: "https://www.theguardian.com/world/rss" name: "The Guardian" description: "World News" category: "International" - id: 4 + id: 5 - Source_5: + Source_6: url: "https://www.aljazeera.com/xml/rss/all.xml" name: "Al Jazeera" description: "All News" category: "International" - id: 5 + id: 6 - Source_6: + Source_7: url: "https://timesofindia.indiatimes.com/rssfeeds/296589292.cms" name: "Times of India" description: "World News" category: "International" - id: 6 + id: 7 - Source_7: + Source_8: url: "https://www.rt.com/rss/" name: "RT" description: "All News" category: "International" - id: 7 + id: 8 - Source_8: + Source_9: url: "https://rss.dw.com/xml/rss-en-all" name: "DW News" description: "All News" category: "International" - id: 8 + id: 9 - Source_9: + Source_10: url: "https://en.mehrnews.com/rss/tp/561" name: "Mehr News" description: "Top Stories" category: "International" - id: 9 + id: 10 - Source_10: + Source_11: url: "http://www.chinadaily.com.cn/rss/world_rss.xml" name: "China Daily" description: "World News" category: "International" - id: 10 + id: 11 - Source_11: + Source_12: url: "https://www.scmp.com/rss/91/feed" name: "South China Morning Post" description: "World News" category: "International" - id: 11 + id: 12 - Source_12: + Source_13: url: "https://www.telesurenglish.net/pages/rss.html" name: "Telesur" description: "World News" category: "International" - id: 12 + id: 13 - Source_13: + Source_14: url: "https://www.france24.com/en/rss" name: "France 24" description: "Top Stories" category: "International" - id: 13 + id: 14 - Source_14: + Source_15: url: "https://www.news24.com/World/Rss" name: "News24" description: "World News" category: "International" - id: 14 + id: 15 - Source_15: + Source_16: url: "https://www.sowetanlive.co.za/rss/?section=news" name: "Sowetan" description: "News" category: "International" - id: 15 + id: 16 - Source_16: + Source_17: url: "https://punchng.com/feed/" name: "The Punch" description: "All News" category: "International" - id: 16 + id: 17 # Mapping for all columns of the target table on the database # Add columns as needed @@ -126,7 +126,7 @@ dbMapping: source_id: "source_id" # generated here source: "source" title: "title" - author:"author" + author: "author" link: "link" text: "text" timestamp_feed_updated: "ts_last_feed_updated" @@ -138,7 +138,7 @@ rssMapping: source_id: "source_id" # generated here source: "feed_title" title: "item_title" - author:"author" + author: "author" link: "item_link" text: "item_text" timestamp_feed_updated: "feed_last_build_date"