From b6ed4726ce2d7fd1fbd441702968b17931d5b7a1 Mon Sep 17 00:00:00 2001 From: Schimon Jehudah Date: Wed, 15 Nov 2023 13:28:21 +0000 Subject: [PATCH] Update datasets --- datasets/catalogues/audiobooks.csv | 2 ++ datasets/catalogues/{book.csv => books.csv} | 0 datasets/catalogues/quotes.csv | 3 +++ datasets/catalogues/torrent.csv | 3 +++ datasets/corporations/computing.csv | 2 ++ datasets/news/blockchain.csv | 3 +++ datasets/news/christianity.csv | 1 + datasets/news/computing.csv | 5 +++++ datasets/news/crime.csv | 2 ++ datasets/news/culture.csv | 4 ++++ datasets/news/electronics.csv | 2 ++ datasets/news/family.csv | 3 +++ datasets/news/finance.csv | 4 ++++ datasets/news/fluoride.csv | 2 ++ datasets/news/food.csv | 2 ++ datasets/news/gaming.csv | 1 + datasets/news/general.csv | 4 ++++ datasets/news/government.csv | 5 +++++ datasets/news/health.csv | 4 ++++ datasets/news/internet.csv | 2 ++ datasets/news/israel.csv | 5 ++++- datasets/news/judaism.csv | 3 ++- datasets/news/lifestyle.csv | 1 + datasets/news/linux.csv | 1 + datasets/news/middle_east.csv | 2 ++ datasets/news/nature.csv | 2 ++ datasets/news/occult.csv | 2 ++ datasets/news/opinions.csv | 2 ++ datasets/news/pharma.csv | 2 ++ datasets/news/privacy.csv | 1 + datasets/news/propaganda.csv | 3 ++- datasets/news/security.csv | 1 + datasets/news/sports.csv | 1 + datasets/news/survival.csv | 2 ++ datasets/news/technology.csv | 4 ++++ datasets/news/travel.csv | 2 ++ datasets/news/united_states.csv | 6 ++++++ datasets/news/vehicle.csv | 2 ++ datasets/news/war.csv | 2 ++ datasets/organizations/netherlands.csv | 2 ++ datasets/tutorials/data.csv | 2 ++ datasets/tutorials/python.csv | 10 ++++++++++ datasets/wiki/computing.csv | 2 ++ 43 files changed, 111 insertions(+), 3 deletions(-) create mode 100644 datasets/catalogues/audiobooks.csv rename datasets/catalogues/{book.csv => books.csv} (100%) create mode 100644 datasets/catalogues/quotes.csv create mode 100644 datasets/catalogues/torrent.csv create mode 100644 datasets/corporations/computing.csv create mode 100644 datasets/news/blockchain.csv create mode 100644 datasets/news/crime.csv create mode 100644 datasets/news/electronics.csv create mode 100644 datasets/news/family.csv create mode 100644 datasets/news/finance.csv create mode 100644 datasets/news/fluoride.csv create mode 100644 datasets/news/food.csv create mode 100644 datasets/news/health.csv create mode 100644 datasets/news/internet.csv create mode 100644 datasets/news/nature.csv create mode 100644 datasets/news/occult.csv create mode 100644 datasets/news/pharma.csv create mode 100644 datasets/news/travel.csv create mode 100644 datasets/news/united_states.csv create mode 100644 datasets/news/vehicle.csv create mode 100644 datasets/organizations/netherlands.csv create mode 100644 datasets/tutorials/data.csv create mode 100644 datasets/tutorials/python.csv create mode 100644 datasets/wiki/computing.csv diff --git a/datasets/catalogues/audiobooks.csv b/datasets/catalogues/audiobooks.csv new file mode 100644 index 0000000..ba6a44b --- /dev/null +++ b/datasets/catalogues/audiobooks.csv @@ -0,0 +1,2 @@ +name, url, language, country +AudioBook Bay (ABB), https://audiobookbay.is/feed/atom/, en-US, USA diff --git a/datasets/catalogues/book.csv b/datasets/catalogues/books.csv similarity index 100% rename from datasets/catalogues/book.csv rename to datasets/catalogues/books.csv diff --git a/datasets/catalogues/quotes.csv b/datasets/catalogues/quotes.csv new file mode 100644 index 0000000..81af401 --- /dev/null +++ b/datasets/catalogues/quotes.csv @@ -0,0 +1,3 @@ +name, url, language, country +Linux-Unix Daily Fortunes - Quotes & Quips - motd.ambians.com, https://motd.ambians.com/out/rss/daily-fortunes.xml, en-US, USA +Shakespeare Quotes & Plays, https://shakespearequotesandplays.com/feed/, en-US, USA diff --git a/datasets/catalogues/torrent.csv b/datasets/catalogues/torrent.csv new file mode 100644 index 0000000..3bff9dd --- /dev/null +++ b/datasets/catalogues/torrent.csv @@ -0,0 +1,3 @@ +name, url, language, country +Nyaa, https://nyaa.si/?page=rss, en-US, Worldwide +Torlock, https://www.torlock.com/rss.xml, en-US, Worldwide diff --git a/datasets/corporations/computing.csv b/datasets/corporations/computing.csv new file mode 100644 index 0000000..a49b4bf --- /dev/null +++ b/datasets/corporations/computing.csv @@ -0,0 +1,2 @@ +name, url, language, country +Panic Blog, https://www.panic.com/blog/feed/, en-US, United States diff --git a/datasets/news/blockchain.csv b/datasets/news/blockchain.csv new file mode 100644 index 0000000..5997e2d --- /dev/null +++ b/datasets/news/blockchain.csv @@ -0,0 +1,3 @@ +name, url, language, country +CryptoSlate, https://cryptoslate.com/feed/, en-US, USA +CryptoPotato, https://cryptopotato.com/feed/, en-US, USA diff --git a/datasets/news/christianity.csv b/datasets/news/christianity.csv index 35070b3..dbb6a93 100644 --- a/datasets/news/christianity.csv +++ b/datasets/news/christianity.csv @@ -2,3 +2,4 @@ name, url, language, country Evangelical Endtimemachine, https://www.evangelicalendtimemachine.com/feed/, ce-PH ja-JP nl-NL , Worldwide Orthodox Christianity, https://orthochristian.com/xml/rss.xml, en-US, USA Legio Christi, https://legiochristi.com/rss/, en-US, USA +Jerm Warfare, https://jermwarfare.com/feed, en-US, USA diff --git a/datasets/news/computing.csv b/datasets/news/computing.csv index a73a1fd..78e7588 100644 --- a/datasets/news/computing.csv +++ b/datasets/news/computing.csv @@ -4,3 +4,8 @@ Jacob McCormick, https://mccor.xyz/rss.xml, en-US, USA ju_hnny5, https://blog.jbriault.fr/rss/, fr-FR, France Lazy Reading | The Cyber Vanguard, https://cyber.dabamos.de/blog/feed.rss, en-US, USA XXIIVV, https://wiki.xxiivv.com/links/rss.xml, en-US, Canada +Proycon's website, https://proycon.anaproy.nl/rss.xml, en-US, Netherlands +Nathan R. Yergler, https://yergler.net/feed.xml, en-US, USA +ynet - דיגיטל, https://www.ynet.co.il/Integration/StoryRss544.xml, he-IL, Israel +schollz, https://schollz.com/index.xml, en-US, USA +The Logs, https://www.flu0r1ne.net/logs/rss.xml, en-US, USA diff --git a/datasets/news/crime.csv b/datasets/news/crime.csv new file mode 100644 index 0000000..e43a1cb --- /dev/null +++ b/datasets/news/crime.csv @@ -0,0 +1,2 @@ +name, url, language, country +The Smoking Gun RSS, http://thesmokinggun.com/rss, en-US, USA diff --git a/datasets/news/culture.csv b/datasets/news/culture.csv index 3585d9f..df08a7e 100644 --- a/datasets/news/culture.csv +++ b/datasets/news/culture.csv @@ -1,2 +1,6 @@ name, url, language, country The Organic Prepper, https://www.theorganicprepper.com/feed/, en-US, USA +The Public Domain Review, https://publicdomainreview.org/rss.xml, en-US, USA +ynet - תרבות, https://www.ynet.co.il/Integration/StoryRss538.xml, he-IL, Israel +ynet - Culture, https://www.ynet.co.il/Integration/StoryRss3086.xml, en-IL, Israel +ynet - חדר משלך, https://www.ynet.co.il/Integration/StoryRss4111.xml, he-IL, Israel diff --git a/datasets/news/electronics.csv b/datasets/news/electronics.csv new file mode 100644 index 0000000..d495e2c --- /dev/null +++ b/datasets/news/electronics.csv @@ -0,0 +1,2 @@ +name, url, language, country +The Logs, https://www.flu0r1ne.net/logs/rss.xml, en-US, USA diff --git a/datasets/news/family.csv b/datasets/news/family.csv new file mode 100644 index 0000000..5cc4477 --- /dev/null +++ b/datasets/news/family.csv @@ -0,0 +1,3 @@ +name, url, language, country +Mom on a Mission, https://www.mom-on-a-mission.blog/all-posts?format=rss, en-US, USA +ynet - הורים, https://www.ynet.co.il/Integration/StoryRss3052.xml, he-IL, Israel diff --git a/datasets/news/finance.csv b/datasets/news/finance.csv new file mode 100644 index 0000000..a80e068 --- /dev/null +++ b/datasets/news/finance.csv @@ -0,0 +1,4 @@ +name, url, language, country +CryptoSlate, https://cryptoslate.com/feed/, en-US, USA +CryptoPotato, https://cryptopotato.com/feed/, en-US, USA +Mail Online - Money, https://www.dailymail.co.uk/money/index.rss, en-US, UK diff --git a/datasets/news/fluoride.csv b/datasets/news/fluoride.csv new file mode 100644 index 0000000..141b11f --- /dev/null +++ b/datasets/news/fluoride.csv @@ -0,0 +1,2 @@ +name, url, language, country +Fluoride Action Network, https://fluoridealert.org/feed/, en-US, USA diff --git a/datasets/news/food.csv b/datasets/news/food.csv new file mode 100644 index 0000000..318843d --- /dev/null +++ b/datasets/news/food.csv @@ -0,0 +1,2 @@ +name, url, language, country +ynet - אוכל, https://www.ynet.co.il/Integration/StoryRss975.xml, he-IL, Israel diff --git a/datasets/news/gaming.csv b/datasets/news/gaming.csv index c088e1e..0e2b89f 100644 --- a/datasets/news/gaming.csv +++ b/datasets/news/gaming.csv @@ -1 +1,2 @@ name, url, language, country +DESIGNER NOTES, http://www.designer-notes.com/feed/, en-US, USA diff --git a/datasets/news/general.csv b/datasets/news/general.csv index be1fecc..7f7001e 100644 --- a/datasets/news/general.csv +++ b/datasets/news/general.csv @@ -6,3 +6,7 @@ National Vanguard, https://nationalvanguard.org/feed/, en-US, USA Vanguard News Network, http://www.vanguardnewsnetwork.com/feed/, en-US, USA Courageous Discourse™ with Dr. Peter McCullough & John Leake, https://petermcculloughmd.substack.com/feed, en-US, USA DER SPIEGEL - International, https://www.spiegel.de/international/index.rss, en-US, Germany +nobulart - Exploring the Great Reset, https://nobulart.com/feed/, en-US, USA +Jerm Warfare, https://jermwarfare.com/feed, en-US, USA +Daily Stormer, https://dailystormer.in/feed/, en-US, USA +Associated Press News, https://apnews.com/index.rss, en-US, USA diff --git a/datasets/news/government.csv b/datasets/news/government.csv index 4c9f850..17298eb 100644 --- a/datasets/news/government.csv +++ b/datasets/news/government.csv @@ -1,4 +1,9 @@ name, url, language, country The Corbett Report, https://www.corbettreport.com/feed/, en-US, Japan ZeroGov, https://zerogov.com/feed/, en-US, USA +Daily Stormer, https://dailystormer.in/feed/, en-US, USA The Organic Prepper, https://www.theorganicprepper.com/feed/, en-US, USA +The Hill News, https://thehill.com/feed/?feed=partnerfeed-news-feed&format=rss, en-US, USA +nobulart - Exploring the Great Reset, https://nobulart.com/feed/, en-US, USA +John W. Whitehead, Constitutional Attorney, https://agovernmentofwolves.com/feed/, en-US, USA +BlackListed News, https://www.blacklistednews.com/rss.php, en-US, USA diff --git a/datasets/news/health.csv b/datasets/news/health.csv new file mode 100644 index 0000000..d28fb9b --- /dev/null +++ b/datasets/news/health.csv @@ -0,0 +1,4 @@ +name, url, language, country +Fluoride Action Network, https://fluoridealert.org/feed/, en-US, USA +MyGNUSolidario, https://my.gnusolidario.org/feed/, en-US, USA +ynet - בריאות, https://www.ynet.co.il/Integration/StoryRss1208.xml, he-IL, Israel diff --git a/datasets/news/internet.csv b/datasets/news/internet.csv new file mode 100644 index 0000000..107882e --- /dev/null +++ b/datasets/news/internet.csv @@ -0,0 +1,2 @@ +name, url, language, country +soeren-hentzschel.at - Aktuelles zu Mozilla, https://www.soeren-hentzschel.at/feed/, de-DE, Germany diff --git a/datasets/news/israel.csv b/datasets/news/israel.csv index 54a9eb8..a85dadd 100644 --- a/datasets/news/israel.csv +++ b/datasets/news/israel.csv @@ -1,7 +1,10 @@ name, url, language, country +MintPress News, https://www.mintpressnews.com/feed/, en-US, USA בחדרי חרדים, https://www.bhol.co.il/rss/index.xml, he-IL, Israel ynet - מבזקים, https://www.ynet.co.il/Integration/StoryRss1854.xml, he-IL, Israel ynet - חדשות, https://www.ynet.co.il/Integration/StoryRss2.xml, he-IL, Israel -ynet - News, https://www.ynet.co.il/3rdparty/mobile/rss/ynetnews/3082/, en-IL, Israel +ynet - News, https://www.ynet.co.il/Integration/StoryRss3082.xml, en-IL, Israel העין השביעית, https://www.the7eye.org.il/feed, he-IL, Israel +ynet - מעורבות, https://www.ynet.co.il/Integration/StoryRss3262.xml, he-IL, Israel +Jerm Warfare, https://jermwarfare.com/feed, en-US, USA diff --git a/datasets/news/judaism.csv b/datasets/news/judaism.csv index aebd7e4..ce925f9 100644 --- a/datasets/news/judaism.csv +++ b/datasets/news/judaism.csv @@ -1,5 +1,6 @@ name, url, language, country בחדרי חרדים, https://www.bhol.co.il/rss/index.xml, he-IL, Israel ynet - יהדות, https://www.ynet.co.il/Integration/StoryRss4403.xml, he-IL, Israel -ynet - Jewish, https://www.ynet.co.il/3rdparty/mobile/rss/ynetnews/3443/, en-IL, Israel +ynet - Jewish, https://www.ynet.co.il/Integration/StoryRss3443.xml, en-IL, Israel +Jerm Warfare, https://jermwarfare.com/feed, en-US, USA diff --git a/datasets/news/lifestyle.csv b/datasets/news/lifestyle.csv index 3e96a3b..9f5488f 100644 --- a/datasets/news/lifestyle.csv +++ b/datasets/news/lifestyle.csv @@ -2,3 +2,4 @@ name, url, language, country Jacob McCormick, https://mccor.xyz/rss.xml, en-US, USA The Organic Prepper, https://www.theorganicprepper.com/feed/, en-US, USA XXIIVV, https://wiki.xxiivv.com/links/rss.xml, en-US, Canada +Divine Lifestyle, https://divinelifestyle.com/feed/, en-US, USA diff --git a/datasets/news/linux.csv b/datasets/news/linux.csv index d443772..fa98607 100644 --- a/datasets/news/linux.csv +++ b/datasets/news/linux.csv @@ -1,3 +1,4 @@ name, url, language, country Linux Professional Institute (LPI), https://www.lpi.org/feed/, en-US, Canada LinuxConfig, https://linuxconfig.org/feed, en-US, Worldwide +The Logs, https://www.flu0r1ne.net/logs/rss.xml, en-US, USA diff --git a/datasets/news/middle_east.csv b/datasets/news/middle_east.csv index d65c693..ffee8f1 100644 --- a/datasets/news/middle_east.csv +++ b/datasets/news/middle_east.csv @@ -1,2 +1,4 @@ name, url, language, country MintPress News, https://www.mintpressnews.com/feed/, en-US, USA +Al-Mayadeen, https://www.almayadeen.net/feed/, ar-AR, Lebanon +Jerm Warfare, https://jermwarfare.com/feed, en-US, USA diff --git a/datasets/news/nature.csv b/datasets/news/nature.csv new file mode 100644 index 0000000..3edfec1 --- /dev/null +++ b/datasets/news/nature.csv @@ -0,0 +1,2 @@ +name, url, language, country +ynet - ירוק, https://www.ynet.co.il/Integration/StoryRss4872.xml, he-IL, Israel diff --git a/datasets/news/occult.csv b/datasets/news/occult.csv new file mode 100644 index 0000000..4c1bfd1 --- /dev/null +++ b/datasets/news/occult.csv @@ -0,0 +1,2 @@ +name, url, language, country +nobulart - Exploring the Great Reset, https://nobulart.com/feed/, en-US, USA diff --git a/datasets/news/opinions.csv b/datasets/news/opinions.csv index f6ceda9..82f12ad 100644 --- a/datasets/news/opinions.csv +++ b/datasets/news/opinions.csv @@ -2,4 +2,6 @@ name, url, language, country National Vanguard, https://nationalvanguard.org/feed/, en-US, USA Vanguard News Network, http://www.vanguardnewsnetwork.com/feed/, en-US, USA דה מרקר - פרשנויות היום, https://www.themarker.com/srv/tm-opinions, he-IL, Israel +Richard Stallman's Political Notes, https://stallman.org/rss/rss.xml, en-US, USA +ynet - דעות, https://www.ynet.co.il/Integration/StoryRss194.xml, he-IL, Israel diff --git a/datasets/news/pharma.csv b/datasets/news/pharma.csv new file mode 100644 index 0000000..d1dc4fd --- /dev/null +++ b/datasets/news/pharma.csv @@ -0,0 +1,2 @@ +name, url, language, country +STAT, https://www.statnews.com/feed/, en-US, USA diff --git a/datasets/news/privacy.csv b/datasets/news/privacy.csv index c088e1e..d495e2c 100644 --- a/datasets/news/privacy.csv +++ b/datasets/news/privacy.csv @@ -1 +1,2 @@ name, url, language, country +The Logs, https://www.flu0r1ne.net/logs/rss.xml, en-US, USA diff --git a/datasets/news/propaganda.csv b/datasets/news/propaganda.csv index 9d14b6d..01a0682 100644 --- a/datasets/news/propaganda.csv +++ b/datasets/news/propaganda.csv @@ -1,3 +1,4 @@ name, url, language, country -העין השביעית, https://www.the7eye.org.il/feed, he-IL, Israel +Daily Stormer, https://dailystormer.in/feed/, en-US, USA Fakeologist, https://fakeologist.com/feed/, en-US, Canada +העין השביעית, https://www.the7eye.org.il/feed, he-IL, Israel diff --git a/datasets/news/security.csv b/datasets/news/security.csv index 3585d9f..01c5ad0 100644 --- a/datasets/news/security.csv +++ b/datasets/news/security.csv @@ -1,2 +1,3 @@ name, url, language, country The Organic Prepper, https://www.theorganicprepper.com/feed/, en-US, USA +The Logs, https://www.flu0r1ne.net/logs/rss.xml, en-US, USA diff --git a/datasets/news/sports.csv b/datasets/news/sports.csv index c088e1e..b723ecb 100644 --- a/datasets/news/sports.csv +++ b/datasets/news/sports.csv @@ -1 +1,2 @@ name, url, language, country +ynet - ספורט, https://www.ynet.co.il/Integration/StoryRss3.xml, he-IL, Israel diff --git a/datasets/news/survival.csv b/datasets/news/survival.csv index 3585d9f..60d1641 100644 --- a/datasets/news/survival.csv +++ b/datasets/news/survival.csv @@ -1,2 +1,4 @@ name, url, language, country The Organic Prepper, https://www.theorganicprepper.com/feed/, en-US, USA +nobulart - Exploring the Great Reset, https://nobulart.com/feed/, en-US, USA + diff --git a/datasets/news/technology.csv b/datasets/news/technology.csv index e9efbcd..e5ae212 100644 --- a/datasets/news/technology.csv +++ b/datasets/news/technology.csv @@ -1,2 +1,6 @@ name, url, language, country Developpez, https://www.developpez.com/index/atom, fr-FR, France +The Logs, https://www.flu0r1ne.net/logs/rss.xml, en-US, USA +CryptoSlate, https://cryptoslate.com/feed/, en-US, USA +Daily Stormer, https://dailystormer.in/feed/, en-US, USA +Futurism, https://futurism.com/feed, en-US, USA diff --git a/datasets/news/travel.csv b/datasets/news/travel.csv new file mode 100644 index 0000000..3b7b392 --- /dev/null +++ b/datasets/news/travel.csv @@ -0,0 +1,2 @@ +name, url, language, country +ynet - תיירות, https://www.ynet.co.il/Integration/StoryRss598.xml, he-IL, Israel diff --git a/datasets/news/united_states.csv b/datasets/news/united_states.csv new file mode 100644 index 0000000..f83b1cc --- /dev/null +++ b/datasets/news/united_states.csv @@ -0,0 +1,6 @@ +name, url, language, country +ZeroGov, https://zerogov.com/feed/, en-US, USA +The Organic Prepper, https://www.theorganicprepper.com/feed/, en-US, USA +The Hill News, https://thehill.com/feed/?feed=partnerfeed-news-feed&format=rss, en-US, USA +John W. Whitehead, Constitutional Attorney, https://agovernmentofwolves.com/feed/, en-US, USA +BlackListed News, https://www.blacklistednews.com/rss.php, en-US, USA diff --git a/datasets/news/vehicle.csv b/datasets/news/vehicle.csv new file mode 100644 index 0000000..f6f00f6 --- /dev/null +++ b/datasets/news/vehicle.csv @@ -0,0 +1,2 @@ +name, url, language, country +ynet - רכב, https://www.ynet.co.il/Integration/StoryRss550.xml, he-IL, Israel diff --git a/datasets/news/war.csv b/datasets/news/war.csv index c088e1e..c01a38c 100644 --- a/datasets/news/war.csv +++ b/datasets/news/war.csv @@ -1 +1,3 @@ name, url, language, country +Jerm Warfare, https://jermwarfare.com/feed, en-US, USA +Daily Stormer, https://dailystormer.in/feed/, en-US, USA diff --git a/datasets/organizations/netherlands.csv b/datasets/organizations/netherlands.csv new file mode 100644 index 0000000..2789b01 --- /dev/null +++ b/datasets/organizations/netherlands.csv @@ -0,0 +1,2 @@ +name, url, language, country +NLnet news, https://nlnet.nl/feed.atom, en-US, Netherlands diff --git a/datasets/tutorials/data.csv b/datasets/tutorials/data.csv new file mode 100644 index 0000000..6a7df58 --- /dev/null +++ b/datasets/tutorials/data.csv @@ -0,0 +1,2 @@ +name, url, language, country +Data Science Parichay, https://datascienceparichay.com/feed/, en-US, Worldwide diff --git a/datasets/tutorials/python.csv b/datasets/tutorials/python.csv new file mode 100644 index 0000000..12be047 --- /dev/null +++ b/datasets/tutorials/python.csv @@ -0,0 +1,10 @@ +name, url, language, country +Data Science Parichay, https://datascienceparichay.com/feed/, en-US, Worldwide +Super Fast Python, https://superfastpython.com/feed/, en-US, Worldwide +Python Clear, https://www.pythonclear.com/feed/, en-US, Worldwide +Python Guides, https://pythonguides.com/feed/, en-US, Worldwide +AskPython, https://www.askpython.com/feed, en-US, Worldwide +Python Morsels, https://www.pythonmorsels.com/topics/feed/, en-US, Worldwide +Python GUIs, https://www.pythonguis.com/feeds/atom.xml, en-US, Worldwide +Python Examples, https://pythonexamples.org/feed/, en-US, Worldwide +AppDividend, https://appdividend.com/feed/, en-US, Worldwide diff --git a/datasets/wiki/computing.csv b/datasets/wiki/computing.csv new file mode 100644 index 0000000..35b4059 --- /dev/null +++ b/datasets/wiki/computing.csv @@ -0,0 +1,2 @@ +name, url, language, country +[ ChaoticWiki ] Content for /., https://wiki.chaotic.ninja/.rss_full, en-US, Worldwide