Spaces:
Running
Running
Update rss_processor.py
Browse files
- rss_processor.py +37 -2
rss_processor.py
CHANGED
@@ -12,10 +12,45 @@ logger = logging.getLogger(__name__)
|
|
12 |
# Constants
|
13 |
LOCAL_DB_DIR = "chroma_db"
|
14 |
RSS_FEEDS = [
|
15 |
-
"https://www.nasa.gov/rss/dyn/breaking_news.rss",
|
16 |
"https://www.sciencedaily.com/rss/top/science.xml",
|
|
|
|
|
|
|
|
|
|
|
17 |
"https://www.wired.com/feed/rss",
|
18 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
19 |
]
|
20 |
|
21 |
# Initialize embedding model and vector DB
|
|
|
12 |
# Constants
|
13 |
LOCAL_DB_DIR = "chroma_db"
|
14 |
RSS_FEEDS = [
|
|
|
15 |
"https://www.sciencedaily.com/rss/top/science.xml",
|
16 |
+
"https://www.horoscope.com/us/horoscopes/general/rss/horoscope-rss.aspx",
|
17 |
+
"http://rss.cnn.com/rss/cnn_allpolitics.rss",
|
18 |
+
"https://phys.org/rss-feed/physics-news/",
|
19 |
+
"https://www.spaceweatherlive.com/en/news/rss",
|
20 |
+
"https://weather.com/feeds/rss",
|
21 |
"https://www.wired.com/feed/rss",
|
22 |
+
"https://www.nasa.gov/rss/dyn/breaking_news.rss",
|
23 |
+
"https://www.nationalgeographic.com/feed/",
|
24 |
+
"https://www.nature.com/nature.rss",
|
25 |
+
"https://www.scientificamerican.com/rss/",
|
26 |
+
"https://www.newscientist.com/feed/home/",
|
27 |
+
"https://www.livescience.com/feeds/all",
|
28 |
+
"https://astrostyle.com/feed/",
|
29 |
+
"https://www.vogue.com/feed/rss",
|
30 |
+
"https://feeds.bbci.co.uk/news/politics/rss.xml",
|
31 |
+
"https://www.reuters.com/arc/outboundfeeds/newsletter-politics/?outputType=xml",
|
32 |
+
"https://www.politico.com/rss/politics.xml",
|
33 |
+
"https://thehill.com/feed/",
|
34 |
+
"https://www.aps.org/publications/apsnews/updates/rss.cfm",
|
35 |
+
"https://www.quantamagazine.org/feed/",
|
36 |
+
"https://www.sciencedaily.com/rss/matter_energy/physics.xml",
|
37 |
+
"https://physicsworld.com/feed/",
|
38 |
+
"https://www.swpc.noaa.gov/rss.xml",
|
39 |
+
"https://feeds.bbci.co.uk/weather/feeds/rss/5day/world/",
|
40 |
+
"https://www.weather.gov/rss",
|
41 |
+
"https://www.foxweather.com/rss",
|
42 |
+
"https://techcrunch.com/feed/",
|
43 |
+
"https://arstechnica.com/feed/",
|
44 |
+
"https://gizmodo.com/rss",
|
45 |
+
"https://www.theverge.com/rss/index.xml",
|
46 |
+
"https://www.space.com/feeds/all",
|
47 |
+
"https://www.universetoday.com/feed/",
|
48 |
+
"https://skyandtelescope.org/feed/",
|
49 |
+
"https://www.esa.int/rss",
|
50 |
+
"https://www.smithsonianmag.com/rss/",
|
51 |
+
"https://www.popsci.com/rss.xml",
|
52 |
+
"https://www.discovermagazine.com/rss",
|
53 |
+
"https://www.atlasobscura.com/feeds/latest"
|
54 |
]
|
55 |
|
56 |
# Initialize embedding model and vector DB
|