broadfield-dev committed on
Commit
d8b8e62
·
verified ·
1 Parent(s): 715921b

Update rss_processor.py

Browse files
Files changed (1) hide show
  1. rss_processor.py +37 -2
rss_processor.py CHANGED
@@ -12,10 +12,45 @@ logger = logging.getLogger(__name__)
12
  # Constants
13
  LOCAL_DB_DIR = "chroma_db"
14
  RSS_FEEDS = [
15
- "https://www.nasa.gov/rss/dyn/breaking_news.rss",
16
  "https://www.sciencedaily.com/rss/top/science.xml",
 
 
 
 
 
17
  "https://www.wired.com/feed/rss",
18
- # Add more feeds as needed; starting with reliable ones
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  ]
20
 
21
  # Initialize embedding model and vector DB
 
12
  # Constants
13
  LOCAL_DB_DIR = "chroma_db"
14
  RSS_FEEDS = [
 
15
  "https://www.sciencedaily.com/rss/top/science.xml",
16
+ "https://www.horoscope.com/us/horoscopes/general/rss/horoscope-rss.aspx",
17
+ "http://rss.cnn.com/rss/cnn_allpolitics.rss",
18
+ "https://phys.org/rss-feed/physics-news/",
19
+ "https://www.spaceweatherlive.com/en/news/rss",
20
+ "https://weather.com/feeds/rss",
21
  "https://www.wired.com/feed/rss",
22
+ "https://www.nasa.gov/rss/dyn/breaking_news.rss",
23
+ "https://www.nationalgeographic.com/feed/",
24
+ "https://www.nature.com/nature.rss",
25
+ "https://www.scientificamerican.com/rss/",
26
+ "https://www.newscientist.com/feed/home/",
27
+ "https://www.livescience.com/feeds/all",
28
+ "https://astrostyle.com/feed/",
29
+ "https://www.vogue.com/feed/rss",
30
+ "https://feeds.bbci.co.uk/news/politics/rss.xml",
31
+ "https://www.reuters.com/arc/outboundfeeds/newsletter-politics/?outputType=xml",
32
+ "https://www.politico.com/rss/politics.xml",
33
+ "https://thehill.com/feed/",
34
+ "https://www.aps.org/publications/apsnews/updates/rss.cfm",
35
+ "https://www.quantamagazine.org/feed/",
36
+ "https://www.sciencedaily.com/rss/matter_energy/physics.xml",
37
+ "https://physicsworld.com/feed/",
38
+ "https://www.swpc.noaa.gov/rss.xml",
39
+ "https://feeds.bbci.co.uk/weather/feeds/rss/5day/world/",
40
+ "https://www.weather.gov/rss",
41
+ "https://www.foxweather.com/rss",
42
+ "https://techcrunch.com/feed/",
43
+ "https://arstechnica.com/feed/",
44
+ "https://gizmodo.com/rss",
45
+ "https://www.theverge.com/rss/index.xml",
46
+ "https://www.space.com/feeds/all",
47
+ "https://www.universetoday.com/feed/",
48
+ "https://skyandtelescope.org/feed/",
49
+ "https://www.esa.int/rss",
50
+ "https://www.smithsonianmag.com/rss/",
51
+ "https://www.popsci.com/rss.xml",
52
+ "https://www.discovermagazine.com/rss",
53
+ "https://www.atlasobscura.com/feeds/latest"
54
  ]
55
 
56
  # Initialize embedding model and vector DB