KotVasily committed on
Commit
033b00b
·
verified ·
1 Parent(s): d00cf91

Update news.py

Browse files
Files changed (1) hide show
  1. news.py +13 -5
news.py CHANGED
@@ -20,12 +20,20 @@ class NewsData:
20
  ("https://ru.investing.com/news/forex-news/", "forex-news"),
21
  ("https://ru.investing.com/news/commodities-news/", "commodities-news"),
22
  ]
23
- self.headers = {
24
- 'User-Agent': 'Mozilla/5.0 (Linux i656 ) AppleWebKit/600.38 (KHTML, like Gecko) Chrome/54.0.2398.331 Safari/603',
25
- 'Accept-Language': 'en-US,en;q=0.5',
26
- 'Referer': 'http://google.com'
 
 
27
  }
28
 
 
 
 
 
 
 
29
  self.morph = pymorphy2.MorphAnalyzer() # С помощь него мы будем приводить слова в начальную форму
30
  self.scraper = cloudscraper.create_scraper()
31
 
@@ -39,7 +47,7 @@ class NewsData:
39
  while True:
40
  url = f"{base_url}{page}/"
41
  #response = requests.get(url, headers=self.headers)
42
- response = self.scraper.get(url, headers=self.headers)
43
  print(response)
44
 
45
  if response.status_code == 200:
 
20
  ("https://ru.investing.com/news/forex-news/", "forex-news"),
21
  ("https://ru.investing.com/news/commodities-news/", "commodities-news"),
22
  ]
23
+ self.headers = self.headers = {
24
+ 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
25
+ 'Accept-Language': 'ru-RU,ru;q=0.9,en-US;q=0.8,en;q=0.7',
26
+ 'Accept-Encoding': 'gzip, deflate, br',
27
+ 'Connection': 'keep-alive',
28
+ 'Referer': 'https://www.google.com/'
29
  }
30
 
31
+ self.proxies = {
32
+ "http": "http://46.47.197.210:8080",
33
+ "https": "https://46.47.197.210:8080"
34
+ }
35
+
36
+
37
  self.morph = pymorphy2.MorphAnalyzer() # С помощь него мы будем приводить слова в начальную форму
38
  self.scraper = cloudscraper.create_scraper()
39
 
 
47
  while True:
48
  url = f"{base_url}{page}/"
49
  #response = requests.get(url, headers=self.headers)
50
+ response = self.scraper.get(url, headers=self.headers, proxies=self.proxies)
51
  print(response)
52
 
53
  if response.status_code == 200: