webscrapper

Sleeping

Arafath10 committed on Oct 2, 2024

Commit

b8a08e6

verified ·

1 Parent(s): 1d74e32

Update scraper.py

Files changed (1) hide show

scraper.py CHANGED Viewed

@@ -17,13 +17,6 @@ class Scraper:
                 user_agent="Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
             )
-            # Set additional headers to force HTTP/1.1 and avoid detection
-            await context.set_extra_http_headers({
-                "Accept-Language": "en-US,en;q=0.9",
-                "Upgrade-Insecure-Requests": "1",
-                "Connection": "keep-alive"  # Force HTTP/1.1 instead of HTTP/2
-            })
             # Open a new page
             page = await context.new_page()
@@ -114,7 +107,7 @@ class Scraper:
     @staticmethod
     async def scrape(url):
         try:
-            headers = {'User-Agent': 'Mozilla/5.0'}
             response = requests.get(url,timeout=3)
             soup = BeautifulSoup(response.content, 'html.parser')

                 user_agent="Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
             )
             # Open a new page
             page = await context.new_page()
     @staticmethod
     async def scrape(url):
         try:
+            headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'}
             response = requests.get(url,timeout=3)
             soup = BeautifulSoup(response.content, 'html.parser')