First_agent_template

Sleeping

App Files Files Community

dvt81 committed on Mar 19

Commit

ac0f86b

verified ·

1 Parent(s): f9e8166

added more debugging

Browse files

More debugging output to help diagnose the ChromeDriver initialization problem.

Files changed (1) hide show

app.py +17 -11

app.py CHANGED Viewed

@@ -24,36 +24,42 @@ def get_zh_top_news() -> tuple[str, str]:
     """
     # Set up Chrome options for headless browsing
     chrome_options = Options()
-    chrome_options.add_argument("--headless")  # Run without opening a browser window
-    chrome_options.add_argument("--disable-gpu")  # Disable GPU for headless mode
-    chrome_options.add_argument("--no-sandbox")  # Required for Docker environments
-    chrome_options.add_argument("--disable-dev-shm-usage")  # Avoid memory issues in containers
     # Specify ChromeDriver path (installed via Dockerfile)
     service = Service(executable_path="/usr/local/bin/chromedriver")
-    # Initialize the WebDriver
-    driver = webdriver.Chrome(service=service, options=chrome_options)
     try:
         # Navigate to ZeroHedge homepage
         driver.get("https://www.zerohedge.com")
         # Find the first <h2> with class starting with 'Article_title___'
         top_article = driver.find_element(By.CSS_SELECTOR, "h2[class^='Article_title___']")
-        print(f" article object: {top_article}")
         # Extract the title from the <a> tag inside the <h2>
-        article_title = top_article.find_element(By.TAG_NAME, "a").text.strip()
         # Extract the URL from the href attribute of the <a> tag
-        article_link = top_article.find_element(By.TAG_NAME, "a").get_attribute("href")
         # Ensure the link is absolute
         if not article_link.startswith("http"):
             article_link = f"https://www.zerohedge.com{article_link}"
         return article_title, article_link
     except Exception as e:

     """
     # Set up Chrome options for headless browsing
     chrome_options = Options()
+    chrome_options.add_argument("--headless")
+    chrome_options.add_argument("--disable-gpu")
+    chrome_options.add_argument("--no-sandbox")
+    chrome_options.add_argument("--disable-dev-shm-usage")
     # Specify ChromeDriver path (installed via Dockerfile)
     service = Service(executable_path="/usr/local/bin/chromedriver")
+    try:
+        # Initialize the WebDriver
+        driver = webdriver.Chrome(service=service, options=chrome_options)
+        print("DEBUG: WebDriver initialized successfully")
+    except Exception as e:
+        print(f"DEBUG: Failed to initialize WebDriver: {e}")
+        return "Error: WebDriver failed", "https://www.zerohedge.com"
     try:
         # Navigate to ZeroHedge homepage
         driver.get("https://www.zerohedge.com")
+        print("DEBUG: Page loaded")
         # Find the first <h2> with class starting with 'Article_title___'
         top_article = driver.find_element(By.CSS_SELECTOR, "h2[class^='Article_title___']")
+        print(f"DEBUG: Found article object: {top_article}")
         # Extract the title from the <a> tag inside the <h2>
+        article_title = top_article.find_element(By.TAG_NAME, "a").text.strip() or "No title found"
         # Extract the URL from the href attribute of the <a> tag
+        article_link = top_article.find_element(By.TAG_NAME, "a").get_attribute("href") or "https://www.zerohedge.com"
         # Ensure the link is absolute
         if not article_link.startswith("http"):
             article_link = f"https://www.zerohedge.com{article_link}"
+        print(f"DEBUG: Returning title='{article_title}', link='{article_link}'")
         return article_title, article_link
     except Exception as e: