First_agent_template

Sleeping

App Files Files Community

Adding a custom tool to scrape the top news result from the ZeroHedge News feed

by dvt81 - opened Mar 18

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+45

-9

Files changed (1) hide show

app.py +45 -9

app.py CHANGED Viewed

@@ -7,16 +7,52 @@ from tools.final_answer import FinalAnswerTool
 from Gradio_UI import GradioUI
-# Below is an example of a tool that does nothing. Amaze us with your creativity !
 @tool
-def my_custom_tool(arg1:str, arg2:int)-> str: #it's important to specify the return type
-    #Keep this format for the description / args / args description but feel free to modify the tool
-    """A tool that does nothing yet
-    Args:
-        arg1: the first argument
-        arg2: the second argument
     """
-    return "What magic will you build ?"
 @tool
 def get_current_time_in_timezone(timezone: str) -> str:
@@ -55,7 +91,7 @@ with open("prompts.yaml", 'r') as stream:
 agent = CodeAgent(
     model=model,
-    tools=[final_answer], ## add your tools here (don't remove final answer)
     max_steps=6,
     verbosity_level=1,
     grammar=None,

 from Gradio_UI import GradioUI
+from selenium import webdriver
 @tool
+def get_zh_top_news() -> tuple[str, str]:
+    """A tool that retrieves the current top news article's title and URL from www.zerohedge.com.
+    Starts a headless Chrome session through Selenium, loads the ZeroHedge homepage, reads the
+    element returned for the article-teaser title selector, and always quits the browser afterwards.
+    Returns:
+        tuple[str, str]: A tuple containing the article title (str) and its URL (str).
+            If anything fails inside the try block (page load, element lookup, attribute read),
+            the fallback pair ("Error: Headline not found", "https://www.zerohedge.com")
+            is returned instead of raising.
+    Raises:
+        Exception: Only errors raised before the try block propagate, i.e. while building the
+            Chrome options or starting the WebDriver; later failures are caught and swallowed.
     """
+    # Set up Chrome options for headless browsing (optional, improves performance)
+    # NOTE(review): Options and By are not imported in the lines visible here - confirm they
+    # are imported elsewhere in app.py, otherwise this function fails with NameError.
+    chrome_options = Options()
+    chrome_options.add_argument("--headless")  # Run without opening a browser window
+    chrome_options.add_argument("--disable-gpu")  # Disable GPU acceleration in headless mode
+    # Initialize the Selenium WebDriver (assumes chromedriver is in PATH or specify path via Service)
+    # This call sits outside the try block, so a failure to start Chrome propagates to the caller.
+    driver = webdriver.Chrome(options=chrome_options)
+    try:
+        # Navigate to ZeroHedge homepage
+        driver.get("https://www.zerohedge.com")
+        # Find the top article element using a CSS selector
+        # Based on ZeroHedge's structure, the top headline is typically the first prominent article
+        # NOTE(review): the "__mK4rX" class suffix looks build-generated and may change between
+        # site deployments - confirm the selector is still valid.
+        top_article = driver.find_element(By.CSS_SELECTOR, "article .ArticleTeaser_titleLink__mK4rX")
+        # Extract the title from the text content of the link
+        article_title = top_article.text.strip()
+        # Extract the URL from the href attribute
+        article_link = top_article.get_attribute("href")
+        # Prefix the site origin when the href does not already start with "http".
+        # NOTE(review): presumably this covers relative hrefs - confirm what Selenium returns here.
+        if not article_link.startswith("http"):
+            article_link = f"https://www.zerohedge.com{article_link}"
+        return article_title, article_link
+    # Any failure inside the try block is reported as a placeholder pair rather than raised;
+    # the caught exception `e` is not used, so the underlying cause is not surfaced.
+    except Exception as e:
+        return "Error: Headline not found", "https://www.zerohedge.com"
+    finally:
+        # Always close the browser session to free resources
+        driver.quit()
 @tool
 def get_current_time_in_timezone(timezone: str) -> str:
 agent = CodeAgent(
     model=model,
+    tools=[get_zh_top_news,get_current_time_in_timezone,final_answer], ## add your tools here (don't remove final answer)
     max_steps=6,
     verbosity_level=1,
     grammar=None,