dvt81's picture
simplifying with curl
a5390b7 verified
from smolagents import CodeAgent, DuckDuckGoSearchTool, HfApiModel, load_tool, tool
import datetime
import requests
import pytz
import yaml
from tools.final_answer import FinalAnswerTool
from Gradio_UI import GradioUI
from bs4 import BeautifulSoup
import subprocess
@tool
def get_zh_top_news() -> tuple[str, str]:
"""A tool that retrieves the current top news article's title and URL from www.zerohedge.com.
Returns:
tuple[str, str]: A tuple containing the article title (str) and its URL (str).
"""
try:
# Use curl to fetch the HTML content
result = subprocess.run(
["curl", "-s", "https://www.zerohedge.com"],
capture_output=True,
text=True,
check=True
)
html_content = result.stdout
print(f"DEBUG: Fetched HTML length: {len(html_content)}") # Debug: Check if content is retrieved
# Parse HTML with BeautifulSoup
soup = BeautifulSoup(html_content, "html.parser")
# Find the first <h2> with class starting with 'Article_title___'
top_article = soup.find("h2", class_=lambda x: x and x.startswith("Article_title___"))
if not top_article:
print("DEBUG: No matching <h2> found")
return "Error: Headline not found", "https://www.zerohedge.com"
# Extract the <a> tag inside the <h2>
link_tag = top_article.find("a")
if not link_tag:
print("DEBUG: No <a> tag found in top article")
return "Error: Headline not found", "https://www.zerohedge.com"
# Get title and URL
article_title = link_tag.get_text(strip=True) or "No title found"
article_link = link_tag.get("href") or "https://www.zerohedge.com"
# Ensure the link is absolute
if not article_link.startswith("http"):
article_link = f"https://www.zerohedge.com{article_link}"
print(f"DEBUG: Title = '{article_title}', Link = '{article_link}'")
return article_title, article_link
except subprocess.CalledProcessError as e:
print(f"Error fetching page with curl: {e}")
return "Error: Fetch failed", "https://www.zerohedge.com"
except Exception as e:
print(f"Error parsing content: {e}")
return "Error: Headline not found", "https://www.zerohedge.com"
@tool
def get_current_time_in_timezone(timezone: str) -> str:
"""A tool that fetches the current local time in a specified timezone.
Args:
timezone: A string representing a valid timezone (e.g., 'America/New_York').
"""
try:
tz = pytz.timezone(timezone)
local_time = datetime.datetime.now(tz).strftime("%Y-%m-%d %H:%M:%S")
return f"The current local time in {timezone} is: {local_time}"
except Exception as e:
return f"Error fetching time for timezone '{timezone}': {str(e)}"
final_answer = FinalAnswerTool()
model = HfApiModel(
max_tokens=2096,
temperature=0.5,
model_id='Qwen/Qwen2.5-Coder-32B-Instruct',
custom_role_conversions=None,
)
image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)
with open("prompts.yaml", 'r') as stream:
prompt_templates = yaml.safe_load(stream)
agent = CodeAgent(
model=model,
tools=[get_zh_top_news, get_current_time_in_timezone, final_answer],
max_steps=6,
verbosity_level=1,
grammar=None,
planning_interval=None,
name=None,
description=None,
prompt_templates=prompt_templates
)
GradioUI(agent).launch()