First_agent_template

Sleeping

App Files Community

SilviuMatei committed on Feb 21

Commit

6553c90

verified ·

1 Parent(s): 2a86392

Update tools/getDeviceInfo.py

Browse files

Files changed (1) hide show

tools/getDeviceInfo.py +40 -16

tools/getDeviceInfo.py CHANGED Viewed

@@ -1,26 +1,47 @@
-from typing import Any
-from smolagents.tools import Tool
-import playwright.sync_api as playwright
-class GetDeviceInfoTool(Tool):
-    name = "get_device_info"
-    description = "Opens a browser and uses JavaScript to retrieve device information silently."
-    inputs = {}
-    output_type = "string"
-    def forward(self) -> str:
-        """
-        Opens a headless browser using Playwright and executes JavaScript to silently retrieve device information.
-        Returns:
-            str: A string containing device details such as user agent, platform, and screen resolution.
-        """
         with playwright.sync_api.sync_playwright() as p:
             browser = p.chromium.launch(headless=True)
             page = browser.new_page()
             script = """
-            () => JSON.stringify({
                 userAgent: navigator.userAgent,
                 platform: navigator.platform,
                 language: navigator.language,
@@ -33,7 +54,10 @@ class GetDeviceInfoTool(Tool):
             device_info = page.evaluate(script)
             browser.close()
-        return device_info
     def __init__(self, *args, **kwargs):
         self.is_initialized = False

+class VisitWebpageTool(Tool):
+    name = "visit_webpage"
+    description = "Visits a webpage at the given URL, reads its content as a markdown string, and extracts device information."
+    inputs = {'url': {'type': 'string', 'description': 'The URL of the webpage to visit.'}}
+    output_type = "dict"
+    def forward(self, url: str) -> dict:
+        try:
+            import requests
+            from markdownify import markdownify
+            from requests.exceptions import RequestException
+            from smolagents.utils import truncate_content
+        except ImportError as e:
+            raise ImportError(
+                "You must install packages `markdownify` and `requests` to run this tool: for instance run `pip install markdownify requests`."
+            ) from e
+        try:
+            # Send a GET request to the URL with a 20-second timeout
+            response = requests.get(url, timeout=20)
+            response.raise_for_status()  # Raise an exception for bad status codes
+            # Convert the HTML content to Markdown
+            markdown_content = markdownify(response.text).strip()
+            # Remove multiple line breaks
+            markdown_content = re.sub(r"\n{3,}", "\n\n", markdown_content)
+            webpage_content = truncate_content(markdown_content, 10000)
+        except requests.exceptions.Timeout:
+            webpage_content = "The request timed out. Please try again later or check the URL."
+        except RequestException as e:
+            webpage_content = f"Error fetching the webpage: {str(e)}"
+        except Exception as e:
+            webpage_content = f"An unexpected error occurred: {str(e)}"
+        # Extract device information using Playwright
         with playwright.sync_api.sync_playwright() as p:
             browser = p.chromium.launch(headless=True)
             page = browser.new_page()
             script = """
+            () => ({
                 userAgent: navigator.userAgent,
                 platform: navigator.platform,
                 language: navigator.language,
             device_info = page.evaluate(script)
             browser.close()
+        return {
+            "webpage_content": webpage_content,
+            "device_info": device_info
+        }
     def __init__(self, *args, **kwargs):
         self.is_initialized = False