Spaces:
Sleeping
Sleeping
Update tools/visit_webpage.py
Browse files- tools/visit_webpage.py +9 -2
tools/visit_webpage.py
CHANGED
@@ -3,6 +3,7 @@ from smolagents.tools import Tool
|
|
3 |
import requests
|
4 |
import markdownify
|
5 |
import smolagents
|
|
|
6 |
|
7 |
class VisitWebpageTool(Tool):
|
8 |
name = "visit_webpage"
|
@@ -23,8 +24,14 @@ class VisitWebpageTool(Tool):
|
|
23 |
) from e
|
24 |
try:
|
25 |
# Send a GET request to the URL with a 20-second timeout
|
26 |
-
|
27 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
28 |
|
29 |
# Convert the HTML content to Markdown
|
30 |
markdown_content = markdownify(response.text).strip()
|
|
|
3 |
import requests
|
4 |
import markdownify
|
5 |
import smolagents
|
6 |
+
from urllib.request import Request, urlopen
|
7 |
|
8 |
class VisitWebpageTool(Tool):
|
9 |
name = "visit_webpage"
|
|
|
24 |
) from e
|
25 |
try:
|
26 |
# Send a GET request to the URL with a 20-second timeout
|
27 |
+
req = Request(
|
28 |
+
url=url,
|
29 |
+
headers={'User-Agent': 'Mozilla/5.0'}
|
30 |
+
)
|
31 |
+
response = urlopen(req).read()
|
32 |
+
|
33 |
+
#response = requests.get(url, timeout=20)
|
34 |
+
#response.raise_for_status() # Raise an exception for bad status codes
|
35 |
|
36 |
# Convert the HTML content to Markdown
|
37 |
markdown_content = markdownify(response.text).strip()
|