zvl commited on
Commit
27f26c0
·
verified ·
1 Parent(s): ae7a494

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +29 -6
app.py CHANGED
@@ -4,19 +4,42 @@ import requests
4
  import pytz
5
  import yaml
6
  from tools.final_answer import FinalAnswerTool
 
7
 
8
  from Gradio_UI import GradioUI
9
 
10
  # Below is an example of a tool that does nothing. Amaze us with your creativity !
11
  @tool
12
- def my_custom_tool(arg1:str, arg2:int)-> str: #it's import to specify the return type
13
- #Keep this format for the description / args / args description but feel free to modify the tool
14
- """A tool that does nothing yet
15
  Args:
16
- arg1: the first argument
17
- arg2: the second argument
 
 
18
  """
19
- return "What magic will you build ?"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20
 
21
  @tool
22
  def get_current_time_in_timezone(timezone: str) -> str:
 
4
  import pytz
5
  import yaml
6
  from tools.final_answer import FinalAnswerTool
7
+ from bs4 import BeautifulSoup
8
 
9
  from Gradio_UI import GradioUI
10
 
11
  # Below is an example of a tool that does nothing. Amaze us with your creativity !
12
  @tool
13
+ def extract_metadata_from_url(url: str) -> dict:
14
+ """Extrae todos los metadatos de una página web.
15
+
16
  Args:
17
+ url: La URL de la página web a analizar.
18
+
19
+ Returns:
20
+ Un diccionario con los metadatos encontrados.
21
  """
22
+ try:
23
+ # Obtener el contenido de la página
24
+ headers = {'User-Agent': 'Mozilla/5.0'}
25
+ response = requests.get(url, headers=headers)
26
+ response.raise_for_status() # Lanza un error si el request falla
27
+
28
+ # Parsear el contenido HTML con BeautifulSoup
29
+ soup = BeautifulSoup(response.text, 'html.parser')
30
+
31
+ # Extraer los metadatos de la página
32
+ metadata = {}
33
+ for meta in soup.find_all('meta'):
34
+ if 'name' in meta.attrs and 'content' in meta.attrs:
35
+ metadata[meta['name']] = meta['content']
36
+ elif 'property' in meta.attrs and 'content' in meta.attrs:
37
+ metadata[meta['property']] = meta['content']
38
+
39
+ return metadata if metadata else {"error": "No se encontraron metadatos en la página."}
40
+
41
+ except requests.exceptions.RequestException as e:
42
+ return {"error": f"Error al acceder a la URL: {str(e)}"}
43
 
44
  @tool
45
  def get_current_time_in_timezone(timezone: str) -> str: