Spaces:

mgokg
/

google_search

Running

App Files Files Community

mgokg committed on Jan 7

Commit

10ae401

verified ·

1 Parent(s): ba251cc

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -34

app.py CHANGED Viewed

@@ -62,7 +62,6 @@ def list_of_clubs(ort):
             target_div = soup.select_one('div.row-cols-1:nth-child(4)')
             if target_div:
-                #links = [urljoin(base_url, a['href']) for a in target_div.find_all('a', href=True)]
                 texts = [a.text for a in target_div.find_all('a', href=True)]
                 all_links_text.extend(texts)
             else:
@@ -74,56 +73,28 @@ def list_of_clubs(ort):
     all_links_text = all_links_text[0::2]
     return all_links_text
-def google_search(query):
-    headers = {
-        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
-    }
-    # Führt die Suche durch und erhält das erste Ergebnis
-    for result in search(query, num_results=1):
-        url = result
-        break
-    response = requests.get(url)
-    soup = BeautifulSoup(response.text, 'html.parser')
-    #first_div = soup.find('div', class_='MjjYud')
-    first_div = soup.find('body')
-    return first_div.text.strip()
 def process_ort(ort):
     links_text = list_of_clubs(ort)
     vereine = []
     for verein in links_text:
-        #query = f"impressum {verein}"
         headers = {
             "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
         }
-        #search_results = google_search(search_term)
         url = f"https://www.google.com/search?q=impressum {verein}"
         response = requests.get(url, headers=headers)
         soup = BeautifulSoup(response.content, 'html.parser')
         impressum_div = soup.find('body')
-        #return impressum_div.text
-        #uri = f"https://www.google.com/search?q={query}"
-        #response = requests.get(uri)
-        #soup = BeautifulSoup(response.text, 'html.parser')
-        #first_div = soup.find('body')
-        #erg = llm(first_div.text)
-        #return first_div.text
         contact_detailes = impressum_div.text
-        #json_object = llm(contact_detailes)
-        vereine.append(contact_detailes)
-        #vereine.append(json_object)
-        #vereine.extend(json_object)
     return vereine
-    return links_text
 demo = gr.Interface(
-    #fn=google_search,
     fn=process_ort,
     inputs=gr.Textbox(lines=1, placeholder="Geben Sie Ihre Suchanfrage ein..."),
     outputs="text",

             target_div = soup.select_one('div.row-cols-1:nth-child(4)')
             if target_div:
                 texts = [a.text for a in target_div.find_all('a', href=True)]
                 all_links_text.extend(texts)
             else:
     all_links_text = all_links_text[0::2]
     return all_links_text
 def process_ort(ort):
     # Build a list with one llm() result per club found for `ort`.
     #
     # For each club name returned by list_of_clubs(ort), request a Google
     # search page for "impressum <club name>", take the text of the page's
     # <body>, pass that text to llm(), and append llm()'s result to the
     # returned list.
     #
     # NOTE(review): list_of_clubs() and llm() are defined outside this view;
     # the variable name suggests llm() returns a JSON object -- confirm.
     links_text = list_of_clubs(ort)
     vereine = []
     for verein in links_text:
         # Browser-like User-Agent header sent with the search request.
         headers = {
             "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
         }
         # NOTE(review): the club name is interpolated into the query string
         # as-is (spaces and special characters are not URL-encoded here).
         url = f"https://www.google.com/search?q=impressum {verein}"
         # NOTE(review): no timeout is passed and the HTTP status is not checked.
         response = requests.get(url, headers=headers)
         soup = BeautifulSoup(response.content, 'html.parser')
         # NOTE(review): find('body') yields None when the document has no
         # <body>; the `.text` access below would then raise AttributeError.
         impressum_div = soup.find('body')
         contact_detailes = impressum_div.text
+        json_object = llm(contact_detailes)
+        #vereine.append(contact_detailes)
+        vereine.append(json_object)
     return vereine
 demo = gr.Interface(
     fn=process_ort,
     inputs=gr.Textbox(lines=1, placeholder="Geben Sie Ihre Suchanfrage ein..."),
     outputs="text",