Spaces:

datenwerkzeuge
/

Webseiten-URL-Extraktor

Sleeping

bsenst committed on Dec 8, 2024

Commit

dced2cd

verified ·

1 Parent(s): 4f61c6e

Create app.py

Files changed (1) hide show

app.py ADDED Viewed

+import streamlit as st
+import requests
+from bs4 import BeautifulSoup
+# Funktion, um alle URLs von einer Webseite zu extrahieren
+def extract_urls(url):
+    try:
+        response = requests.get(url)
+        response.raise_for_status()
+        soup = BeautifulSoup(response.text, 'html.parser')
+        links = [a.get('href') for a in soup.find_all('a', href=True)]
+        return links
+    except Exception as e:
+        return str(e)
+# Streamlit app: page title
+st.title("Webseiten-URL-Extraktor")
+# Input field for the URL of the page to scan
+url_input = st.text_input("Gib die URL der Webseite ein:", placeholder="https://example.com")
+# Wenn der Nutzer eine URL eingibt und auf den Button klickt
+if st.button("URLs extrahieren"):
+    if url_input:
+        st.write(f"Extrahiere URLs von: {url_input}")
+        urls = extract_urls(url_input)