Spaces:

mgokg
/

schichtplan

Runtime error

App Files Community

mgokg committed on Jan 24

Commit

7d31ac3

verified ·

1 Parent(s): bca18f5

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -15

app.py CHANGED Viewed

@@ -17,6 +17,7 @@ client = Groq(api_key=api_key)
 def process_audio(audio_bytes):
     """Verarbeitet Audio-Bytes und gibt Transkript zurück"""
     try:
         # Konvertiere Bytes in Audio-Daten
         audio_io = io.BytesIO(audio_bytes)
@@ -27,7 +28,7 @@ def process_audio(audio_bytes):
             with open(tmpfile.name, "rb") as audio_file:
                 transcription = client.audio.transcriptions.create(
-                    file=(tmpfile.name, audio_file, "audio/wav"),
                     model="whisper-large-v3-turbo",
                     language="de",
                     response_format="text"
@@ -37,25 +38,36 @@ def process_audio(audio_bytes):
     except Exception as e:
         return f"Fehler: {str(e)}"
     finally:
-        if 'tmpfile' in locals():
             os.unlink(tmpfile.name)
 # Streamlit UI
 st.title("🎤 Audio Transkription")
 st.info("Funktioniert auf Hugging Face Spaces!")
-#sr_outputs = st.text
-audio_bytes = st.audio_input(
-    "Oder sprechen Sie jetzt:",
 )
-if audio_bytes:
-    # Verarbeitung Mikrofonaufnahme
-    try:
-        # Konvertiere Bytes in Audio-Daten
-        audio_io = io.BytesIO(audio_bytes)
-        audio_data = sf.read(audio_io)
-        transcription = processaudio(audio_data)
-        st.text(transcription)
-    except Exception as e:
-        st.text(f"Fehler bei der Aufnahmeverarbeitung: {str(e)}")

 def process_audio(audio_bytes):
     """Verarbeitet Audio-Bytes und gibt Transkript zurück"""
+    tmpfile = None  # Initialisierung für finally-Block
     try:
         # Konvertiere Bytes in Audio-Daten
         audio_io = io.BytesIO(audio_bytes)
             with open(tmpfile.name, "rb") as audio_file:
                 transcription = client.audio.transcriptions.create(
+                    file=(os.path.basename(tmpfile.name), audio_file),  # Korrigierte Parameter
                     model="whisper-large-v3-turbo",
                     language="de",
                     response_format="text"
     except Exception as e:
         return f"Fehler: {str(e)}"
     finally:
+        if tmpfile and os.path.exists(tmpfile.name):
             os.unlink(tmpfile.name)
 # Streamlit UI
 st.title("🎤 Audio Transkription")
 st.info("Funktioniert auf Hugging Face Spaces!")
+# Kombinierter Uploader für Datei und Mikrofon
+audio_file = st.file_uploader(
+    "Aufnahme starten oder Datei hochladen",
+    type=["wav"],
+    accept_multiple_files=False,
+    help="Klicken Sie auf 'Browse Files' und wählen Sie im Browser 'Take a recording'"
 )
+if audio_file:
+    with st.spinner("Verarbeite Audio..."):
+        try:
+            # Datei in Bytes lesen
+            audio_bytes = audio_file.read()
+            # Transkription durchführen
+            result = process_audio(audio_bytes)
+            # Ergebnis anzeigen
+            st.subheader("Transkription:")
+            st.success(result)
+            # Audio-Player anzeigen
+            st.audio(audio_bytes, format="audio/wav")
+        except Exception as e:
+            st.error(f"Fehler: {str(e)}")