Spaces:

mgokg
/

schichtplan

Running

mgokg committed on Jan 23

Commit

dacc07c

verified ·

1 Parent(s): 7cc7769

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,6 +3,7 @@ import os
 from groq import Groq
 import soundfile as sf
 from tempfile import NamedTemporaryFile
 # Load the API key from the environment variable
 api_key = os.getenv('groqwhisper')
@@ -38,30 +39,27 @@ def processaudio(audio_data):
     except Exception as e:
         return f"Ein Fehler ist aufgetreten: {str(e)}"
-def process_audio(file_path):
-    try:
-        # Open the audio file
-        with open(file_path, "rb") as file:
-            # Create a transcription of the audio file
-            transcription = client.audio.transcriptions.create(
-                file=(os.path.basename(file_path), file.read()),  # Correct passing of filename
-                model="whisper-large-v3-turbo",  # Required model to use for transcription
-                prompt="transcribe",  # Optional
-                language="de",  # Optional
-                response_format="json",  # Optional
-                temperature=0.0  # Optional
-            )
-            # Return the transcription text
-            return transcription.text
-    except Exception as e:
-        return f"Ein Fehler ist aufgetreten: {str(e)}"
 # Streamlit Interface
 st.title("Audio Transkription")
-sr_outputs = st.empty()  # Platzhalter für die Transkription
-sr_inputs = st.file_uploader("Laden Sie eine Audiodatei hoch", type=["wav", "mp3"])
-if sr_inputs is not None:
-    audio_data = sf.read(sr_inputs)
     transcription = processaudio(audio_data)
     sr_outputs.text(transcription)

 from groq import Groq
 import soundfile as sf
 from tempfile import NamedTemporaryFile
+import io  # Für Bytes-IO hinzugefügt
 # Load the API key from the environment variable
 api_key = os.getenv('groqwhisper')
     except Exception as e:
         return f"Ein Fehler ist aufgetreten: {str(e)}"
 # Streamlit Interface
 st.title("Audio Transkription")
+sr_outputs = st.empty()
+# Dateiupload und Mikrofonaufnahme als getrennte Eingaben
+uploaded_file = st.file_uploader("Laden Sie eine Audiodatei hoch", type=["wav", "mp3"])
+audio_bytes = st.audio_input("Oder sprechen Sie jetzt:", type="wav")
+if uploaded_file:
+    # Verarbeitung hochgeladener Datei
+    audio_data = sf.read(uploaded_file)
     transcription = processaudio(audio_data)
     sr_outputs.text(transcription)
+elif audio_bytes:
+    # Verarbeitung Mikrofonaufnahme
+    try:
+        # Konvertiere Bytes in Audio-Daten
+        audio_io = io.BytesIO(audio_bytes)
+        audio_data = sf.read(audio_io)
+        transcription = processaudio(audio_data)
+        sr_outputs.text(transcription)
+    except Exception as e:
+        sr_outputs.text(f"Fehler bei der Aufnahmeverarbeitung: {str(e)}")