Spaces:

Nitzantry1
/

pyannote-diarization

Runtime error

File size: 1,516 Bytes

e58bff7
d9e71ec
 
 
e58bff7
d9e71ec
e58bff7
c82bffb
d9e71ec
e58bff7
d9e71ec
c82bffb
 
d9e71ec
c82bffb
 
 
 
e58bff7
 
 
c82bffb
8640564
1c24637
d9e71ec
 
8640564
d9e71ec
 
c82bffb
 
 
d9e71ec
c82bffb
d9e71ec
c82bffb
 
e58bff7
d9e71ec
e58bff7
d9e71ec
 
 
e58bff7
d9e71ec
e58bff7
 
d9e71ec

import os
import tempfile
import gradio as gr
from pyannote.audio import Pipeline

# Read the Hugging Face access token from the environment (the Space's Secret).
hf_token = os.environ.get("HF_TOKEN")
if hf_token is None or hf_token == "":
    # Fail fast at startup: the model load below needs this token.
    raise ValueError("HF_TOKEN is missing. Please set it in the Secrets section.")

# Load the pyannote speaker-diarization pipeline once, at import time.
try:
    pipeline = Pipeline.from_pretrained(
        "pyannote/speaker-diarization",
        use_auth_token=hf_token,
    )
except Exception as e:
    # Chain the original exception so the underlying traceback stays in the logs.
    raise RuntimeError(f"Failed to load the pipeline: {e}") from e

# NOTE(review): pyannote.audio can return None instead of raising when the
# model is gated and the token's account has not accepted its user conditions.
# Catch that here rather than failing later with "'NoneType' is not callable".
if pipeline is None:
    raise RuntimeError(
        "Failed to load the pipeline: Pipeline.from_pretrained returned None. "
        "Check that HF_TOKEN is valid and that the model's user conditions "
        "have been accepted on Hugging Face."
    )

# Speaker-diarization callback and its audio-input helper
def _write_temp_wav(sample_rate, samples):
    """Write in-memory samples to a temporary 16-bit PCM WAV file; return its path.

    ``samples`` is expected to be a NumPy array shaped ``(n_samples,)`` or
    ``(n_samples, n_channels)`` with a signed-integer or float dtype.
    The caller is responsible for deleting the returned file.
    """
    import wave  # local import: not among the file's top-level imports

    kind = samples.dtype.kind
    if kind == "i" and samples.dtype.itemsize == 2:
        # Already 16-bit PCM: only normalise the byte order.
        pcm = samples.astype("<i2")
    elif kind in ("i", "f"):
        if kind == "i":
            # Bring wider/narrower integers to [-1.0, 1.0) before re-quantising.
            full_scale = float(2 ** (8 * samples.dtype.itemsize - 1))
            normalized = samples / full_scale
        else:
            # Float audio is assumed to already be in [-1.0, 1.0].
            normalized = samples
        pcm = (normalized.clip(-1.0, 1.0) * 32767).astype("<i2")
    else:
        raise ValueError(f"Unsupported audio sample dtype: {samples.dtype}")

    n_channels = 1 if pcm.ndim == 1 else pcm.shape[1]

    fd, path = tempfile.mkstemp(suffix=".wav")
    os.close(fd)
    try:
        with wave.open(path, "wb") as wav_file:
            wav_file.setnchannels(n_channels)
            wav_file.setsampwidth(2)
            wav_file.setframerate(int(sample_rate))
            wav_file.writeframes(pcm.tobytes())
    except Exception:
        # Do not leave a half-written file behind.
        os.remove(path)
        raise
    return path


def diarize(audio):
    """Run speaker diarization on the audio supplied by the Gradio input.

    Args:
        audio: One of
            * a path to an audio file (what ``gr.Audio(type="filepath")`` sends),
            * a ``(sample_rate, samples)`` tuple with ``samples`` a NumPy array
              (what the default ``"audio"`` input sends),
            * a tuple whose first item is a file path (the layout this function
              originally assumed; still accepted),
            * ``None`` when nothing was uploaded.

    Returns:
        One line per speaker turn, ``"<speaker>: <start>s - <end>s"``, joined
        with newlines; or a message starting with ``"Error during diarization:"``
        if anything fails.
    """
    if audio is None:
        return "Error during diarization: no audio was provided."

    temp_path = None
    try:
        if isinstance(audio, (str, os.PathLike)):
            audio_file_path = audio
        elif isinstance(audio[0], (str, os.PathLike)):
            audio_file_path = audio[0]
        else:
            # In-memory audio: the pipeline is given a file path, so spill to disk.
            sample_rate, samples = audio
            temp_path = _write_temp_wav(sample_rate, samples)
            audio_file_path = temp_path

        # Run the pyannote pipeline on the audio file.
        diarization = pipeline(audio_file_path)

        # Format every speaker turn as "<speaker>: <start>s - <end>s".
        result = [
            f"{speaker}: {turn.start:.1f}s - {turn.end:.1f}s"
            for turn, _, speaker in diarization.itertracks(yield_label=True)
        ]
        return "\n".join(result)

    except Exception as e:
        # UI boundary: report the failure as text instead of crashing the app.
        return f"Error during diarization: {e}"

    finally:
        if temp_path is not None:
            try:
                os.remove(temp_path)
            except OSError:
                pass  # best-effort cleanup of the temporary WAV

# Build the Gradio UI: an audio input wired to diarize, with plain-text output.
interface = gr.Interface(
    diarize,
    "audio",
    "text",
    title="Speaker Diarization",
    description="Upload an audio file (WAV, MP3, etc.) to detect speakers and their timestamps.",
)

# Launch the app only when this file is executed as a script.
if __name__ == "__main__":
    interface.launch()