Spaces:

marioluciofjr
/

voxsense

Sleeping

App Files Files Community

marioluciofjr committed on Sep 27, 2024

Commit

8d4e3a2

verified ·

1 Parent(s): beacf7a

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -15

app.py CHANGED Viewed

@@ -2,44 +2,56 @@ import gradio as gr
 from transformers import pipeline
 import torch
 # Load the Whisper model used for audio transcription
 transcriber = pipeline(
     task="automatic-speech-recognition",
     model="openai/whisper-small",
-    device=torch.device('cuda' if torch.cuda.is_available() else 'cpu')  # CUDA when available, otherwise CPU
 )
-# Load the sentiment-analysis model for Portuguese
-sentiment_analyzer = pipeline(
-    "sentiment-analysis",
-    model="nlptown/bert-base-multilingual-uncased-sentiment"
 )
 def transcribe_and_analyze(audio_file):
     """
-    Take an audio file, transcribe it, and analyze the sentiment.
-
-    Returns a (transcription, sentiment_output) tuple; sentiment_output is the
-    first result's label followed by its score formatted to two decimals.
     """
     # Transcribe the audio
     transcription = transcriber(audio_file)["text"]
-    # Analyze the sentiment of the transcription (only the first result is used)
-    sentiment = sentiment_analyzer(transcription)[0]
-    # Format the sentiment output
-    sentiment_output = f"{sentiment['label']} (confiança: {sentiment['score']:.2f})"
-    return transcription, sentiment_output
 # Build the Gradio interface: one audio input, two text outputs
 interface = gr.Interface(
     fn=transcribe_and_analyze,
-    inputs=gr.Audio(type="filepath", label="Faça upload do seu áudio"), # Removed source argument
     outputs=[
         gr.Textbox(label="Transcrição do Áudio"),
-        gr.Textbox(label="Análise de Sentimento")
     ],
-    title="Transcrição e Análise de Sentimentos de Áudio",
-    description="Envie um arquivo de áudio de até 1 hora para transcrição e análise de sentimentos.",
     theme="default"
 )

 from transformers import pipeline
 import torch
+# Check whether a GPU is available; the same device is shared by both pipelines below
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 # Load the Whisper model used for audio transcription
 transcriber = pipeline(
     task="automatic-speech-recognition",
     model="openai/whisper-small",
+    device=device
 )
+# Load the zero-shot classification pipeline
+classifier = pipeline(
+    "zero-shot-classification",
+    model="joeddav/xlm-roberta-large-xnli",
+    device=device
 )
 def transcribe_and_analyze(audio_file):
     """
+    Take an audio file, transcribe it, and analyze the emotions present.
+
+    Returns a (transcription, emotion_output) tuple; emotion_output holds one
+    "label: score" line per candidate emotion, with scores at two decimals.
     """
     # Transcribe the audio
     transcription = transcriber(audio_file)["text"]
+    # Candidate emotion labels for the classification (Portuguese strings, passed as-is)
+    emotions = ["medo", "rancor", "ódio", "raiva", "felicidade", "amor", "tristeza", "ansiedade", "inveja", "sarcasmo", "vergonha"]
+    # Run zero-shot classification on the transcription
+    # NOTE(review): the transcription is passed through unchecked, even if empty — confirm the classifier accepts that
+    classification = classifier(transcription, emotions, multi_label=True)
+    # Format the results as "label: score" strings
+    results = []
+    for label, score in zip(classification["labels"], classification["scores"]):
+        results.append(f"{label}: {score:.2f}")
+    # Join the results into a single newline-separated string
+    emotion_output = "\n".join(results)
+    return transcription, emotion_output
 # Build the Gradio interface: one audio input, two text outputs
 interface = gr.Interface(
     fn=transcribe_and_analyze,
+    inputs=gr.Audio(type="filepath", label="Faça upload do seu áudio"),
     outputs=[
         gr.Textbox(label="Transcrição do Áudio"),
+        gr.Textbox(label="Emoções Detectadas")
     ],
+    title="TranscriSentimento",
+    description="Envie um arquivo de áudio de até 1 hora para transcrição e análise de emoções.",
     theme="default"
 )