Spaces:

ankush13r
/

faster-whisper

Running

Ankush Rana committed on Sep 22, 2024

Commit

88a8f61

1 Parent(s): 23dbd9b

change to largev3

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,7 +7,7 @@ import torch
 device = "cuda" if torch.cuda.is_available() else "cpu"
 torch_dtype = "float32"
-MODEL_NAME = "Systran/faster-whisper-medium"
 print("Loading model ...")
 model = WhisperModel(MODEL_NAME, compute_type=torch_dtype)
 print("Loading model done.")
@@ -23,6 +23,8 @@ def transcribe(inputs):
         # chunk_length=30,
         task="transcribe",
         word_timestamps=False,
     )
     text = ""
@@ -47,7 +49,7 @@ with gr.Blocks(theme=theme) as demo:
             input = gr.Audio(sources=["upload", "microphone"], type="filepath", label="Audio")
         with gr.Column(scale=1):
-            output = gr.Textbox(label="Output", lines=8)
     with gr.Row(variant="panel"):
             clear_btn = gr.Button("Clear")

 device = "cuda" if torch.cuda.is_available() else "cpu"
 torch_dtype = "float32"
+MODEL_NAME = "Systran/faster-whisper-large-v3"
 print("Loading model ...")
 model = WhisperModel(MODEL_NAME, compute_type=torch_dtype)
 print("Loading model done.")
         # chunk_length=30,
         task="transcribe",
         word_timestamps=False,
+        repetition_penalty=1.2,
+        without_timestamps=True
     )
     text = ""
             input = gr.Audio(sources=["upload", "microphone"], type="filepath", label="Audio")
         with gr.Column(scale=1):
+            output = gr.Textbox(label="Output")
     with gr.Row(variant="panel"):
             clear_btn = gr.Button("Clear")