StevenChen16 committed on
Commit
5855353
·
1 Parent(s): 69b1e14

second update

Browse files
Files changed (1) hide show
  1. app.py +16 -17
app.py CHANGED
@@ -1,23 +1,22 @@
1
  import gradio as gr
2
  import whisperx
3
- import whisper
4
 
5
- def transcribe(audio_file):
6
- device = "cuda" if torch.cuda.is_available() else "cpu"
7
 
8
- # Transcribe with original Whisper
9
- model = whisper.load_model("large", device)
10
- result = model.transcribe(audio_file)
 
11
 
12
- # Load alignment model and metadata
13
- model_a, metadata = whisperx.load_align_model(language_code=result["language"], device=device)
 
 
 
 
 
 
14
 
15
- # Align Whisper output
16
- result_aligned = whisperx.align(result["segments"], model_a, metadata, audio_file, device)
17
-
18
- return {"aligned": result_aligned["segments"], "word_segments": result_aligned["word_segments"]}
19
-
20
- inputs = gr.inputs.Audio(source="upload", type="filepath")
21
- outputs = gr.outputs.JSON()
22
-
23
- gr.Interface(fn=transcribe, inputs=inputs, outputs=outputs).launch()
 
1
  import gradio as gr
2
  import whisperx
 
3
 
4
+ # 加载WhisperX模型
5
+ model = whisperx.load_model("base", device="cpu") # 如果有GPU,可将"cpu"改为"cuda"
6
 
7
+ def transcribe(audio_path):
8
+ # 使用WhisperX进行转录
9
+ result = model.transcribe(audio_path)
10
+ return result['text']
11
 
12
+ # 创建Gradio接口
13
+ iface = gr.Interface(
14
+ fn=transcribe,
15
+ inputs=gr.Audio(source="upload", type="filepath"),
16
+ outputs="text",
17
+ title="WhisperX 语音转文字",
18
+ description="上传音频文件,使用WhisperX模型进行转录。"
19
+ )
20
 
21
+ if __name__ == "__main__":
22
+ iface.launch()