Spaces:

oza75
/

bambara-asr

Sleeping

oza75 committed on Feb 26

Commit

ad4bd3d

verified ·

1 Parent(s): 11cbb5f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -40,6 +40,7 @@ revision = None
 #model_checkpoint = "oza75/bm-whisper-large-turbo-v4"
 #model_checkpoint = "oza75/bm-whisper-large-v3-base"
 model_checkpoint = "oza75/bm-whisper-large-v3-sft-3"
 # language = "sundanese"
 # Load the custom tokenizer designed for Bambara and the ASR model
@@ -47,7 +48,7 @@ model_checkpoint = "oza75/bm-whisper-large-v3-sft-3"
 tokenizer = WhisperTokenizer.from_pretrained(model_checkpoint, device=device)
 pipe = pipeline("automatic-speech-recognition", model=model_checkpoint, tokenizer=tokenizer, device=device, revision=revision)
-LANGUAGES = {"bambara": "sundanese", "french": "french", "english": "english"}
 def resample_audio(audio_path, target_sample_rate=16000):
     """

 #model_checkpoint = "oza75/bm-whisper-large-turbo-v4"
 #model_checkpoint = "oza75/bm-whisper-large-v3-base"
 model_checkpoint = "oza75/bm-whisper-large-v3-sft-3"
+model_checkpoint = "djelia/djelia-whisper-v2"
 # language = "sundanese"
 # Load the custom tokenizer designed for Bambara and the ASR model
 tokenizer = WhisperTokenizer.from_pretrained(model_checkpoint, device=device)
 pipe = pipeline("automatic-speech-recognition", model=model_checkpoint, tokenizer=tokenizer, device=device, revision=revision)
+LANGUAGES = {"bambara": "french", "french": "french", "english": "english"}
 def resample_audio(audio_path, target_sample_rate=16000):
     """