Irpan committed on
Commit
7bc4048
·
1 Parent(s): ed17acd
Files changed (2) hide show
  1. app.py +2 -1
  2. asr.py +6 -6
app.py CHANGED
@@ -8,7 +8,7 @@ mms_transcribe = gr.Interface(
8
  inputs=[
9
  gr.Audio(),
10
  gr.Dropdown(
11
- choices=[model for model in asr.models_info] + ["Compare All Models"],
12
  label="Select a Model for ASR",
13
  value="ixxan/wav2vec2-large-mms-1b-uyghur-latin",
14
  interactive=True
@@ -54,6 +54,7 @@ tabbed_interface = gr.TabbedInterface(
54
  )
55
 
56
  with gr.Blocks() as demo:
 
57
  tabbed_interface.render()
58
 
59
  if __name__ == "__main__":
 
8
  inputs=[
9
  gr.Audio(),
10
  gr.Dropdown(
11
+ choices=[model for model in asr.models_info],
12
  label="Select a Model for ASR",
13
  value="ixxan/wav2vec2-large-mms-1b-uyghur-latin",
14
  interactive=True
 
54
  )
55
 
56
  with gr.Blocks() as demo:
57
+ gr.Markdown("Comparision of STT and TTS models for Uyghur language.")
58
  tabbed_interface.render()
59
 
60
  if __name__ == "__main__":
asr.py CHANGED
@@ -19,6 +19,12 @@ models_info = {
19
  "ctc_model": False,
20
  "arabic_script": False
21
  },
 
 
 
 
 
 
22
  "ixxan/whisper-small-thugy20": {
23
  "processor": AutoProcessor.from_pretrained("ixxan/whisper-small-thugy20"),
24
  "model": AutoModelForSpeechSeq2Seq.from_pretrained("ixxan/whisper-small-thugy20"),
@@ -31,12 +37,6 @@ models_info = {
31
  "ctc_model": False,
32
  "arabic_script": False
33
  },
34
- "Meta-MMS": {
35
- "processor": AutoProcessor.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic'),
36
- "model": AutoModelForCTC.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic', ignore_mismatched_sizes=True),
37
- "ctc_model": True,
38
- "arabic_script": True
39
- },
40
  "ixxan/wav2vec2-large-mms-1b-uyghur-latin": {
41
  "processor": Wav2Vec2Processor.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),
42
  "model": Wav2Vec2ForCTC.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),
 
19
  "ctc_model": False,
20
  "arabic_script": False
21
  },
22
+ "Meta-MMS-Uyghur": {
23
+ "processor": AutoProcessor.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic'),
24
+ "model": AutoModelForCTC.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic', ignore_mismatched_sizes=True),
25
+ "ctc_model": True,
26
+ "arabic_script": True
27
+ },
28
  "ixxan/whisper-small-thugy20": {
29
  "processor": AutoProcessor.from_pretrained("ixxan/whisper-small-thugy20"),
30
  "model": AutoModelForSpeechSeq2Seq.from_pretrained("ixxan/whisper-small-thugy20"),
 
37
  "ctc_model": False,
38
  "arabic_script": False
39
  },
 
 
 
 
 
 
40
  "ixxan/wav2vec2-large-mms-1b-uyghur-latin": {
41
  "processor": Wav2Vec2Processor.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),
42
  "model": Wav2Vec2ForCTC.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),