Spaces:
Running
Running
Irpan
committed on
Commit
·
7bc4048
1
Parent(s):
ed17acd
asr
Browse files
app.py
CHANGED
@@ -8,7 +8,7 @@ mms_transcribe = gr.Interface(
|
|
8 |
inputs=[
|
9 |
gr.Audio(),
|
10 |
gr.Dropdown(
|
11 |
-
choices=[model for model in asr.models_info]
|
12 |
label="Select a Model for ASR",
|
13 |
value="ixxan/wav2vec2-large-mms-1b-uyghur-latin",
|
14 |
interactive=True
|
@@ -54,6 +54,7 @@ tabbed_interface = gr.TabbedInterface(
|
|
54 |
)
|
55 |
|
56 |
with gr.Blocks() as demo:
|
|
|
57 |
tabbed_interface.render()
|
58 |
|
59 |
if __name__ == "__main__":
|
|
|
8 |
inputs=[
|
9 |
gr.Audio(),
|
10 |
gr.Dropdown(
|
11 |
+
choices=[model for model in asr.models_info],
|
12 |
label="Select a Model for ASR",
|
13 |
value="ixxan/wav2vec2-large-mms-1b-uyghur-latin",
|
14 |
interactive=True
|
|
|
54 |
)
|
55 |
|
56 |
with gr.Blocks() as demo:
|
57 |
+
gr.Markdown("Comparision of STT and TTS models for Uyghur language.")
|
58 |
tabbed_interface.render()
|
59 |
|
60 |
if __name__ == "__main__":
|
asr.py
CHANGED
@@ -19,6 +19,12 @@ models_info = {
|
|
19 |
"ctc_model": False,
|
20 |
"arabic_script": False
|
21 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
22 |
"ixxan/whisper-small-thugy20": {
|
23 |
"processor": AutoProcessor.from_pretrained("ixxan/whisper-small-thugy20"),
|
24 |
"model": AutoModelForSpeechSeq2Seq.from_pretrained("ixxan/whisper-small-thugy20"),
|
@@ -31,12 +37,6 @@ models_info = {
|
|
31 |
"ctc_model": False,
|
32 |
"arabic_script": False
|
33 |
},
|
34 |
-
"Meta-MMS": {
|
35 |
-
"processor": AutoProcessor.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic'),
|
36 |
-
"model": AutoModelForCTC.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic', ignore_mismatched_sizes=True),
|
37 |
-
"ctc_model": True,
|
38 |
-
"arabic_script": True
|
39 |
-
},
|
40 |
"ixxan/wav2vec2-large-mms-1b-uyghur-latin": {
|
41 |
"processor": Wav2Vec2Processor.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),
|
42 |
"model": Wav2Vec2ForCTC.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),
|
|
|
19 |
"ctc_model": False,
|
20 |
"arabic_script": False
|
21 |
},
|
22 |
+
"Meta-MMS-Uyghur": {
|
23 |
+
"processor": AutoProcessor.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic'),
|
24 |
+
"model": AutoModelForCTC.from_pretrained("facebook/mms-1b-all", target_lang='uig-script_arabic', ignore_mismatched_sizes=True),
|
25 |
+
"ctc_model": True,
|
26 |
+
"arabic_script": True
|
27 |
+
},
|
28 |
"ixxan/whisper-small-thugy20": {
|
29 |
"processor": AutoProcessor.from_pretrained("ixxan/whisper-small-thugy20"),
|
30 |
"model": AutoModelForSpeechSeq2Seq.from_pretrained("ixxan/whisper-small-thugy20"),
|
|
|
37 |
"ctc_model": False,
|
38 |
"arabic_script": False
|
39 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
40 |
"ixxan/wav2vec2-large-mms-1b-uyghur-latin": {
|
41 |
"processor": Wav2Vec2Processor.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),
|
42 |
"model": Wav2Vec2ForCTC.from_pretrained("ixxan/wav2vec2-large-mms-1b-uyghur-latin", target_lang='uig-script_latin'),
|