alakxender committed on
Commit
cb3f68b
·
1 Parent(s): 700fda9
Files changed (1) hide show
  1. app.py +14 -14
app.py CHANGED
@@ -136,20 +136,20 @@ if __name__ == "__main__":
136
  torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
137
 
138
  MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
139
- # MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-cv" # Trained on Common Voice Data (Unknown Hours)
140
- # MODEL_NAME = "alakxender/whisper-small-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
141
- # MODEL_NAME = "alakxender/whisper-small-cv" # Trained on Common Voice Data (Unknown Hours)
142
- # MODEL_NAME = "alakxender/whisper-medium-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
143
- # MODEL_NAME = "alakxender/whisper-medium-cv" # Trained on Common Voice Data (Unknown Hours)
144
- # MODEL_NAME = "alakxender/whisper-large-v3-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
145
- # MODEL_NAME = "alakxender/whisper-large-v3-cv" # Trained on Common Voice Data (Unknown Hours)
146
- # MODEL_NAME = "alakxender/whisper-large-v3-calls-md" # Trained on phone calls (65 Hours)
147
- # MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-calls-md" # Trained on phone calls (65 Hours)
148
- # MODEL_NAME = "alakxender/wav2vec2-large-xlsr-calls-md" # Trained on phone calls (23 Hours)
149
- # MODEL_NAME = "alakxender/wav2vec2-large-xlsr-dv-syn-md" # Trained on 100% Synthetic Data (80 Hours)
150
- # MODEL_NAME = "alakxender/dhivehi-asr-full-ctc" # Trained on multiple datasets (350+ Hours)
151
- # MODEL_NAME = "alakxender/dhivehi-asr-full-ctc-v2" # Trained on multiple datasets (350+ Hours)
152
- # MODEL_NAME = "alakxender/dhivehi-asr-full-whisper-v3" # Trained on multiple datasets (350+ Hours)
153
 
154
  # Load model and processor with LM
155
  processor = Wav2Vec2ProcessorWithLM.from_pretrained(MODEL_NAME)
 
136
  torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
137
 
138
  MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
139
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-mms-1b-cv" # Trained on Common Voice Data (Unknown Hours)
140
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-small-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
141
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-small-cv" # Trained on Common Voice Data (Unknown Hours)
142
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-medium-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
143
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-medium-cv" # Trained on Common Voice Data (Unknown Hours)
144
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-large-v3-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
145
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-large-v3-cv" # Trained on Common Voice Data (Unknown Hours)
146
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-large-v3-calls-md" # Trained on phone calls (65 Hours)
147
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-mms-1b-calls-md" # Trained on phone calls (65 Hours)
148
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-xlsr-calls-md" # Trained on phone calls (23 Hours)
149
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-xlsr-dv-syn-md" # Trained on 100% Synthetic Data (80 Hours)
150
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/dhivehi-asr-full-ctc" # Trained on multiple datasets (350+ Hours)
151
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/dhivehi-asr-full-ctc-v2" # Trained on multiple datasets (350+ Hours)
152
+ # MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/dhivehi-asr-full-whisper-v3" # Trained on multiple datasets (350+ Hours)
153
 
154
  # Load model and processor with LM
155
  processor = Wav2Vec2ProcessorWithLM.from_pretrained(MODEL_NAME)