Spaces: Running on Zero
Commit
·
cb3f68b
1
Parent(s):
700fda9
ptlocal
Browse files
app.py
CHANGED
@@ -136,20 +136,20 @@ if __name__ == "__main__":
|
|
136 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
137 |
|
138 |
MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
|
139 |
-
# MODEL_NAME = "
|
140 |
-
# MODEL_NAME = "
|
141 |
-
# MODEL_NAME = "
|
142 |
-
# MODEL_NAME = "
|
143 |
-
# MODEL_NAME = "
|
144 |
-
# MODEL_NAME = "
|
145 |
-
# MODEL_NAME = "
|
146 |
-
# MODEL_NAME = "
|
147 |
-
# MODEL_NAME = "
|
148 |
-
# MODEL_NAME = "
|
149 |
-
# MODEL_NAME = "
|
150 |
-
# MODEL_NAME = "
|
151 |
-
# MODEL_NAME = "
|
152 |
-
# MODEL_NAME = "
|
153 |
|
154 |
# Load model and processor with LM
|
155 |
processor = Wav2Vec2ProcessorWithLM.from_pretrained(MODEL_NAME)
|
|
|
136 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
137 |
|
138 |
MODEL_NAME = "alakxender/wav2vec2-large-mms-1b-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
|
139 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-mms-1b-cv" # Trained on Common Voice Data (Unknown Hours)
|
140 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-small-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
|
141 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-small-cv" # Trained on Common Voice Data (Unknown Hours)
|
142 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-medium-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
|
143 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-medium-cv" # Trained on Common Voice Data (Unknown Hours)
|
144 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-large-v3-dv-syn-md" # Trained on 100% Synthetic Data (150 Hours)
|
145 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-large-v3-cv" # Trained on Common Voice Data (Unknown Hours)
|
146 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/whisper-large-v3-calls-md" # Trained on phone calls (65 Hours)
|
147 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-mms-1b-calls-md" # Trained on phone calls (65 Hours)
|
148 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-xlsr-calls-md" # Trained on phone calls (23 Hours)
|
149 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/wav2vec2-large-xlsr-dv-syn-md" # Trained on 100% Synthetic Data (80 Hours)
|
150 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/dhivehi-asr-full-ctc" # Trained on multiple datasets (350+ Hours)
|
151 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/dhivehi-asr-full-ctc-v2" # Trained on multiple datasets (350+ Hours)
|
152 |
+
# MODEL_NAME = "/home/rusputin/lab/audio/fine-tunes/dhivehi-asr-full-whisper-v3" # Trained on multiple datasets (350+ Hours)
|
153 |
|
154 |
# Load model and processor with LM
|
155 |
processor = Wav2Vec2ProcessorWithLM.from_pretrained(MODEL_NAME)
|