first
Browse files- run.sh +3 -2
- run_speech_recognition_ctc.py +1 -1
run.sh
CHANGED
@@ -1,10 +1,11 @@
|
|
1 |
python run_speech_recognition_ctc.py \
|
2 |
--dataset_name="NbAiLab/NPSC" \
|
3 |
--model_name_or_path="facebook/wav2vec2-xls-r-300m" \
|
4 |
-
--
|
|
|
5 |
--output_dir="./" \
|
6 |
--overwrite_output_dir \
|
7 |
-
--num_train_epochs="
|
8 |
--per_device_train_batch_size="8" \
|
9 |
--per_device_eval_batch_size="8" \
|
10 |
--gradient_accumulation_steps="4" \
|
|
|
1 |
python run_speech_recognition_ctc.py \
|
2 |
--dataset_name="NbAiLab/NPSC" \
|
3 |
--model_name_or_path="facebook/wav2vec2-xls-r-300m" \
|
4 |
+
--hub_model_id="NbAiLab/wav2vec2-xlsr-300M-NPSC" \
|
5 |
+
--dataset_config_name="16K_mp3" \
|
6 |
--output_dir="./" \
|
7 |
--overwrite_output_dir \
|
8 |
+
--num_train_epochs="75" \
|
9 |
--per_device_train_batch_size="8" \
|
10 |
--per_device_eval_batch_size="8" \
|
11 |
--gradient_accumulation_steps="4" \
|
run_speech_recognition_ctc.py
CHANGED
@@ -393,7 +393,7 @@ def main():
|
|
393 |
|
394 |
# Pre-processing dataset
|
395 |
import re
|
396 |
-
|
397 |
return not re.search("\d|<inaudible>", entry["text"], flags=re.IGNORECASE)
|
398 |
|
399 |
def filter_nynorsk(entry):
|
|
|
393 |
|
394 |
# Pre-processing dataset
|
395 |
import re
|
396 |
+
def filter_inaudible(entry):
|
397 |
return not re.search("\d|<inaudible>", entry["text"], flags=re.IGNORECASE)
|
398 |
|
399 |
def filter_nynorsk(entry):
|