Ubuntu
committed on
Commit
·
0774dc2
1
Parent(s):
a3ebb39
Revert "Training in progress, step 100"
Browse files
This reverts commit 321b86e9b1b93e44dc9f33b312747e627d0113d1.
- config.json +1 -1
- model.safetensors +1 -1
- run_cmn.sh +10 -10
- runs/Jan23_05-57-07_ip-172-31-68-44/events.out.tfevents.1705989446.ip-172-31-68-44.20295.0 +0 -3
- tokenizer.json +6 -6
- training_args.bin +1 -1
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"apply_spec_augment": false,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "vasista22/whisper-hindi-small",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"apply_spec_augment": false,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 966995080
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96793a88a265c07ef4184ca8fe117b013d58b2b7c85cc356aa07bbb9dcbcf3a6
|
3 |
size 966995080
|
run_cmn.sh
CHANGED
@@ -1,23 +1,23 @@
|
|
1 |
python3 run_speech_recognition_seq2seq_streaming.py \
|
2 |
-
--model_name_or_path="
|
3 |
--dataset_name="mozilla-foundation/common_voice_16_0" \
|
4 |
-
--dataset_config_name="
|
5 |
-
--language="
|
6 |
--train_split_name="train+validation" \
|
7 |
--eval_split_name="test" \
|
8 |
-
--model_index_name="Whisper Base
|
9 |
-
--max_steps="
|
10 |
--output_dir="./" \
|
11 |
--per_device_train_batch_size="16" \
|
12 |
-
--per_device_eval_batch_size="
|
13 |
--gradient_accumulation_steps=4 \
|
14 |
--logging_steps="25" \
|
15 |
-
--learning_rate="
|
16 |
-
--warmup_steps="
|
17 |
--evaluation_strategy="steps" \
|
18 |
-
--eval_steps="
|
19 |
--save_strategy="steps" \
|
20 |
-
--save_steps="
|
21 |
--generation_max_length="225" \
|
22 |
--length_column_name="input_length" \
|
23 |
--max_duration_in_seconds="30" \
|
|
|
1 |
python3 run_speech_recognition_seq2seq_streaming.py \
|
2 |
+
--model_name_or_path="vasista22/whisper-hindi-small" \
|
3 |
--dataset_name="mozilla-foundation/common_voice_16_0" \
|
4 |
+
--dataset_config_name="hi" \
|
5 |
+
--language="hindi" \
|
6 |
--train_split_name="train+validation" \
|
7 |
--eval_split_name="test" \
|
8 |
+
--model_index_name="Whisper Base Bengali" \
|
9 |
+
--max_steps="100" \
|
10 |
--output_dir="./" \
|
11 |
--per_device_train_batch_size="16" \
|
12 |
+
--per_device_eval_batch_size="16" \
|
13 |
--gradient_accumulation_steps=4 \
|
14 |
--logging_steps="25" \
|
15 |
+
--learning_rate="1e-6" \
|
16 |
+
--warmup_steps="10" \
|
17 |
--evaluation_strategy="steps" \
|
18 |
+
--eval_steps="50" \
|
19 |
--save_strategy="steps" \
|
20 |
+
--save_steps="50" \
|
21 |
--generation_max_length="225" \
|
22 |
--length_column_name="input_length" \
|
23 |
--max_duration_in_seconds="30" \
|
runs/Jan23_05-57-07_ip-172-31-68-44/events.out.tfevents.1705989446.ip-172-31-68-44.20295.0
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:0486f429675408de46cc06040fcd0b4163ab6cde2d89a5eebc319fd79fdd9b7f
|
3 |
-
size 6071
|
|
|
|
|
|
|
|
tokenizer.json
CHANGED
@@ -985,7 +985,7 @@
|
|
985 |
},
|
986 |
{
|
987 |
"SpecialToken": {
|
988 |
-
"id": "<|
|
989 |
"type_id": 0
|
990 |
}
|
991 |
},
|
@@ -1023,7 +1023,7 @@
|
|
1023 |
},
|
1024 |
{
|
1025 |
"SpecialToken": {
|
1026 |
-
"id": "<|
|
1027 |
"type_id": 0
|
1028 |
}
|
1029 |
},
|
@@ -1068,13 +1068,13 @@
|
|
1068 |
"<|endoftext|>"
|
1069 |
]
|
1070 |
},
|
1071 |
-
"<|
|
1072 |
-
"id": "<|
|
1073 |
"ids": [
|
1074 |
-
|
1075 |
],
|
1076 |
"tokens": [
|
1077 |
-
"<|
|
1078 |
]
|
1079 |
},
|
1080 |
"<|notimestamps|>": {
|
|
|
985 |
},
|
986 |
{
|
987 |
"SpecialToken": {
|
988 |
+
"id": "<|hi|>",
|
989 |
"type_id": 0
|
990 |
}
|
991 |
},
|
|
|
1023 |
},
|
1024 |
{
|
1025 |
"SpecialToken": {
|
1026 |
+
"id": "<|hi|>",
|
1027 |
"type_id": 0
|
1028 |
}
|
1029 |
},
|
|
|
1068 |
"<|endoftext|>"
|
1069 |
]
|
1070 |
},
|
1071 |
+
"<|hi|>": {
|
1072 |
+
"id": "<|hi|>",
|
1073 |
"ids": [
|
1074 |
+
50276
|
1075 |
],
|
1076 |
"tokens": [
|
1077 |
+
"<|hi|>"
|
1078 |
]
|
1079 |
},
|
1080 |
"<|notimestamps|>": {
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4792
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:982b5193e750d2177a9de84e737d1bca6d1f68d33c76512f2aec4c722e52b389
|
3 |
size 4792
|