hanasim committed on
Commit
dbfa988
1 Parent(s): cd34bd8

End of training

Browse files
README.md CHANGED
@@ -1,39 +1,42 @@
1
  ---
 
 
2
  license: apache-2.0
3
  base_model: openai/whisper-base
4
  tags:
 
5
  - generated_from_trainer
6
  datasets:
7
- - common_voice_16_0
8
  metrics:
9
  - wer
10
  model-index:
11
- - name: breeze-listen-dsw-base-te
12
  results:
13
  - task:
14
  name: Automatic Speech Recognition
15
  type: automatic-speech-recognition
16
  dataset:
17
- name: common_voice_16_0
18
- type: common_voice_16_0
19
  config: te
20
  split: test
21
  args: te
22
  metrics:
23
  - name: Wer
24
  type: wer
25
- value: 90.65934065934066
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
  should probably proofread and complete it, then remove this comment. -->
30
 
31
- # breeze-listen-dsw-base-te
32
 
33
- This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the common_voice_16_0 dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 2.2441
36
- - Wer: 90.6593
37
 
38
  ## Model description
39
 
 
1
  ---
2
+ language:
3
+ - te
4
  license: apache-2.0
5
  base_model: openai/whisper-base
6
  tags:
7
+ - whisper-event
8
  - generated_from_trainer
9
  datasets:
10
+ - mozilla-foundation/common_voice_16_0
11
  metrics:
12
  - wer
13
  model-index:
14
+ - name: Breeze DSW Telugu - base
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
18
  type: automatic-speech-recognition
19
  dataset:
20
+ name: mozilla-foundation/common_voice_16_0 te
21
+ type: mozilla-foundation/common_voice_16_0
22
  config: te
23
  split: test
24
  args: te
25
  metrics:
26
  - name: Wer
27
  type: wer
28
+ value: 89.28571428571429
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
32
  should probably proofread and complete it, then remove this comment. -->
33
 
34
+ # Breeze DSW Telugu - base
35
 
36
+ This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the mozilla-foundation/common_voice_16_0 te dataset.
37
  It achieves the following results on the evaluation set:
38
+ - Loss: 2.0469
39
+ - Wer: 89.2857
40
 
41
  ## Model description
42
 
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 199.0,
3
+ "eval_loss": 2.046875,
4
+ "eval_runtime": 53.1669,
5
+ "eval_samples_per_second": 0.508,
6
+ "eval_steps_per_second": 0.038,
7
+ "eval_wer": 89.28571428571429,
8
+ "train_loss": 0.0,
9
+ "train_runtime": 16.6622,
10
+ "train_samples_per_second": 3841.032,
11
+ "train_steps_per_second": 120.032
12
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 199.0,
3
+ "eval_loss": 2.046875,
4
+ "eval_runtime": 53.1669,
5
+ "eval_samples_per_second": 0.508,
6
+ "eval_steps_per_second": 0.038,
7
+ "eval_wer": 89.28571428571429
8
+ }
runs/Jan18_11-19-00_knight/events.out.tfevents.1705573270.knight.157497.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8241354c2c5f8e8862d9e697ecc821956d30e5ea83b0355efa9cb2e92e683f8d
3
+ size 406
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 199.0,
3
+ "train_loss": 0.0,
4
+ "train_runtime": 16.6622,
5
+ "train_samples_per_second": 3841.032,
6
+ "train_steps_per_second": 120.032
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,144 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 89.28571428571429,
3
+ "best_model_checkpoint": "/cosmos/home/sp-operator/ai/training/models/huggingface/scripts/../breeze-listen-dsw-base-te/checkpoint-200",
4
+ "epoch": 199.001,
5
+ "eval_steps": 200,
6
+ "global_step": 400,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 12.0,
13
+ "learning_rate": 4.973833272194737e-06,
14
+ "loss": 1.7314,
15
+ "step": 25
16
+ },
17
+ {
18
+ "epoch": 24.0,
19
+ "learning_rate": 6.195318418690893e-06,
20
+ "loss": 1.0852,
21
+ "step": 50
22
+ },
23
+ {
24
+ "epoch": 37.0,
25
+ "learning_rate": 6.881634451095711e-06,
26
+ "loss": 0.4273,
27
+ "step": 75
28
+ },
29
+ {
30
+ "epoch": 49.0,
31
+ "learning_rate": 7.361221988663844e-06,
32
+ "loss": 0.0907,
33
+ "step": 100
34
+ },
35
+ {
36
+ "epoch": 62.0,
37
+ "learning_rate": 7.730207550743121e-06,
38
+ "loss": 0.0175,
39
+ "step": 125
40
+ },
41
+ {
42
+ "epoch": 74.0,
43
+ "learning_rate": 8.03016458599496e-06,
44
+ "loss": 0.0032,
45
+ "step": 150
46
+ },
47
+ {
48
+ "epoch": 87.0,
49
+ "learning_rate": 8.282894746203441e-06,
50
+ "loss": 0.0011,
51
+ "step": 175
52
+ },
53
+ {
54
+ "epoch": 99.0,
55
+ "learning_rate": 8.501266121799902e-06,
56
+ "loss": 0.0007,
57
+ "step": 200
58
+ },
59
+ {
60
+ "epoch": 99.0,
61
+ "eval_loss": 2.046875,
62
+ "eval_runtime": 63.8247,
63
+ "eval_samples_per_second": 0.423,
64
+ "eval_steps_per_second": 0.031,
65
+ "eval_wer": 89.28571428571429,
66
+ "step": 200
67
+ },
68
+ {
69
+ "epoch": 112.0,
70
+ "learning_rate": 8.693512601774437e-06,
71
+ "loss": 0.0005,
72
+ "step": 225
73
+ },
74
+ {
75
+ "epoch": 124.0,
76
+ "learning_rate": 8.865222471593567e-06,
77
+ "loss": 0.0004,
78
+ "step": 250
79
+ },
80
+ {
81
+ "epoch": 137.0,
82
+ "learning_rate": 9.020362953730323e-06,
83
+ "loss": 0.0003,
84
+ "step": 275
85
+ },
86
+ {
87
+ "epoch": 149.0,
88
+ "learning_rate": 9.161852281961698e-06,
89
+ "loss": 0.0003,
90
+ "step": 300
91
+ },
92
+ {
93
+ "epoch": 162.0,
94
+ "learning_rate": 9.29189975311636e-06,
95
+ "loss": 0.0002,
96
+ "step": 325
97
+ },
98
+ {
99
+ "epoch": 174.0,
100
+ "learning_rate": 9.412218256259678e-06,
101
+ "loss": 0.0002,
102
+ "step": 350
103
+ },
104
+ {
105
+ "epoch": 187.0,
106
+ "learning_rate": 9.524162683365145e-06,
107
+ "loss": 0.0002,
108
+ "step": 375
109
+ },
110
+ {
111
+ "epoch": 199.0,
112
+ "learning_rate": 9.62882322733502e-06,
113
+ "loss": 0.0002,
114
+ "step": 400
115
+ },
116
+ {
117
+ "epoch": 199.0,
118
+ "eval_loss": 2.244140625,
119
+ "eval_runtime": 56.1817,
120
+ "eval_samples_per_second": 0.481,
121
+ "eval_steps_per_second": 0.036,
122
+ "eval_wer": 90.65934065934066,
123
+ "step": 400
124
+ },
125
+ {
126
+ "epoch": 199.0,
127
+ "step": 400,
128
+ "total_flos": 5.059079773670605e+17,
129
+ "train_loss": 0.0,
130
+ "train_runtime": 16.6622,
131
+ "train_samples_per_second": 3841.032,
132
+ "train_steps_per_second": 120.032
133
+ }
134
+ ],
135
+ "logging_steps": 25,
136
+ "max_steps": 2000,
137
+ "num_input_tokens_seen": 0,
138
+ "num_train_epochs": 9223372036854775807,
139
+ "save_steps": 200,
140
+ "total_flos": 5.059079773670605e+17,
141
+ "train_batch_size": 32,
142
+ "trial_name": null,
143
+ "trial_params": null
144
+ }