agomberto committed on
Commit
f34f25d
·
1 Parent(s): 1aec125

:tada: update new version of the model

Browse files
config.json CHANGED
@@ -78,7 +78,7 @@
78
  "top_p": 1.0,
79
  "torch_dtype": null,
80
  "torchscript": false,
81
- "transformers_version": "4.29.2",
82
  "typical_p": 1.0,
83
  "use_bfloat16": false,
84
  "use_cache": false,
@@ -161,7 +161,7 @@
161
  "top_p": 1.0,
162
  "torch_dtype": null,
163
  "torchscript": false,
164
- "transformers_version": "4.29.2",
165
  "typical_p": 1.0,
166
  "use_bfloat16": false
167
  },
 
78
  "top_p": 1.0,
79
  "torch_dtype": null,
80
  "torchscript": false,
81
+ "transformers_version": "4.30.2",
82
  "typical_p": 1.0,
83
  "use_bfloat16": false,
84
  "use_cache": false,
 
161
  "top_p": 1.0,
162
  "torch_dtype": null,
163
  "torchscript": false,
164
+ "transformers_version": "4.30.2",
165
  "typical_p": 1.0,
166
  "use_bfloat16": false
167
  },
generation_config.json CHANGED
@@ -8,6 +8,6 @@
8
  "no_repeat_ngram_size": 3,
9
  "num_beams": 4,
10
  "pad_token_id": 1,
11
- "transformers_version": "4.29.2",
12
  "use_cache": false
13
  }
 
8
  "no_repeat_ngram_size": 3,
9
  "num_beams": 4,
10
  "pad_token_id": 1,
11
+ "transformers_version": "4.30.2",
12
  "use_cache": false
13
  }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecb2d4811686ae1fa5a5ddbece1088f23033f7ae89187930e91e4367f3af832c
3
+ size 6036958
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5040851d479f1cc732b7bc4266a943eb794c4672076efd0e67969c551c44372f
3
  size 2233126973
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c39317b40076bf60899b4514d6318b68b6e3621172b0356c452f95a4db8e031f
3
  size 2233126973
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0756790bb996e19575e28b3c5794bed812c7a56143b158c721c60574e44838a
3
+ size 14575
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac2f6dbce125c240e2f433875ddc84c2eed63df4c51523c9a034cc014ea71382
3
+ size 627
trainer_state.json ADDED
@@ -0,0 +1,144 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.4317134916782379,
3
+ "best_model_checkpoint": "./checkpoint-4000",
4
+ "epoch": 6.592501030078286,
5
+ "global_step": 4000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.82,
12
+ "learning_rate": 3.835643564356436e-05,
13
+ "loss": 1.3928,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.82,
18
+ "eval_cer": 0.15288597601847026,
19
+ "eval_loss": 0.7451776266098022,
20
+ "eval_runtime": 665.9721,
21
+ "eval_samples_per_second": 13.161,
22
+ "eval_steps_per_second": 0.823,
23
+ "eval_wer": 0.38850250902368166,
24
+ "step": 500
25
+ },
26
+ {
27
+ "epoch": 1.65,
28
+ "learning_rate": 3.6709570957095713e-05,
29
+ "loss": 0.6552,
30
+ "step": 1000
31
+ },
32
+ {
33
+ "epoch": 1.65,
34
+ "eval_cer": 0.11089595590973411,
35
+ "eval_loss": 0.5462419986724854,
36
+ "eval_runtime": 675.2942,
37
+ "eval_samples_per_second": 12.98,
38
+ "eval_steps_per_second": 0.811,
39
+ "eval_wer": 0.2981776564838454,
40
+ "step": 1000
41
+ },
42
+ {
43
+ "epoch": 2.47,
44
+ "learning_rate": 3.5059405940594064e-05,
45
+ "loss": 0.4677,
46
+ "step": 1500
47
+ },
48
+ {
49
+ "epoch": 2.47,
50
+ "eval_cer": 0.10123631488791242,
51
+ "eval_loss": 0.5031750202178955,
52
+ "eval_runtime": 658.2362,
53
+ "eval_samples_per_second": 13.316,
54
+ "eval_steps_per_second": 0.833,
55
+ "eval_wer": 0.28013029315960913,
56
+ "step": 1500
57
+ },
58
+ {
59
+ "epoch": 3.3,
60
+ "learning_rate": 3.3409240924092415e-05,
61
+ "loss": 0.3562,
62
+ "step": 2000
63
+ },
64
+ {
65
+ "epoch": 3.3,
66
+ "eval_cer": 0.0952111417293513,
67
+ "eval_loss": 0.4881753623485565,
68
+ "eval_runtime": 676.7933,
69
+ "eval_samples_per_second": 12.951,
70
+ "eval_steps_per_second": 0.81,
71
+ "eval_wer": 0.2703142882295977,
72
+ "step": 2000
73
+ },
74
+ {
75
+ "epoch": 4.12,
76
+ "learning_rate": 3.175907590759076e-05,
77
+ "loss": 0.2742,
78
+ "step": 2500
79
+ },
80
+ {
81
+ "epoch": 4.12,
82
+ "eval_cer": 0.08611007671110449,
83
+ "eval_loss": 0.45607951283454895,
84
+ "eval_runtime": 672.7042,
85
+ "eval_samples_per_second": 13.029,
86
+ "eval_steps_per_second": 0.815,
87
+ "eval_wer": 0.24729289550136455,
88
+ "step": 2500
89
+ },
90
+ {
91
+ "epoch": 4.94,
92
+ "learning_rate": 3.0108910891089113e-05,
93
+ "loss": 0.2047,
94
+ "step": 3000
95
+ },
96
+ {
97
+ "epoch": 4.94,
98
+ "eval_cer": 0.07996574067178074,
99
+ "eval_loss": 0.43779700994491577,
100
+ "eval_runtime": 670.3674,
101
+ "eval_samples_per_second": 13.075,
102
+ "eval_steps_per_second": 0.817,
103
+ "eval_wer": 0.236596531384805,
104
+ "step": 3000
105
+ },
106
+ {
107
+ "epoch": 5.77,
108
+ "learning_rate": 2.845874587458746e-05,
109
+ "loss": 0.1452,
110
+ "step": 3500
111
+ },
112
+ {
113
+ "epoch": 5.77,
114
+ "eval_cer": 0.07977210099054145,
115
+ "eval_loss": 0.4486931562423706,
116
+ "eval_runtime": 668.3535,
117
+ "eval_samples_per_second": 13.114,
118
+ "eval_steps_per_second": 0.82,
119
+ "eval_wer": 0.2334272383132318,
120
+ "step": 3500
121
+ },
122
+ {
123
+ "epoch": 6.59,
124
+ "learning_rate": 2.680858085808581e-05,
125
+ "loss": 0.1124,
126
+ "step": 4000
127
+ },
128
+ {
129
+ "epoch": 6.59,
130
+ "eval_cer": 0.0765323601698071,
131
+ "eval_loss": 0.4317134916782379,
132
+ "eval_runtime": 669.0454,
133
+ "eval_samples_per_second": 13.101,
134
+ "eval_steps_per_second": 0.819,
135
+ "eval_wer": 0.2277489215599965,
136
+ "step": 4000
137
+ }
138
+ ],
139
+ "max_steps": 12120,
140
+ "num_train_epochs": 20,
141
+ "total_flos": 6.878208895191142e+20,
142
+ "trial_name": null,
143
+ "trial_params": null
144
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:285f662b244cf0221eac8fbf1d07aebf10f2df8284a4689cc217fab5954a40f0
3
  size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be998148e7fb2d04bbcf0f3ee167cf3efff6718f9f789ec8e4a072fdb3a83554
3
  size 4027