tensorboy committed on
Commit
08580da
·
verified ·
1 Parent(s): 77fdd41

Training in progress, step 10

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:daeea7778cdeda935a2e90f442518eb60512721cd10bce0921a80c47aa8f2543
3
  size 151061672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6449d1e6c9c423fb8849934a1549ffae7f8f17cfec3201f6fc3aa2a077782fa6
3
  size 151061672
runs/Jun25_21-12-28_bharatsahaiyak-test/events.out.tfevents.1719349949.bharatsahaiyak-test.990312.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edd4300438a7ad67abf772860cada59cd4255716e7200d824dbda51d7c17f72f
3
- size 6070
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29182ce5fbab9e6fcf4da9cfaf764d721c25d1412d041930b309a3de5b0a6875
3
+ size 6382
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37c1d71d4573028fde34dd156869c75306de202ae193d1b60195dcab72289f8d
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76aa8e1d1d3d0d745a1e6d6e9ca6f5ddf9f945a3ba698d9644e4cbe35394d28f
3
  size 5240
whisper-tiny-hi-checkpoint-1/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 69.98899144720129,
3
- "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120",
4
  "epoch": 6.25,
5
  "eval_steps": 40,
6
  "global_step": 200,
@@ -10,126 +10,126 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.625,
13
- "grad_norm": 10.95101547241211,
14
- "learning_rate": 9.200000000000002e-06,
15
- "loss": 2.3747,
16
  "step": 20
17
  },
18
  {
19
  "epoch": 1.25,
20
- "grad_norm": 7.747081279754639,
21
- "learning_rate": 8.2e-06,
22
- "loss": 1.2169,
23
  "step": 40
24
  },
25
  {
26
  "epoch": 1.25,
27
- "eval_loss": 1.0360029935836792,
28
- "eval_runtime": 574.5339,
29
- "eval_samples_per_second": 1.741,
30
- "eval_steps_per_second": 1.741,
31
- "eval_wer": 91.60809552036582,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 1.875,
36
- "grad_norm": 7.32460355758667,
37
- "learning_rate": 7.2000000000000005e-06,
38
- "loss": 0.9058,
39
  "step": 60
40
  },
41
  {
42
  "epoch": 2.5,
43
- "grad_norm": 6.835532188415527,
44
- "learning_rate": 6.200000000000001e-06,
45
- "loss": 0.7302,
46
  "step": 80
47
  },
48
  {
49
  "epoch": 2.5,
50
- "eval_loss": 0.7368654608726501,
51
- "eval_runtime": 549.562,
52
- "eval_samples_per_second": 1.82,
53
- "eval_steps_per_second": 1.82,
54
- "eval_wer": 79.80353967313066,
55
  "step": 80
56
  },
57
  {
58
  "epoch": 3.125,
59
- "grad_norm": 6.408384323120117,
60
- "learning_rate": 5.2e-06,
61
- "loss": 0.6453,
62
  "step": 100
63
  },
64
  {
65
  "epoch": 3.75,
66
- "grad_norm": 5.809150695800781,
67
- "learning_rate": 4.2000000000000004e-06,
68
- "loss": 0.5917,
69
  "step": 120
70
  },
71
  {
72
  "epoch": 3.75,
73
- "eval_loss": 0.6504533886909485,
74
- "eval_runtime": 548.8688,
75
- "eval_samples_per_second": 1.822,
76
- "eval_steps_per_second": 1.822,
77
- "eval_wer": 69.98899144720129,
78
  "step": 120
79
  },
80
  {
81
  "epoch": 4.375,
82
- "grad_norm": 5.724637508392334,
83
- "learning_rate": 3.2000000000000003e-06,
84
- "loss": 0.5356,
85
  "step": 140
86
  },
87
  {
88
  "epoch": 5.0,
89
- "grad_norm": 10.124310493469238,
90
- "learning_rate": 2.2e-06,
91
- "loss": 0.5156,
92
  "step": 160
93
  },
94
  {
95
  "epoch": 5.0,
96
- "eval_loss": 0.6157090663909912,
97
- "eval_runtime": 549.7895,
98
- "eval_samples_per_second": 1.819,
99
- "eval_steps_per_second": 1.819,
100
- "eval_wer": 70.4293335591498,
101
  "step": 160
102
  },
103
  {
104
  "epoch": 5.625,
105
- "grad_norm": 4.947811126708984,
106
- "learning_rate": 1.2000000000000002e-06,
107
- "loss": 0.4986,
108
  "step": 180
109
  },
110
  {
111
  "epoch": 6.25,
112
- "grad_norm": 4.541861057281494,
113
- "learning_rate": 2.0000000000000002e-07,
114
- "loss": 0.481,
115
  "step": 200
116
  },
117
  {
118
  "epoch": 6.25,
119
- "eval_loss": 0.6050636768341064,
120
- "eval_runtime": 552.964,
121
- "eval_samples_per_second": 1.808,
122
- "eval_steps_per_second": 1.808,
123
- "eval_wer": 70.03980015242611,
124
  "step": 200
125
  },
126
  {
127
  "epoch": 6.25,
128
  "step": 200,
129
  "total_flos": 1.5401574531072e+17,
130
- "train_loss": 0.8495243072509766,
131
- "train_runtime": 3592.94,
132
- "train_samples_per_second": 1.781,
133
  "train_steps_per_second": 0.056
134
  }
135
  ],
 
1
  {
2
+ "best_metric": 58.31498729889923,
3
+ "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-80",
4
  "epoch": 6.25,
5
  "eval_steps": 40,
6
  "global_step": 200,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.625,
13
+ "grad_norm": 8.544885635375977,
14
+ "learning_rate": 3.75e-05,
15
+ "loss": 1.8228,
16
  "step": 20
17
  },
18
  {
19
  "epoch": 1.25,
20
+ "grad_norm": 6.32118558883667,
21
+ "learning_rate": 3.75e-05,
22
+ "loss": 0.6803,
23
  "step": 40
24
  },
25
  {
26
  "epoch": 1.25,
27
+ "eval_loss": 0.6102083325386047,
28
+ "eval_runtime": 542.5987,
29
+ "eval_samples_per_second": 1.843,
30
+ "eval_steps_per_second": 1.843,
31
+ "eval_wer": 65.94411515664692,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 1.875,
36
+ "grad_norm": 6.4600510597229,
37
+ "learning_rate": 3.75e-05,
38
+ "loss": 0.4966,
39
  "step": 60
40
  },
41
  {
42
  "epoch": 2.5,
43
+ "grad_norm": 5.194849491119385,
44
+ "learning_rate": 3.75e-05,
45
+ "loss": 0.3649,
46
  "step": 80
47
  },
48
  {
49
  "epoch": 2.5,
50
+ "eval_loss": 0.5036975741386414,
51
+ "eval_runtime": 540.6408,
52
+ "eval_samples_per_second": 1.85,
53
+ "eval_steps_per_second": 1.85,
54
+ "eval_wer": 58.31498729889923,
55
  "step": 80
56
  },
57
  {
58
  "epoch": 3.125,
59
+ "grad_norm": 4.111001014709473,
60
+ "learning_rate": 3.75e-05,
61
+ "loss": 0.3075,
62
  "step": 100
63
  },
64
  {
65
  "epoch": 3.75,
66
+ "grad_norm": 4.358007431030273,
67
+ "learning_rate": 3.75e-05,
68
+ "loss": 0.2296,
69
  "step": 120
70
  },
71
  {
72
  "epoch": 3.75,
73
+ "eval_loss": 0.48966631293296814,
74
+ "eval_runtime": 538.04,
75
+ "eval_samples_per_second": 1.859,
76
+ "eval_steps_per_second": 1.859,
77
+ "eval_wer": 66.71464860287891,
78
  "step": 120
79
  },
80
  {
81
  "epoch": 4.375,
82
+ "grad_norm": 4.111566066741943,
83
+ "learning_rate": 3.75e-05,
84
+ "loss": 0.1811,
85
  "step": 140
86
  },
87
  {
88
  "epoch": 5.0,
89
+ "grad_norm": 6.702174186706543,
90
+ "learning_rate": 3.75e-05,
91
+ "loss": 0.1564,
92
  "step": 160
93
  },
94
  {
95
  "epoch": 5.0,
96
+ "eval_loss": 0.5130774974822998,
97
+ "eval_runtime": 529.7879,
98
+ "eval_samples_per_second": 1.888,
99
+ "eval_steps_per_second": 1.888,
100
+ "eval_wer": 65.34292972057578,
101
  "step": 160
102
  },
103
  {
104
  "epoch": 5.625,
105
+ "grad_norm": 3.0882856845855713,
106
+ "learning_rate": 3.75e-05,
107
+ "loss": 0.101,
108
  "step": 180
109
  },
110
  {
111
  "epoch": 6.25,
112
+ "grad_norm": 4.524318695068359,
113
+ "learning_rate": 3.75e-05,
114
+ "loss": 0.0905,
115
  "step": 200
116
  },
117
  {
118
  "epoch": 6.25,
119
+ "eval_loss": 0.5503659248352051,
120
+ "eval_runtime": 587.5545,
121
+ "eval_samples_per_second": 1.702,
122
+ "eval_steps_per_second": 1.702,
123
+ "eval_wer": 63.903471634208294,
124
  "step": 200
125
  },
126
  {
127
  "epoch": 6.25,
128
  "step": 200,
129
  "total_flos": 1.5401574531072e+17,
130
+ "train_loss": 0.44307032763957976,
131
+ "train_runtime": 3561.8571,
132
+ "train_samples_per_second": 1.797,
133
  "train_steps_per_second": 0.056
134
  }
135
  ],