JEdward7777 commited on
Commit
18af02a
1 Parent(s): 33e472c

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 39.67,
3
  "eval_accuracy": 1.0,
4
- "eval_loss": 0.22120876610279083,
5
- "eval_runtime": 1.4551,
6
- "eval_samples_per_second": 13.745,
7
- "eval_steps_per_second": 0.687,
8
- "total_flos": 1.7187351594113434e+17,
9
- "train_loss": 0.9913474082946777,
10
- "train_runtime": 823.5099,
11
- "train_samples_per_second": 8.452,
12
- "train_steps_per_second": 0.049
13
  }
 
1
  {
2
  "epoch": 39.67,
3
  "eval_accuracy": 1.0,
4
+ "eval_loss": 0.5916178226470947,
5
+ "eval_runtime": 1.6168,
6
+ "eval_samples_per_second": 13.607,
7
+ "eval_steps_per_second": 0.619,
8
+ "total_flos": 1.893243704668324e+17,
9
+ "train_loss": 1.1570292234420776,
10
+ "train_runtime": 934.4965,
11
+ "train_samples_per_second": 8.218,
12
+ "train_steps_per_second": 0.043
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 39.67,
3
  "eval_accuracy": 1.0,
4
- "eval_loss": 0.22120876610279083,
5
- "eval_runtime": 1.4551,
6
- "eval_samples_per_second": 13.745,
7
- "eval_steps_per_second": 0.687
8
  }
 
1
  {
2
  "epoch": 39.67,
3
  "eval_accuracy": 1.0,
4
+ "eval_loss": 0.5916178226470947,
5
+ "eval_runtime": 1.6168,
6
+ "eval_samples_per_second": 13.607,
7
+ "eval_steps_per_second": 0.619
8
  }
runs/Sep06_20-04-48_220e6d6423e1/events.out.tfevents.1662496955.220e6d6423e1.72.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7a660ba04be390e39ee0c1f5bca30acb1452cf7dd1f7b813566d19cc6afd55e
3
+ size 357
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 39.67,
3
- "total_flos": 1.7187351594113434e+17,
4
- "train_loss": 0.9913474082946777,
5
- "train_runtime": 823.5099,
6
- "train_samples_per_second": 8.452,
7
- "train_steps_per_second": 0.049
8
  }
 
1
  {
2
  "epoch": 39.67,
3
+ "total_flos": 1.893243704668324e+17,
4
+ "train_loss": 1.1570292234420776,
5
+ "train_runtime": 934.4965,
6
+ "train_samples_per_second": 8.218,
7
+ "train_steps_per_second": 0.043
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_metric": 1.0,
3
- "best_model_checkpoint": "delivery_truck_classification/checkpoint-21",
4
  "epoch": 39.666666666666664,
5
  "global_step": 40,
6
  "is_hyper_param_search": false,
@@ -9,389 +9,389 @@
9
  "log_history": [
10
  {
11
  "epoch": 0.67,
12
- "eval_accuracy": 0.3,
13
- "eval_loss": 1.7282015085220337,
14
- "eval_runtime": 1.367,
15
- "eval_samples_per_second": 14.631,
16
- "eval_steps_per_second": 0.732,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 1.67,
21
- "eval_accuracy": 0.3,
22
- "eval_loss": 1.678601622581482,
23
- "eval_runtime": 1.4785,
24
- "eval_samples_per_second": 13.528,
25
- "eval_steps_per_second": 0.676,
26
  "step": 2
27
  },
28
  {
29
  "epoch": 2.67,
30
- "eval_accuracy": 0.35,
31
- "eval_loss": 1.58110773563385,
32
- "eval_runtime": 1.5261,
33
- "eval_samples_per_second": 13.105,
34
- "eval_steps_per_second": 0.655,
35
  "step": 3
36
  },
37
  {
38
  "epoch": 3.67,
39
- "eval_accuracy": 0.45,
40
- "eval_loss": 1.4410462379455566,
41
- "eval_runtime": 1.4941,
42
- "eval_samples_per_second": 13.386,
43
- "eval_steps_per_second": 0.669,
44
  "step": 4
45
  },
46
  {
47
  "epoch": 4.67,
48
- "eval_accuracy": 0.65,
49
- "eval_loss": 1.2802143096923828,
50
- "eval_runtime": 1.5014,
51
- "eval_samples_per_second": 13.321,
52
- "eval_steps_per_second": 0.666,
53
  "step": 5
54
  },
55
  {
56
  "epoch": 5.67,
57
- "eval_accuracy": 0.75,
58
- "eval_loss": 1.1453020572662354,
59
- "eval_runtime": 1.5188,
60
- "eval_samples_per_second": 13.168,
61
- "eval_steps_per_second": 0.658,
62
  "step": 6
63
  },
64
  {
65
  "epoch": 6.67,
66
- "eval_accuracy": 0.75,
67
- "eval_loss": 1.0252652168273926,
68
- "eval_runtime": 1.5438,
69
- "eval_samples_per_second": 12.955,
70
- "eval_steps_per_second": 0.648,
71
  "step": 7
72
  },
73
  {
74
  "epoch": 7.67,
75
- "eval_accuracy": 0.75,
76
- "eval_loss": 0.9306014180183411,
77
- "eval_runtime": 1.3614,
78
- "eval_samples_per_second": 14.69,
79
- "eval_steps_per_second": 0.735,
80
  "step": 8
81
  },
82
  {
83
  "epoch": 8.67,
84
- "eval_accuracy": 0.8,
85
- "eval_loss": 0.8565734028816223,
86
- "eval_runtime": 1.4936,
87
- "eval_samples_per_second": 13.391,
88
- "eval_steps_per_second": 0.67,
89
  "step": 9
90
  },
91
  {
92
  "epoch": 9.67,
93
- "eval_accuracy": 0.8,
94
- "eval_loss": 0.8048442602157593,
95
- "eval_runtime": 1.5039,
96
- "eval_samples_per_second": 13.299,
97
- "eval_steps_per_second": 0.665,
98
  "step": 10
99
  },
100
  {
101
  "epoch": 10.67,
102
- "eval_accuracy": 0.8,
103
- "eval_loss": 0.7585190534591675,
104
- "eval_runtime": 1.483,
105
- "eval_samples_per_second": 13.486,
106
- "eval_steps_per_second": 0.674,
107
  "step": 11
108
  },
109
  {
110
  "epoch": 11.67,
111
- "eval_accuracy": 0.8,
112
- "eval_loss": 0.7096863985061646,
113
- "eval_runtime": 1.4896,
114
- "eval_samples_per_second": 13.426,
115
- "eval_steps_per_second": 0.671,
116
  "step": 12
117
  },
118
  {
119
  "epoch": 12.67,
120
- "eval_accuracy": 0.8,
121
- "eval_loss": 0.6442805528640747,
122
- "eval_runtime": 1.4975,
123
- "eval_samples_per_second": 13.355,
124
- "eval_steps_per_second": 0.668,
125
  "step": 13
126
  },
127
  {
128
  "epoch": 13.67,
129
- "eval_accuracy": 0.8,
130
- "eval_loss": 0.5771742463111877,
131
- "eval_runtime": 1.5019,
132
- "eval_samples_per_second": 13.317,
133
- "eval_steps_per_second": 0.666,
134
  "step": 14
135
  },
136
  {
137
  "epoch": 14.67,
138
- "eval_accuracy": 0.8,
139
- "eval_loss": 0.5056056380271912,
140
- "eval_runtime": 1.3719,
141
- "eval_samples_per_second": 14.578,
142
- "eval_steps_per_second": 0.729,
143
  "step": 15
144
  },
145
  {
146
  "epoch": 15.67,
147
- "eval_accuracy": 0.8,
148
- "eval_loss": 0.4443889558315277,
149
- "eval_runtime": 1.5003,
150
- "eval_samples_per_second": 13.331,
151
- "eval_steps_per_second": 0.667,
152
  "step": 16
153
  },
154
  {
155
  "epoch": 16.67,
156
- "eval_accuracy": 0.85,
157
- "eval_loss": 0.385681688785553,
158
- "eval_runtime": 1.4857,
159
- "eval_samples_per_second": 13.462,
160
- "eval_steps_per_second": 0.673,
161
  "step": 17
162
  },
163
  {
164
  "epoch": 17.67,
165
- "eval_accuracy": 0.85,
166
- "eval_loss": 0.3330341875553131,
167
- "eval_runtime": 1.5414,
168
- "eval_samples_per_second": 12.975,
169
- "eval_steps_per_second": 0.649,
170
  "step": 18
171
  },
172
  {
173
  "epoch": 18.67,
174
- "eval_accuracy": 0.9,
175
- "eval_loss": 0.2907267212867737,
176
- "eval_runtime": 1.5308,
177
- "eval_samples_per_second": 13.065,
178
- "eval_steps_per_second": 0.653,
179
  "step": 19
180
  },
181
  {
182
  "epoch": 19.67,
183
  "learning_rate": 2.777777777777778e-05,
184
- "loss": 1.4985,
185
  "step": 20
186
  },
187
  {
188
  "epoch": 19.67,
189
- "eval_accuracy": 0.95,
190
- "eval_loss": 0.2552061080932617,
191
- "eval_runtime": 1.5055,
192
- "eval_samples_per_second": 13.285,
193
- "eval_steps_per_second": 0.664,
194
  "step": 20
195
  },
196
  {
197
  "epoch": 20.67,
198
  "eval_accuracy": 1.0,
199
- "eval_loss": 0.22120876610279083,
200
- "eval_runtime": 1.529,
201
- "eval_samples_per_second": 13.081,
202
- "eval_steps_per_second": 0.654,
203
  "step": 21
204
  },
205
  {
206
  "epoch": 21.67,
207
  "eval_accuracy": 1.0,
208
- "eval_loss": 0.19384506344795227,
209
- "eval_runtime": 1.3951,
210
- "eval_samples_per_second": 14.336,
211
- "eval_steps_per_second": 0.717,
212
  "step": 22
213
  },
214
  {
215
  "epoch": 22.67,
216
  "eval_accuracy": 1.0,
217
- "eval_loss": 0.1699182689189911,
218
- "eval_runtime": 1.551,
219
- "eval_samples_per_second": 12.895,
220
- "eval_steps_per_second": 0.645,
221
  "step": 23
222
  },
223
  {
224
  "epoch": 23.67,
225
  "eval_accuracy": 1.0,
226
- "eval_loss": 0.14904645085334778,
227
- "eval_runtime": 1.5503,
228
- "eval_samples_per_second": 12.901,
229
- "eval_steps_per_second": 0.645,
230
  "step": 24
231
  },
232
  {
233
  "epoch": 24.67,
234
  "eval_accuracy": 1.0,
235
- "eval_loss": 0.13287147879600525,
236
- "eval_runtime": 1.5769,
237
- "eval_samples_per_second": 12.683,
238
- "eval_steps_per_second": 0.634,
239
  "step": 25
240
  },
241
  {
242
  "epoch": 25.67,
243
  "eval_accuracy": 1.0,
244
- "eval_loss": 0.12029655277729034,
245
- "eval_runtime": 1.5354,
246
- "eval_samples_per_second": 13.026,
247
- "eval_steps_per_second": 0.651,
248
  "step": 26
249
  },
250
  {
251
  "epoch": 26.67,
252
  "eval_accuracy": 1.0,
253
- "eval_loss": 0.11412191390991211,
254
- "eval_runtime": 1.6538,
255
- "eval_samples_per_second": 12.093,
256
- "eval_steps_per_second": 0.605,
257
  "step": 27
258
  },
259
  {
260
  "epoch": 27.67,
261
  "eval_accuracy": 1.0,
262
- "eval_loss": 0.10837922245264053,
263
- "eval_runtime": 1.5243,
264
- "eval_samples_per_second": 13.121,
265
- "eval_steps_per_second": 0.656,
266
  "step": 28
267
  },
268
  {
269
  "epoch": 28.67,
270
  "eval_accuracy": 1.0,
271
- "eval_loss": 0.10183490812778473,
272
- "eval_runtime": 1.3977,
273
- "eval_samples_per_second": 14.31,
274
- "eval_steps_per_second": 0.715,
275
  "step": 29
276
  },
277
  {
278
  "epoch": 29.67,
279
  "eval_accuracy": 1.0,
280
- "eval_loss": 0.09532036632299423,
281
- "eval_runtime": 1.5184,
282
- "eval_samples_per_second": 13.171,
283
- "eval_steps_per_second": 0.659,
284
  "step": 30
285
  },
286
  {
287
  "epoch": 30.67,
288
  "eval_accuracy": 1.0,
289
- "eval_loss": 0.0878124088048935,
290
- "eval_runtime": 1.4999,
291
- "eval_samples_per_second": 13.334,
292
- "eval_steps_per_second": 0.667,
293
  "step": 31
294
  },
295
  {
296
  "epoch": 31.67,
297
  "eval_accuracy": 1.0,
298
- "eval_loss": 0.07940232753753662,
299
- "eval_runtime": 2.1996,
300
- "eval_samples_per_second": 9.092,
301
- "eval_steps_per_second": 0.455,
302
  "step": 32
303
  },
304
  {
305
  "epoch": 32.67,
306
  "eval_accuracy": 1.0,
307
- "eval_loss": 0.0729844942688942,
308
- "eval_runtime": 1.5148,
309
- "eval_samples_per_second": 13.203,
310
- "eval_steps_per_second": 0.66,
311
  "step": 33
312
  },
313
  {
314
  "epoch": 33.67,
315
  "eval_accuracy": 1.0,
316
- "eval_loss": 0.06873825937509537,
317
- "eval_runtime": 1.5014,
318
- "eval_samples_per_second": 13.321,
319
- "eval_steps_per_second": 0.666,
320
  "step": 34
321
  },
322
  {
323
  "epoch": 34.67,
324
  "eval_accuracy": 1.0,
325
- "eval_loss": 0.06642889976501465,
326
- "eval_runtime": 1.5257,
327
- "eval_samples_per_second": 13.109,
328
- "eval_steps_per_second": 0.655,
329
  "step": 35
330
  },
331
  {
332
  "epoch": 35.67,
333
  "eval_accuracy": 1.0,
334
- "eval_loss": 0.06485584378242493,
335
- "eval_runtime": 1.3992,
336
- "eval_samples_per_second": 14.294,
337
- "eval_steps_per_second": 0.715,
338
  "step": 36
339
  },
340
  {
341
  "epoch": 36.67,
342
  "eval_accuracy": 1.0,
343
- "eval_loss": 0.06402350962162018,
344
- "eval_runtime": 1.5962,
345
- "eval_samples_per_second": 12.53,
346
- "eval_steps_per_second": 0.627,
347
  "step": 37
348
  },
349
  {
350
  "epoch": 37.67,
351
  "eval_accuracy": 1.0,
352
- "eval_loss": 0.06386792659759521,
353
- "eval_runtime": 1.5114,
354
- "eval_samples_per_second": 13.233,
355
- "eval_steps_per_second": 0.662,
356
  "step": 38
357
  },
358
  {
359
  "epoch": 38.67,
360
  "eval_accuracy": 1.0,
361
- "eval_loss": 0.06384583562612534,
362
- "eval_runtime": 1.4982,
363
- "eval_samples_per_second": 13.349,
364
- "eval_steps_per_second": 0.667,
365
  "step": 39
366
  },
367
  {
368
  "epoch": 39.67,
369
  "learning_rate": 0.0,
370
- "loss": 0.4842,
371
  "step": 40
372
  },
373
  {
374
  "epoch": 39.67,
375
  "eval_accuracy": 1.0,
376
- "eval_loss": 0.0637463703751564,
377
- "eval_runtime": 1.4885,
378
- "eval_samples_per_second": 13.436,
379
- "eval_steps_per_second": 0.672,
380
  "step": 40
381
  },
382
  {
383
  "epoch": 39.67,
384
  "step": 40,
385
- "total_flos": 1.7187351594113434e+17,
386
- "train_loss": 0.9913474082946777,
387
- "train_runtime": 823.5099,
388
- "train_samples_per_second": 8.452,
389
- "train_steps_per_second": 0.049
390
  }
391
  ],
392
  "max_steps": 40,
393
  "num_train_epochs": 40,
394
- "total_flos": 1.7187351594113434e+17,
395
  "trial_name": null,
396
  "trial_params": null
397
  }
 
1
  {
2
  "best_metric": 1.0,
3
+ "best_model_checkpoint": "delivery_truck_classification/checkpoint-13",
4
  "epoch": 39.666666666666664,
5
  "global_step": 40,
6
  "is_hyper_param_search": false,
 
9
  "log_history": [
10
  {
11
  "epoch": 0.67,
12
+ "eval_accuracy": 0.18181818181818182,
13
+ "eval_loss": 1.868780255317688,
14
+ "eval_runtime": 1.5131,
15
+ "eval_samples_per_second": 14.54,
16
+ "eval_steps_per_second": 0.661,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 1.67,
21
+ "eval_accuracy": 0.18181818181818182,
22
+ "eval_loss": 1.7919577360153198,
23
+ "eval_runtime": 1.7289,
24
+ "eval_samples_per_second": 12.725,
25
+ "eval_steps_per_second": 0.578,
26
  "step": 2
27
  },
28
  {
29
  "epoch": 2.67,
30
+ "eval_accuracy": 0.36363636363636365,
31
+ "eval_loss": 1.6533408164978027,
32
+ "eval_runtime": 1.6458,
33
+ "eval_samples_per_second": 13.368,
34
+ "eval_steps_per_second": 0.608,
35
  "step": 3
36
  },
37
  {
38
  "epoch": 3.67,
39
+ "eval_accuracy": 0.45454545454545453,
40
+ "eval_loss": 1.4775406122207642,
41
+ "eval_runtime": 1.6663,
42
+ "eval_samples_per_second": 13.203,
43
+ "eval_steps_per_second": 0.6,
44
  "step": 4
45
  },
46
  {
47
  "epoch": 4.67,
48
+ "eval_accuracy": 0.5909090909090909,
49
+ "eval_loss": 1.2912439107894897,
50
+ "eval_runtime": 1.6991,
51
+ "eval_samples_per_second": 12.948,
52
+ "eval_steps_per_second": 0.589,
53
  "step": 5
54
  },
55
  {
56
  "epoch": 5.67,
57
+ "eval_accuracy": 0.7272727272727273,
58
+ "eval_loss": 1.147495150566101,
59
+ "eval_runtime": 1.713,
60
+ "eval_samples_per_second": 12.843,
61
+ "eval_steps_per_second": 0.584,
62
  "step": 6
63
  },
64
  {
65
  "epoch": 6.67,
66
+ "eval_accuracy": 0.7727272727272727,
67
+ "eval_loss": 1.0265945196151733,
68
+ "eval_runtime": 1.5543,
69
+ "eval_samples_per_second": 14.154,
70
+ "eval_steps_per_second": 0.643,
71
  "step": 7
72
  },
73
  {
74
  "epoch": 7.67,
75
+ "eval_accuracy": 0.7727272727272727,
76
+ "eval_loss": 0.9196190237998962,
77
+ "eval_runtime": 1.677,
78
+ "eval_samples_per_second": 13.119,
79
+ "eval_steps_per_second": 0.596,
80
  "step": 8
81
  },
82
  {
83
  "epoch": 8.67,
84
+ "eval_accuracy": 0.8181818181818182,
85
+ "eval_loss": 0.8272687792778015,
86
+ "eval_runtime": 1.7098,
87
+ "eval_samples_per_second": 12.867,
88
+ "eval_steps_per_second": 0.585,
89
  "step": 9
90
  },
91
  {
92
  "epoch": 9.67,
93
+ "eval_accuracy": 0.8181818181818182,
94
+ "eval_loss": 0.7491626739501953,
95
+ "eval_runtime": 1.6687,
96
+ "eval_samples_per_second": 13.184,
97
+ "eval_steps_per_second": 0.599,
98
  "step": 10
99
  },
100
  {
101
  "epoch": 10.67,
102
+ "eval_accuracy": 0.9090909090909091,
103
+ "eval_loss": 0.6857182383537292,
104
+ "eval_runtime": 1.6621,
105
+ "eval_samples_per_second": 13.236,
106
+ "eval_steps_per_second": 0.602,
107
  "step": 11
108
  },
109
  {
110
  "epoch": 11.67,
111
+ "eval_accuracy": 0.9090909090909091,
112
+ "eval_loss": 0.6368551850318909,
113
+ "eval_runtime": 1.555,
114
+ "eval_samples_per_second": 14.148,
115
+ "eval_steps_per_second": 0.643,
116
  "step": 12
117
  },
118
  {
119
  "epoch": 12.67,
120
+ "eval_accuracy": 1.0,
121
+ "eval_loss": 0.5916178226470947,
122
+ "eval_runtime": 1.5463,
123
+ "eval_samples_per_second": 14.227,
124
+ "eval_steps_per_second": 0.647,
125
  "step": 13
126
  },
127
  {
128
  "epoch": 13.67,
129
+ "eval_accuracy": 1.0,
130
+ "eval_loss": 0.5461986660957336,
131
+ "eval_runtime": 1.751,
132
+ "eval_samples_per_second": 12.564,
133
+ "eval_steps_per_second": 0.571,
134
  "step": 14
135
  },
136
  {
137
  "epoch": 14.67,
138
+ "eval_accuracy": 1.0,
139
+ "eval_loss": 0.4926997423171997,
140
+ "eval_runtime": 1.6672,
141
+ "eval_samples_per_second": 13.196,
142
+ "eval_steps_per_second": 0.6,
143
  "step": 15
144
  },
145
  {
146
  "epoch": 15.67,
147
+ "eval_accuracy": 1.0,
148
+ "eval_loss": 0.4390135705471039,
149
+ "eval_runtime": 1.6819,
150
+ "eval_samples_per_second": 13.08,
151
+ "eval_steps_per_second": 0.595,
152
  "step": 16
153
  },
154
  {
155
  "epoch": 16.67,
156
+ "eval_accuracy": 1.0,
157
+ "eval_loss": 0.3913687765598297,
158
+ "eval_runtime": 1.7338,
159
+ "eval_samples_per_second": 12.689,
160
+ "eval_steps_per_second": 0.577,
161
  "step": 17
162
  },
163
  {
164
  "epoch": 17.67,
165
+ "eval_accuracy": 1.0,
166
+ "eval_loss": 0.3446086645126343,
167
+ "eval_runtime": 1.6759,
168
+ "eval_samples_per_second": 13.127,
169
+ "eval_steps_per_second": 0.597,
170
  "step": 18
171
  },
172
  {
173
  "epoch": 18.67,
174
+ "eval_accuracy": 1.0,
175
+ "eval_loss": 0.30193081498146057,
176
+ "eval_runtime": 1.53,
177
+ "eval_samples_per_second": 14.379,
178
+ "eval_steps_per_second": 0.654,
179
  "step": 19
180
  },
181
  {
182
  "epoch": 19.67,
183
  "learning_rate": 2.777777777777778e-05,
184
+ "loss": 1.7058,
185
  "step": 20
186
  },
187
  {
188
  "epoch": 19.67,
189
+ "eval_accuracy": 1.0,
190
+ "eval_loss": 0.26113784313201904,
191
+ "eval_runtime": 1.6899,
192
+ "eval_samples_per_second": 13.018,
193
+ "eval_steps_per_second": 0.592,
194
  "step": 20
195
  },
196
  {
197
  "epoch": 20.67,
198
  "eval_accuracy": 1.0,
199
+ "eval_loss": 0.22893615067005157,
200
+ "eval_runtime": 1.6979,
201
+ "eval_samples_per_second": 12.957,
202
+ "eval_steps_per_second": 0.589,
203
  "step": 21
204
  },
205
  {
206
  "epoch": 21.67,
207
  "eval_accuracy": 1.0,
208
+ "eval_loss": 0.19601884484291077,
209
+ "eval_runtime": 1.7011,
210
+ "eval_samples_per_second": 12.933,
211
+ "eval_steps_per_second": 0.588,
212
  "step": 22
213
  },
214
  {
215
  "epoch": 22.67,
216
  "eval_accuracy": 1.0,
217
+ "eval_loss": 0.17112015187740326,
218
+ "eval_runtime": 1.7223,
219
+ "eval_samples_per_second": 12.774,
220
+ "eval_steps_per_second": 0.581,
221
  "step": 23
222
  },
223
  {
224
  "epoch": 23.67,
225
  "eval_accuracy": 1.0,
226
+ "eval_loss": 0.1567678302526474,
227
+ "eval_runtime": 1.7218,
228
+ "eval_samples_per_second": 12.778,
229
+ "eval_steps_per_second": 0.581,
230
  "step": 24
231
  },
232
  {
233
  "epoch": 24.67,
234
  "eval_accuracy": 1.0,
235
+ "eval_loss": 0.14628903567790985,
236
+ "eval_runtime": 1.5212,
237
+ "eval_samples_per_second": 14.462,
238
+ "eval_steps_per_second": 0.657,
239
  "step": 25
240
  },
241
  {
242
  "epoch": 25.67,
243
  "eval_accuracy": 1.0,
244
+ "eval_loss": 0.13830214738845825,
245
+ "eval_runtime": 1.7359,
246
+ "eval_samples_per_second": 12.673,
247
+ "eval_steps_per_second": 0.576,
248
  "step": 26
249
  },
250
  {
251
  "epoch": 26.67,
252
  "eval_accuracy": 1.0,
253
+ "eval_loss": 0.13232018053531647,
254
+ "eval_runtime": 1.6428,
255
+ "eval_samples_per_second": 13.392,
256
+ "eval_steps_per_second": 0.609,
257
  "step": 27
258
  },
259
  {
260
  "epoch": 27.67,
261
  "eval_accuracy": 1.0,
262
+ "eval_loss": 0.12681324779987335,
263
+ "eval_runtime": 2.2983,
264
+ "eval_samples_per_second": 9.572,
265
+ "eval_steps_per_second": 0.435,
266
  "step": 28
267
  },
268
  {
269
  "epoch": 28.67,
270
  "eval_accuracy": 1.0,
271
+ "eval_loss": 0.1198858991265297,
272
+ "eval_runtime": 1.6718,
273
+ "eval_samples_per_second": 13.16,
274
+ "eval_steps_per_second": 0.598,
275
  "step": 29
276
  },
277
  {
278
  "epoch": 29.67,
279
  "eval_accuracy": 1.0,
280
+ "eval_loss": 0.11446233093738556,
281
+ "eval_runtime": 1.6684,
282
+ "eval_samples_per_second": 13.186,
283
+ "eval_steps_per_second": 0.599,
284
  "step": 30
285
  },
286
  {
287
  "epoch": 30.67,
288
  "eval_accuracy": 1.0,
289
+ "eval_loss": 0.11288688331842422,
290
+ "eval_runtime": 1.5105,
291
+ "eval_samples_per_second": 14.565,
292
+ "eval_steps_per_second": 0.662,
293
  "step": 31
294
  },
295
  {
296
  "epoch": 31.67,
297
  "eval_accuracy": 1.0,
298
+ "eval_loss": 0.10953269153833389,
299
+ "eval_runtime": 1.7039,
300
+ "eval_samples_per_second": 12.911,
301
+ "eval_steps_per_second": 0.587,
302
  "step": 32
303
  },
304
  {
305
  "epoch": 32.67,
306
  "eval_accuracy": 1.0,
307
+ "eval_loss": 0.10787732154130936,
308
+ "eval_runtime": 1.7185,
309
+ "eval_samples_per_second": 12.802,
310
+ "eval_steps_per_second": 0.582,
311
  "step": 33
312
  },
313
  {
314
  "epoch": 33.67,
315
  "eval_accuracy": 1.0,
316
+ "eval_loss": 0.10531877726316452,
317
+ "eval_runtime": 1.8305,
318
+ "eval_samples_per_second": 12.019,
319
+ "eval_steps_per_second": 0.546,
320
  "step": 34
321
  },
322
  {
323
  "epoch": 34.67,
324
  "eval_accuracy": 1.0,
325
+ "eval_loss": 0.10338964313268661,
326
+ "eval_runtime": 1.6703,
327
+ "eval_samples_per_second": 13.171,
328
+ "eval_steps_per_second": 0.599,
329
  "step": 35
330
  },
331
  {
332
  "epoch": 35.67,
333
  "eval_accuracy": 1.0,
334
+ "eval_loss": 0.09904544055461884,
335
+ "eval_runtime": 1.5401,
336
+ "eval_samples_per_second": 14.285,
337
+ "eval_steps_per_second": 0.649,
338
  "step": 36
339
  },
340
  {
341
  "epoch": 36.67,
342
  "eval_accuracy": 1.0,
343
+ "eval_loss": 0.09628929942846298,
344
+ "eval_runtime": 1.5486,
345
+ "eval_samples_per_second": 14.206,
346
+ "eval_steps_per_second": 0.646,
347
  "step": 37
348
  },
349
  {
350
  "epoch": 37.67,
351
  "eval_accuracy": 1.0,
352
+ "eval_loss": 0.09520366042852402,
353
+ "eval_runtime": 1.6769,
354
+ "eval_samples_per_second": 13.12,
355
+ "eval_steps_per_second": 0.596,
356
  "step": 38
357
  },
358
  {
359
  "epoch": 38.67,
360
  "eval_accuracy": 1.0,
361
+ "eval_loss": 0.09436272829771042,
362
+ "eval_runtime": 1.7152,
363
+ "eval_samples_per_second": 12.826,
364
+ "eval_steps_per_second": 0.583,
365
  "step": 39
366
  },
367
  {
368
  "epoch": 39.67,
369
  "learning_rate": 0.0,
370
+ "loss": 0.6083,
371
  "step": 40
372
  },
373
  {
374
  "epoch": 39.67,
375
  "eval_accuracy": 1.0,
376
+ "eval_loss": 0.0941963642835617,
377
+ "eval_runtime": 1.7089,
378
+ "eval_samples_per_second": 12.874,
379
+ "eval_steps_per_second": 0.585,
380
  "step": 40
381
  },
382
  {
383
  "epoch": 39.67,
384
  "step": 40,
385
+ "total_flos": 1.893243704668324e+17,
386
+ "train_loss": 1.1570292234420776,
387
+ "train_runtime": 934.4965,
388
+ "train_samples_per_second": 8.218,
389
+ "train_steps_per_second": 0.043
390
  }
391
  ],
392
  "max_steps": 40,
393
  "num_train_epochs": 40,
394
+ "total_flos": 1.893243704668324e+17,
395
  "trial_name": null,
396
  "trial_params": null
397
  }