|
{ |
|
"best_metric": 0.9692307692307692, |
|
"best_model_checkpoint": "delivery_truck_classification/checkpoint-56", |
|
"epoch": 59.8421052631579, |
|
"global_step": 240, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.84, |
|
"eval_accuracy": 0.18461538461538463, |
|
"eval_loss": 1.9335094690322876, |
|
"eval_runtime": 4.2505, |
|
"eval_samples_per_second": 15.292, |
|
"eval_steps_per_second": 0.706, |
|
"step": 4 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"eval_accuracy": 0.26153846153846155, |
|
"eval_loss": 1.83644700050354, |
|
"eval_runtime": 4.7909, |
|
"eval_samples_per_second": 13.567, |
|
"eval_steps_per_second": 0.626, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 2.84, |
|
"eval_accuracy": 0.38461538461538464, |
|
"eval_loss": 1.7054301500320435, |
|
"eval_runtime": 4.2339, |
|
"eval_samples_per_second": 15.352, |
|
"eval_steps_per_second": 0.709, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 3.84, |
|
"eval_accuracy": 0.4153846153846154, |
|
"eval_loss": 1.5629212856292725, |
|
"eval_runtime": 4.6, |
|
"eval_samples_per_second": 14.13, |
|
"eval_steps_per_second": 0.652, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 4.84, |
|
"learning_rate": 4.166666666666667e-05, |
|
"loss": 2.0106, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 4.84, |
|
"eval_accuracy": 0.47692307692307695, |
|
"eval_loss": 1.3906540870666504, |
|
"eval_runtime": 4.2108, |
|
"eval_samples_per_second": 15.437, |
|
"eval_steps_per_second": 0.712, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 5.84, |
|
"eval_accuracy": 0.5692307692307692, |
|
"eval_loss": 1.1983743906021118, |
|
"eval_runtime": 4.4922, |
|
"eval_samples_per_second": 14.47, |
|
"eval_steps_per_second": 0.668, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 6.84, |
|
"eval_accuracy": 0.6615384615384615, |
|
"eval_loss": 0.951930582523346, |
|
"eval_runtime": 4.3052, |
|
"eval_samples_per_second": 15.098, |
|
"eval_steps_per_second": 0.697, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 7.84, |
|
"eval_accuracy": 0.7846153846153846, |
|
"eval_loss": 0.7509785294532776, |
|
"eval_runtime": 4.6224, |
|
"eval_samples_per_second": 14.062, |
|
"eval_steps_per_second": 0.649, |
|
"step": 32 |
|
}, |
|
{ |
|
"epoch": 8.84, |
|
"eval_accuracy": 0.8615384615384616, |
|
"eval_loss": 0.5749186277389526, |
|
"eval_runtime": 5.8947, |
|
"eval_samples_per_second": 11.027, |
|
"eval_steps_per_second": 0.509, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 9.84, |
|
"learning_rate": 4.62962962962963e-05, |
|
"loss": 1.1009, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 9.84, |
|
"eval_accuracy": 0.9384615384615385, |
|
"eval_loss": 0.42441025376319885, |
|
"eval_runtime": 4.917, |
|
"eval_samples_per_second": 13.219, |
|
"eval_steps_per_second": 0.61, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 10.84, |
|
"eval_accuracy": 0.8923076923076924, |
|
"eval_loss": 0.3652417063713074, |
|
"eval_runtime": 4.3232, |
|
"eval_samples_per_second": 15.035, |
|
"eval_steps_per_second": 0.694, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 11.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.2734673023223877, |
|
"eval_runtime": 4.5868, |
|
"eval_samples_per_second": 14.171, |
|
"eval_steps_per_second": 0.654, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 12.84, |
|
"eval_accuracy": 0.8923076923076924, |
|
"eval_loss": 0.29086846113204956, |
|
"eval_runtime": 4.5389, |
|
"eval_samples_per_second": 14.321, |
|
"eval_steps_per_second": 0.661, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 13.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.22925466299057007, |
|
"eval_runtime": 4.2293, |
|
"eval_samples_per_second": 15.369, |
|
"eval_steps_per_second": 0.709, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 14.84, |
|
"learning_rate": 4.166666666666667e-05, |
|
"loss": 0.6329, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 14.84, |
|
"eval_accuracy": 0.9076923076923077, |
|
"eval_loss": 0.2562795877456665, |
|
"eval_runtime": 4.6895, |
|
"eval_samples_per_second": 13.861, |
|
"eval_steps_per_second": 0.64, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 15.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.22179557383060455, |
|
"eval_runtime": 4.4085, |
|
"eval_samples_per_second": 14.744, |
|
"eval_steps_per_second": 0.681, |
|
"step": 64 |
|
}, |
|
{ |
|
"epoch": 16.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.21023423969745636, |
|
"eval_runtime": 4.6409, |
|
"eval_samples_per_second": 14.006, |
|
"eval_steps_per_second": 0.646, |
|
"step": 68 |
|
}, |
|
{ |
|
"epoch": 17.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.18287315964698792, |
|
"eval_runtime": 4.2374, |
|
"eval_samples_per_second": 15.339, |
|
"eval_steps_per_second": 0.708, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 18.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.1991574615240097, |
|
"eval_runtime": 4.6374, |
|
"eval_samples_per_second": 14.016, |
|
"eval_steps_per_second": 0.647, |
|
"step": 76 |
|
}, |
|
{ |
|
"epoch": 19.84, |
|
"learning_rate": 3.7037037037037037e-05, |
|
"loss": 0.497, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 19.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.18140976130962372, |
|
"eval_runtime": 4.3083, |
|
"eval_samples_per_second": 15.087, |
|
"eval_steps_per_second": 0.696, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 20.84, |
|
"eval_accuracy": 0.9384615384615385, |
|
"eval_loss": 0.18073710799217224, |
|
"eval_runtime": 4.692, |
|
"eval_samples_per_second": 13.853, |
|
"eval_steps_per_second": 0.639, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 21.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.17651371657848358, |
|
"eval_runtime": 4.3195, |
|
"eval_samples_per_second": 15.048, |
|
"eval_steps_per_second": 0.695, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 22.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.18682582676410675, |
|
"eval_runtime": 4.7596, |
|
"eval_samples_per_second": 13.657, |
|
"eval_steps_per_second": 0.63, |
|
"step": 92 |
|
}, |
|
{ |
|
"epoch": 23.84, |
|
"eval_accuracy": 0.9384615384615385, |
|
"eval_loss": 0.20892775058746338, |
|
"eval_runtime": 4.337, |
|
"eval_samples_per_second": 14.987, |
|
"eval_steps_per_second": 0.692, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 24.84, |
|
"learning_rate": 3.240740740740741e-05, |
|
"loss": 0.4198, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 24.84, |
|
"eval_accuracy": 0.9384615384615385, |
|
"eval_loss": 0.18977122008800507, |
|
"eval_runtime": 4.6813, |
|
"eval_samples_per_second": 13.885, |
|
"eval_steps_per_second": 0.641, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 25.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.20645342767238617, |
|
"eval_runtime": 4.2709, |
|
"eval_samples_per_second": 15.219, |
|
"eval_steps_per_second": 0.702, |
|
"step": 104 |
|
}, |
|
{ |
|
"epoch": 26.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.18446099758148193, |
|
"eval_runtime": 4.7129, |
|
"eval_samples_per_second": 13.792, |
|
"eval_steps_per_second": 0.637, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 27.84, |
|
"eval_accuracy": 0.9230769230769231, |
|
"eval_loss": 0.17242665588855743, |
|
"eval_runtime": 4.2634, |
|
"eval_samples_per_second": 15.246, |
|
"eval_steps_per_second": 0.704, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 28.84, |
|
"eval_accuracy": 0.9384615384615385, |
|
"eval_loss": 0.1611722856760025, |
|
"eval_runtime": 4.5386, |
|
"eval_samples_per_second": 14.322, |
|
"eval_steps_per_second": 0.661, |
|
"step": 116 |
|
}, |
|
{ |
|
"epoch": 29.84, |
|
"learning_rate": 2.777777777777778e-05, |
|
"loss": 0.368, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 29.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.15382908284664154, |
|
"eval_runtime": 5.2863, |
|
"eval_samples_per_second": 12.296, |
|
"eval_steps_per_second": 0.567, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 30.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.15675745904445648, |
|
"eval_runtime": 4.6707, |
|
"eval_samples_per_second": 13.916, |
|
"eval_steps_per_second": 0.642, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 31.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14750127494335175, |
|
"eval_runtime": 4.2141, |
|
"eval_samples_per_second": 15.425, |
|
"eval_steps_per_second": 0.712, |
|
"step": 128 |
|
}, |
|
{ |
|
"epoch": 32.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.14530035853385925, |
|
"eval_runtime": 4.5446, |
|
"eval_samples_per_second": 14.303, |
|
"eval_steps_per_second": 0.66, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 33.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.1576438844203949, |
|
"eval_runtime": 4.2804, |
|
"eval_samples_per_second": 15.186, |
|
"eval_steps_per_second": 0.701, |
|
"step": 136 |
|
}, |
|
{ |
|
"epoch": 34.84, |
|
"learning_rate": 2.314814814814815e-05, |
|
"loss": 0.3709, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 34.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14298613369464874, |
|
"eval_runtime": 4.6347, |
|
"eval_samples_per_second": 14.025, |
|
"eval_steps_per_second": 0.647, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 35.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.13841809332370758, |
|
"eval_runtime": 4.3512, |
|
"eval_samples_per_second": 14.938, |
|
"eval_steps_per_second": 0.689, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 36.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14322978258132935, |
|
"eval_runtime": 4.6696, |
|
"eval_samples_per_second": 13.92, |
|
"eval_steps_per_second": 0.642, |
|
"step": 148 |
|
}, |
|
{ |
|
"epoch": 37.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.13474790751934052, |
|
"eval_runtime": 4.2951, |
|
"eval_samples_per_second": 15.133, |
|
"eval_steps_per_second": 0.698, |
|
"step": 152 |
|
}, |
|
{ |
|
"epoch": 38.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.1358633041381836, |
|
"eval_runtime": 4.6622, |
|
"eval_samples_per_second": 13.942, |
|
"eval_steps_per_second": 0.643, |
|
"step": 156 |
|
}, |
|
{ |
|
"epoch": 39.84, |
|
"learning_rate": 1.8518518518518518e-05, |
|
"loss": 0.3373, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 39.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.15974925458431244, |
|
"eval_runtime": 4.2867, |
|
"eval_samples_per_second": 15.163, |
|
"eval_steps_per_second": 0.7, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 40.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.15224121510982513, |
|
"eval_runtime": 4.6977, |
|
"eval_samples_per_second": 13.837, |
|
"eval_steps_per_second": 0.639, |
|
"step": 164 |
|
}, |
|
{ |
|
"epoch": 41.84, |
|
"eval_accuracy": 0.9538461538461539, |
|
"eval_loss": 0.14772085845470428, |
|
"eval_runtime": 4.316, |
|
"eval_samples_per_second": 15.06, |
|
"eval_steps_per_second": 0.695, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 42.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.1480209231376648, |
|
"eval_runtime": 4.7164, |
|
"eval_samples_per_second": 13.782, |
|
"eval_steps_per_second": 0.636, |
|
"step": 172 |
|
}, |
|
{ |
|
"epoch": 43.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14724673330783844, |
|
"eval_runtime": 4.3123, |
|
"eval_samples_per_second": 15.073, |
|
"eval_steps_per_second": 0.696, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 44.84, |
|
"learning_rate": 1.388888888888889e-05, |
|
"loss": 0.3342, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 44.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14734135568141937, |
|
"eval_runtime": 4.5929, |
|
"eval_samples_per_second": 14.152, |
|
"eval_steps_per_second": 0.653, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 45.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14583279192447662, |
|
"eval_runtime": 4.3738, |
|
"eval_samples_per_second": 14.861, |
|
"eval_steps_per_second": 0.686, |
|
"step": 184 |
|
}, |
|
{ |
|
"epoch": 46.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.15290141105651855, |
|
"eval_runtime": 4.6815, |
|
"eval_samples_per_second": 13.884, |
|
"eval_steps_per_second": 0.641, |
|
"step": 188 |
|
}, |
|
{ |
|
"epoch": 47.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.15495683252811432, |
|
"eval_runtime": 4.3181, |
|
"eval_samples_per_second": 15.053, |
|
"eval_steps_per_second": 0.695, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 48.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14939415454864502, |
|
"eval_runtime": 4.7194, |
|
"eval_samples_per_second": 13.773, |
|
"eval_steps_per_second": 0.636, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 49.84, |
|
"learning_rate": 9.259259259259259e-06, |
|
"loss": 0.2914, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 49.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.1469651609659195, |
|
"eval_runtime": 4.259, |
|
"eval_samples_per_second": 15.262, |
|
"eval_steps_per_second": 0.704, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 50.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.146009162068367, |
|
"eval_runtime": 4.6878, |
|
"eval_samples_per_second": 13.866, |
|
"eval_steps_per_second": 0.64, |
|
"step": 204 |
|
}, |
|
{ |
|
"epoch": 51.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14776931703090668, |
|
"eval_runtime": 4.265, |
|
"eval_samples_per_second": 15.24, |
|
"eval_steps_per_second": 0.703, |
|
"step": 208 |
|
}, |
|
{ |
|
"epoch": 52.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.1481345295906067, |
|
"eval_runtime": 4.5299, |
|
"eval_samples_per_second": 14.349, |
|
"eval_steps_per_second": 0.662, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 53.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14605876803398132, |
|
"eval_runtime": 4.1658, |
|
"eval_samples_per_second": 15.603, |
|
"eval_steps_per_second": 0.72, |
|
"step": 216 |
|
}, |
|
{ |
|
"epoch": 54.84, |
|
"learning_rate": 4.6296296296296296e-06, |
|
"loss": 0.2736, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 54.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14581629633903503, |
|
"eval_runtime": 4.4574, |
|
"eval_samples_per_second": 14.583, |
|
"eval_steps_per_second": 0.673, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 55.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14382527768611908, |
|
"eval_runtime": 4.1183, |
|
"eval_samples_per_second": 15.783, |
|
"eval_steps_per_second": 0.728, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 56.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14272591471672058, |
|
"eval_runtime": 4.5294, |
|
"eval_samples_per_second": 14.351, |
|
"eval_steps_per_second": 0.662, |
|
"step": 228 |
|
}, |
|
{ |
|
"epoch": 57.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.14175653457641602, |
|
"eval_runtime": 4.1288, |
|
"eval_samples_per_second": 15.743, |
|
"eval_steps_per_second": 0.727, |
|
"step": 232 |
|
}, |
|
{ |
|
"epoch": 58.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.140133798122406, |
|
"eval_runtime": 4.5233, |
|
"eval_samples_per_second": 14.37, |
|
"eval_steps_per_second": 0.663, |
|
"step": 236 |
|
}, |
|
{ |
|
"epoch": 59.84, |
|
"learning_rate": 0.0, |
|
"loss": 0.2589, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 59.84, |
|
"eval_accuracy": 0.9692307692307692, |
|
"eval_loss": 0.13985498249530792, |
|
"eval_runtime": 4.4933, |
|
"eval_samples_per_second": 14.466, |
|
"eval_steps_per_second": 0.668, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 59.84, |
|
"step": 240, |
|
"total_flos": 8.648855308501955e+17, |
|
"train_loss": 0.5746380070845286, |
|
"train_runtime": 4313.6028, |
|
"train_samples_per_second": 8.081, |
|
"train_steps_per_second": 0.056 |
|
} |
|
], |
|
"max_steps": 240, |
|
"num_train_epochs": 60, |
|
"total_flos": 8.648855308501955e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|