|
{ |
|
"best_metric": 0.9259259259259259, |
|
"best_model_checkpoint": "delivery_truck_classification/checkpoint-66", |
|
"epoch": 39.8, |
|
"global_step": 120, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.8, |
|
"eval_accuracy": 0.2222222222222222, |
|
"eval_loss": 1.8672751188278198, |
|
"eval_runtime": 3.8871, |
|
"eval_samples_per_second": 13.892, |
|
"eval_steps_per_second": 0.515, |
|
"step": 3 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"eval_accuracy": 0.25925925925925924, |
|
"eval_loss": 1.7420549392700195, |
|
"eval_runtime": 4.3749, |
|
"eval_samples_per_second": 12.343, |
|
"eval_steps_per_second": 0.457, |
|
"step": 6 |
|
}, |
|
{ |
|
"epoch": 2.8, |
|
"eval_accuracy": 0.42592592592592593, |
|
"eval_loss": 1.5909960269927979, |
|
"eval_runtime": 4.1131, |
|
"eval_samples_per_second": 13.129, |
|
"eval_steps_per_second": 0.486, |
|
"step": 9 |
|
}, |
|
{ |
|
"epoch": 3.8, |
|
"eval_accuracy": 0.5, |
|
"eval_loss": 1.4371126890182495, |
|
"eval_runtime": 3.8435, |
|
"eval_samples_per_second": 14.05, |
|
"eval_steps_per_second": 0.52, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 4.8, |
|
"eval_accuracy": 0.5740740740740741, |
|
"eval_loss": 1.2870995998382568, |
|
"eval_runtime": 4.1635, |
|
"eval_samples_per_second": 12.97, |
|
"eval_steps_per_second": 0.48, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"eval_accuracy": 0.5740740740740741, |
|
"eval_loss": 1.1510515213012695, |
|
"eval_runtime": 4.0675, |
|
"eval_samples_per_second": 13.276, |
|
"eval_steps_per_second": 0.492, |
|
"step": 18 |
|
}, |
|
{ |
|
"epoch": 6.53, |
|
"learning_rate": 4.62962962962963e-05, |
|
"loss": 1.8164, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 6.8, |
|
"eval_accuracy": 0.7222222222222222, |
|
"eval_loss": 0.9362860321998596, |
|
"eval_runtime": 3.7257, |
|
"eval_samples_per_second": 14.494, |
|
"eval_steps_per_second": 0.537, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 7.8, |
|
"eval_accuracy": 0.7777777777777778, |
|
"eval_loss": 0.7902935147285461, |
|
"eval_runtime": 4.0908, |
|
"eval_samples_per_second": 13.2, |
|
"eval_steps_per_second": 0.489, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"eval_accuracy": 0.7592592592592593, |
|
"eval_loss": 0.6839045882225037, |
|
"eval_runtime": 4.2293, |
|
"eval_samples_per_second": 12.768, |
|
"eval_steps_per_second": 0.473, |
|
"step": 27 |
|
}, |
|
{ |
|
"epoch": 9.8, |
|
"eval_accuracy": 0.7777777777777778, |
|
"eval_loss": 0.5660675764083862, |
|
"eval_runtime": 3.7011, |
|
"eval_samples_per_second": 14.59, |
|
"eval_steps_per_second": 0.54, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 10.8, |
|
"eval_accuracy": 0.8518518518518519, |
|
"eval_loss": 0.4638045132160187, |
|
"eval_runtime": 4.0924, |
|
"eval_samples_per_second": 13.195, |
|
"eval_steps_per_second": 0.489, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 11.8, |
|
"eval_accuracy": 0.8703703703703703, |
|
"eval_loss": 0.4015035033226013, |
|
"eval_runtime": 4.126, |
|
"eval_samples_per_second": 13.088, |
|
"eval_steps_per_second": 0.485, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 12.8, |
|
"eval_accuracy": 0.8703703703703703, |
|
"eval_loss": 0.3809252083301544, |
|
"eval_runtime": 3.7332, |
|
"eval_samples_per_second": 14.465, |
|
"eval_steps_per_second": 0.536, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 13.27, |
|
"learning_rate": 3.7037037037037037e-05, |
|
"loss": 0.8525, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 13.8, |
|
"eval_accuracy": 0.9074074074074074, |
|
"eval_loss": 0.32140079140663147, |
|
"eval_runtime": 4.0811, |
|
"eval_samples_per_second": 13.232, |
|
"eval_steps_per_second": 0.49, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 14.8, |
|
"eval_accuracy": 0.8703703703703703, |
|
"eval_loss": 0.31137827038764954, |
|
"eval_runtime": 4.0629, |
|
"eval_samples_per_second": 13.291, |
|
"eval_steps_per_second": 0.492, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 15.8, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_loss": 0.30256393551826477, |
|
"eval_runtime": 3.8458, |
|
"eval_samples_per_second": 14.041, |
|
"eval_steps_per_second": 0.52, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 16.8, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_loss": 0.2969690263271332, |
|
"eval_runtime": 4.091, |
|
"eval_samples_per_second": 13.2, |
|
"eval_steps_per_second": 0.489, |
|
"step": 51 |
|
}, |
|
{ |
|
"epoch": 17.8, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_loss": 0.2597466707229614, |
|
"eval_runtime": 4.0172, |
|
"eval_samples_per_second": 13.442, |
|
"eval_steps_per_second": 0.498, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 18.8, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_loss": 0.2791738212108612, |
|
"eval_runtime": 3.7642, |
|
"eval_samples_per_second": 14.346, |
|
"eval_steps_per_second": 0.531, |
|
"step": 57 |
|
}, |
|
{ |
|
"epoch": 19.8, |
|
"learning_rate": 2.777777777777778e-05, |
|
"loss": 0.4831, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 19.8, |
|
"eval_accuracy": 0.8703703703703703, |
|
"eval_loss": 0.3208976984024048, |
|
"eval_runtime": 4.0804, |
|
"eval_samples_per_second": 13.234, |
|
"eval_steps_per_second": 0.49, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 20.8, |
|
"eval_accuracy": 0.9074074074074074, |
|
"eval_loss": 0.2928622364997864, |
|
"eval_runtime": 4.1417, |
|
"eval_samples_per_second": 13.038, |
|
"eval_steps_per_second": 0.483, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 21.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.24187135696411133, |
|
"eval_runtime": 3.7664, |
|
"eval_samples_per_second": 14.337, |
|
"eval_steps_per_second": 0.531, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 22.8, |
|
"eval_accuracy": 0.9074074074074074, |
|
"eval_loss": 0.24963845312595367, |
|
"eval_runtime": 4.1506, |
|
"eval_samples_per_second": 13.01, |
|
"eval_steps_per_second": 0.482, |
|
"step": 69 |
|
}, |
|
{ |
|
"epoch": 23.8, |
|
"eval_accuracy": 0.9074074074074074, |
|
"eval_loss": 0.29534202814102173, |
|
"eval_runtime": 4.1866, |
|
"eval_samples_per_second": 12.898, |
|
"eval_steps_per_second": 0.478, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 24.8, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_loss": 0.30937835574150085, |
|
"eval_runtime": 3.7669, |
|
"eval_samples_per_second": 14.336, |
|
"eval_steps_per_second": 0.531, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 25.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.2792222201824188, |
|
"eval_runtime": 4.0339, |
|
"eval_samples_per_second": 13.387, |
|
"eval_steps_per_second": 0.496, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 26.53, |
|
"learning_rate": 1.8518518518518518e-05, |
|
"loss": 0.3889, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 26.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.2522352933883667, |
|
"eval_runtime": 4.0446, |
|
"eval_samples_per_second": 13.351, |
|
"eval_steps_per_second": 0.494, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 27.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.24507637321949005, |
|
"eval_runtime": 3.701, |
|
"eval_samples_per_second": 14.591, |
|
"eval_steps_per_second": 0.54, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 28.8, |
|
"eval_accuracy": 0.9074074074074074, |
|
"eval_loss": 0.2540915906429291, |
|
"eval_runtime": 4.1415, |
|
"eval_samples_per_second": 13.039, |
|
"eval_steps_per_second": 0.483, |
|
"step": 87 |
|
}, |
|
{ |
|
"epoch": 29.8, |
|
"eval_accuracy": 0.9074074074074074, |
|
"eval_loss": 0.2718075215816498, |
|
"eval_runtime": 4.0783, |
|
"eval_samples_per_second": 13.241, |
|
"eval_steps_per_second": 0.49, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 30.8, |
|
"eval_accuracy": 0.9074074074074074, |
|
"eval_loss": 0.2738485634326935, |
|
"eval_runtime": 3.7309, |
|
"eval_samples_per_second": 14.474, |
|
"eval_steps_per_second": 0.536, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 31.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.26387789845466614, |
|
"eval_runtime": 4.0527, |
|
"eval_samples_per_second": 13.324, |
|
"eval_steps_per_second": 0.493, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 32.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.25608906149864197, |
|
"eval_runtime": 4.0393, |
|
"eval_samples_per_second": 13.369, |
|
"eval_steps_per_second": 0.495, |
|
"step": 99 |
|
}, |
|
{ |
|
"epoch": 33.27, |
|
"learning_rate": 9.259259259259259e-06, |
|
"loss": 0.3407, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 33.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.2497122436761856, |
|
"eval_runtime": 3.7801, |
|
"eval_samples_per_second": 14.285, |
|
"eval_steps_per_second": 0.529, |
|
"step": 102 |
|
}, |
|
{ |
|
"epoch": 34.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.2501243054866791, |
|
"eval_runtime": 4.0375, |
|
"eval_samples_per_second": 13.374, |
|
"eval_steps_per_second": 0.495, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 35.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.24550123512744904, |
|
"eval_runtime": 4.0543, |
|
"eval_samples_per_second": 13.319, |
|
"eval_steps_per_second": 0.493, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 36.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.238052099943161, |
|
"eval_runtime": 3.8053, |
|
"eval_samples_per_second": 14.191, |
|
"eval_steps_per_second": 0.526, |
|
"step": 111 |
|
}, |
|
{ |
|
"epoch": 37.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.23396454751491547, |
|
"eval_runtime": 4.0536, |
|
"eval_samples_per_second": 13.321, |
|
"eval_steps_per_second": 0.493, |
|
"step": 114 |
|
}, |
|
{ |
|
"epoch": 38.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.23214255273342133, |
|
"eval_runtime": 4.0625, |
|
"eval_samples_per_second": 13.292, |
|
"eval_steps_per_second": 0.492, |
|
"step": 117 |
|
}, |
|
{ |
|
"epoch": 39.8, |
|
"learning_rate": 0.0, |
|
"loss": 0.3112, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 39.8, |
|
"eval_accuracy": 0.9259259259259259, |
|
"eval_loss": 0.23147787153720856, |
|
"eval_runtime": 3.7365, |
|
"eval_samples_per_second": 14.452, |
|
"eval_steps_per_second": 0.535, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 39.8, |
|
"step": 120, |
|
"total_flos": 4.7393239534534656e+17, |
|
"train_loss": 0.6987951993942261, |
|
"train_runtime": 2118.2023, |
|
"train_samples_per_second": 9.045, |
|
"train_steps_per_second": 0.057 |
|
} |
|
], |
|
"max_steps": 120, |
|
"num_train_epochs": 40, |
|
"total_flos": 4.7393239534534656e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|