delivery_truck_classification / trainer_state.json
JEdward7777's picture
End of training
c0290b8
raw
history blame
16.7 kB
{
"best_metric": 1.0,
"best_model_checkpoint": "delivery_truck_classification/checkpoint-172",
"epoch": 59.94117647058823,
"global_step": 240,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.94,
"eval_accuracy": 0.1864406779661017,
"eval_loss": 1.9123966693878174,
"eval_runtime": 3.7131,
"eval_samples_per_second": 15.89,
"eval_steps_per_second": 0.539,
"step": 4
},
{
"epoch": 1.94,
"eval_accuracy": 0.23728813559322035,
"eval_loss": 1.8094592094421387,
"eval_runtime": 4.4625,
"eval_samples_per_second": 13.221,
"eval_steps_per_second": 0.448,
"step": 8
},
{
"epoch": 2.94,
"eval_accuracy": 0.3898305084745763,
"eval_loss": 1.6757333278656006,
"eval_runtime": 3.88,
"eval_samples_per_second": 15.206,
"eval_steps_per_second": 0.515,
"step": 12
},
{
"epoch": 3.94,
"eval_accuracy": 0.5254237288135594,
"eval_loss": 1.4906411170959473,
"eval_runtime": 3.788,
"eval_samples_per_second": 15.576,
"eval_steps_per_second": 0.528,
"step": 16
},
{
"epoch": 4.94,
"learning_rate": 4.166666666666667e-05,
"loss": 1.8286,
"step": 20
},
{
"epoch": 4.94,
"eval_accuracy": 0.6440677966101694,
"eval_loss": 1.2703886032104492,
"eval_runtime": 4.208,
"eval_samples_per_second": 14.021,
"eval_steps_per_second": 0.475,
"step": 20
},
{
"epoch": 5.94,
"eval_accuracy": 0.6779661016949152,
"eval_loss": 1.0685124397277832,
"eval_runtime": 3.8096,
"eval_samples_per_second": 15.487,
"eval_steps_per_second": 0.525,
"step": 24
},
{
"epoch": 6.94,
"eval_accuracy": 0.7457627118644068,
"eval_loss": 0.8031855225563049,
"eval_runtime": 4.1542,
"eval_samples_per_second": 14.203,
"eval_steps_per_second": 0.481,
"step": 28
},
{
"epoch": 7.94,
"eval_accuracy": 0.7627118644067796,
"eval_loss": 0.6308717131614685,
"eval_runtime": 3.7602,
"eval_samples_per_second": 15.691,
"eval_steps_per_second": 0.532,
"step": 32
},
{
"epoch": 8.94,
"eval_accuracy": 0.847457627118644,
"eval_loss": 0.49890831112861633,
"eval_runtime": 4.1569,
"eval_samples_per_second": 14.193,
"eval_steps_per_second": 0.481,
"step": 36
},
{
"epoch": 9.94,
"learning_rate": 4.62962962962963e-05,
"loss": 0.9342,
"step": 40
},
{
"epoch": 9.94,
"eval_accuracy": 0.847457627118644,
"eval_loss": 0.40634387731552124,
"eval_runtime": 3.8202,
"eval_samples_per_second": 15.444,
"eval_steps_per_second": 0.524,
"step": 40
},
{
"epoch": 10.94,
"eval_accuracy": 0.9152542372881356,
"eval_loss": 0.26924625039100647,
"eval_runtime": 4.1384,
"eval_samples_per_second": 14.257,
"eval_steps_per_second": 0.483,
"step": 44
},
{
"epoch": 11.94,
"eval_accuracy": 0.8983050847457628,
"eval_loss": 0.27362605929374695,
"eval_runtime": 3.707,
"eval_samples_per_second": 15.916,
"eval_steps_per_second": 0.54,
"step": 48
},
{
"epoch": 12.94,
"eval_accuracy": 0.9322033898305084,
"eval_loss": 0.21159349381923676,
"eval_runtime": 4.0712,
"eval_samples_per_second": 14.492,
"eval_steps_per_second": 0.491,
"step": 52
},
{
"epoch": 13.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.1497751921415329,
"eval_runtime": 3.629,
"eval_samples_per_second": 16.258,
"eval_steps_per_second": 0.551,
"step": 56
},
{
"epoch": 14.94,
"learning_rate": 4.166666666666667e-05,
"loss": 0.5151,
"step": 60
},
{
"epoch": 14.94,
"eval_accuracy": 0.9152542372881356,
"eval_loss": 0.1906394362449646,
"eval_runtime": 4.159,
"eval_samples_per_second": 14.186,
"eval_steps_per_second": 0.481,
"step": 60
},
{
"epoch": 15.94,
"eval_accuracy": 0.9491525423728814,
"eval_loss": 0.16975143551826477,
"eval_runtime": 3.7313,
"eval_samples_per_second": 15.812,
"eval_steps_per_second": 0.536,
"step": 64
},
{
"epoch": 16.94,
"eval_accuracy": 0.9491525423728814,
"eval_loss": 0.1431875377893448,
"eval_runtime": 4.1272,
"eval_samples_per_second": 14.295,
"eval_steps_per_second": 0.485,
"step": 68
},
{
"epoch": 17.94,
"eval_accuracy": 0.9322033898305084,
"eval_loss": 0.16815055906772614,
"eval_runtime": 3.6724,
"eval_samples_per_second": 16.066,
"eval_steps_per_second": 0.545,
"step": 72
},
{
"epoch": 18.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.10692509263753891,
"eval_runtime": 4.1232,
"eval_samples_per_second": 14.309,
"eval_steps_per_second": 0.485,
"step": 76
},
{
"epoch": 19.94,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.4009,
"step": 80
},
{
"epoch": 19.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.08214119076728821,
"eval_runtime": 3.6886,
"eval_samples_per_second": 15.995,
"eval_steps_per_second": 0.542,
"step": 80
},
{
"epoch": 20.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.09025811403989792,
"eval_runtime": 4.3053,
"eval_samples_per_second": 13.704,
"eval_steps_per_second": 0.465,
"step": 84
},
{
"epoch": 21.94,
"eval_accuracy": 0.9661016949152542,
"eval_loss": 0.12810270488262177,
"eval_runtime": 3.7203,
"eval_samples_per_second": 15.859,
"eval_steps_per_second": 0.538,
"step": 88
},
{
"epoch": 22.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.09356144815683365,
"eval_runtime": 4.118,
"eval_samples_per_second": 14.328,
"eval_steps_per_second": 0.486,
"step": 92
},
{
"epoch": 23.94,
"eval_accuracy": 0.9661016949152542,
"eval_loss": 0.10591834783554077,
"eval_runtime": 3.6933,
"eval_samples_per_second": 15.975,
"eval_steps_per_second": 0.542,
"step": 96
},
{
"epoch": 24.94,
"learning_rate": 3.240740740740741e-05,
"loss": 0.3482,
"step": 100
},
{
"epoch": 24.94,
"eval_accuracy": 0.9491525423728814,
"eval_loss": 0.14312368631362915,
"eval_runtime": 4.1639,
"eval_samples_per_second": 14.169,
"eval_steps_per_second": 0.48,
"step": 100
},
{
"epoch": 25.94,
"eval_accuracy": 0.9661016949152542,
"eval_loss": 0.08986904472112656,
"eval_runtime": 3.7088,
"eval_samples_per_second": 15.908,
"eval_steps_per_second": 0.539,
"step": 104
},
{
"epoch": 26.94,
"eval_accuracy": 0.9661016949152542,
"eval_loss": 0.06888163089752197,
"eval_runtime": 4.1304,
"eval_samples_per_second": 14.284,
"eval_steps_per_second": 0.484,
"step": 108
},
{
"epoch": 27.94,
"eval_accuracy": 0.9661016949152542,
"eval_loss": 0.07510155439376831,
"eval_runtime": 3.7462,
"eval_samples_per_second": 15.749,
"eval_steps_per_second": 0.534,
"step": 112
},
{
"epoch": 28.94,
"eval_accuracy": 0.9661016949152542,
"eval_loss": 0.08912018686532974,
"eval_runtime": 3.7992,
"eval_samples_per_second": 15.53,
"eval_steps_per_second": 0.526,
"step": 116
},
{
"epoch": 29.94,
"learning_rate": 2.777777777777778e-05,
"loss": 0.3306,
"step": 120
},
{
"epoch": 29.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.05226200073957443,
"eval_runtime": 4.2109,
"eval_samples_per_second": 14.011,
"eval_steps_per_second": 0.475,
"step": 120
},
{
"epoch": 30.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.07344209402799606,
"eval_runtime": 3.9025,
"eval_samples_per_second": 15.118,
"eval_steps_per_second": 0.512,
"step": 124
},
{
"epoch": 31.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.07462318241596222,
"eval_runtime": 4.1592,
"eval_samples_per_second": 14.185,
"eval_steps_per_second": 0.481,
"step": 128
},
{
"epoch": 32.94,
"eval_accuracy": 0.9661016949152542,
"eval_loss": 0.04742526262998581,
"eval_runtime": 3.8091,
"eval_samples_per_second": 15.489,
"eval_steps_per_second": 0.525,
"step": 132
},
{
"epoch": 33.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.044318120926618576,
"eval_runtime": 3.7853,
"eval_samples_per_second": 15.587,
"eval_steps_per_second": 0.528,
"step": 136
},
{
"epoch": 34.94,
"learning_rate": 2.314814814814815e-05,
"loss": 0.2871,
"step": 140
},
{
"epoch": 34.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.08141448348760605,
"eval_runtime": 4.1875,
"eval_samples_per_second": 14.09,
"eval_steps_per_second": 0.478,
"step": 140
},
{
"epoch": 35.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.0690697729587555,
"eval_runtime": 3.7869,
"eval_samples_per_second": 15.58,
"eval_steps_per_second": 0.528,
"step": 144
},
{
"epoch": 36.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.053145911544561386,
"eval_runtime": 4.1845,
"eval_samples_per_second": 14.1,
"eval_steps_per_second": 0.478,
"step": 148
},
{
"epoch": 37.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.06143573671579361,
"eval_runtime": 3.7811,
"eval_samples_per_second": 15.604,
"eval_steps_per_second": 0.529,
"step": 152
},
{
"epoch": 38.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.057755034416913986,
"eval_runtime": 4.2237,
"eval_samples_per_second": 13.969,
"eval_steps_per_second": 0.474,
"step": 156
},
{
"epoch": 39.94,
"learning_rate": 1.8518518518518518e-05,
"loss": 0.2754,
"step": 160
},
{
"epoch": 39.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.05201863497495651,
"eval_runtime": 3.7528,
"eval_samples_per_second": 15.722,
"eval_steps_per_second": 0.533,
"step": 160
},
{
"epoch": 40.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.05365251377224922,
"eval_runtime": 3.7906,
"eval_samples_per_second": 15.565,
"eval_steps_per_second": 0.528,
"step": 164
},
{
"epoch": 41.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.04466838762164116,
"eval_runtime": 4.0883,
"eval_samples_per_second": 14.432,
"eval_steps_per_second": 0.489,
"step": 168
},
{
"epoch": 42.94,
"eval_accuracy": 1.0,
"eval_loss": 0.028991766273975372,
"eval_runtime": 3.7894,
"eval_samples_per_second": 15.57,
"eval_steps_per_second": 0.528,
"step": 172
},
{
"epoch": 43.94,
"eval_accuracy": 1.0,
"eval_loss": 0.029105449095368385,
"eval_runtime": 4.1829,
"eval_samples_per_second": 14.105,
"eval_steps_per_second": 0.478,
"step": 176
},
{
"epoch": 44.94,
"learning_rate": 1.388888888888889e-05,
"loss": 0.269,
"step": 180
},
{
"epoch": 44.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03256472200155258,
"eval_runtime": 3.7585,
"eval_samples_per_second": 15.698,
"eval_steps_per_second": 0.532,
"step": 180
},
{
"epoch": 45.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03297417610883713,
"eval_runtime": 4.155,
"eval_samples_per_second": 14.2,
"eval_steps_per_second": 0.481,
"step": 184
},
{
"epoch": 46.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.034774668514728546,
"eval_runtime": 3.7675,
"eval_samples_per_second": 15.66,
"eval_steps_per_second": 0.531,
"step": 188
},
{
"epoch": 47.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03467889130115509,
"eval_runtime": 4.0766,
"eval_samples_per_second": 14.473,
"eval_steps_per_second": 0.491,
"step": 192
},
{
"epoch": 48.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03474270924925804,
"eval_runtime": 3.7643,
"eval_samples_per_second": 15.674,
"eval_steps_per_second": 0.531,
"step": 196
},
{
"epoch": 49.94,
"learning_rate": 9.259259259259259e-06,
"loss": 0.2615,
"step": 200
},
{
"epoch": 49.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.04243284463882446,
"eval_runtime": 4.0985,
"eval_samples_per_second": 14.395,
"eval_steps_per_second": 0.488,
"step": 200
},
{
"epoch": 50.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.04514499008655548,
"eval_runtime": 3.9491,
"eval_samples_per_second": 14.94,
"eval_steps_per_second": 0.506,
"step": 204
},
{
"epoch": 51.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.043262287974357605,
"eval_runtime": 3.6957,
"eval_samples_per_second": 15.964,
"eval_steps_per_second": 0.541,
"step": 208
},
{
"epoch": 52.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.035157691687345505,
"eval_runtime": 4.172,
"eval_samples_per_second": 14.142,
"eval_steps_per_second": 0.479,
"step": 212
},
{
"epoch": 53.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03394060581922531,
"eval_runtime": 3.7213,
"eval_samples_per_second": 15.855,
"eval_steps_per_second": 0.537,
"step": 216
},
{
"epoch": 54.94,
"learning_rate": 4.6296296296296296e-06,
"loss": 0.2386,
"step": 220
},
{
"epoch": 54.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03394594043493271,
"eval_runtime": 4.1524,
"eval_samples_per_second": 14.208,
"eval_steps_per_second": 0.482,
"step": 220
},
{
"epoch": 55.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03388730436563492,
"eval_runtime": 3.719,
"eval_samples_per_second": 15.864,
"eval_steps_per_second": 0.538,
"step": 224
},
{
"epoch": 56.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.034843575209379196,
"eval_runtime": 4.1514,
"eval_samples_per_second": 14.212,
"eval_steps_per_second": 0.482,
"step": 228
},
{
"epoch": 57.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03663792461156845,
"eval_runtime": 3.7689,
"eval_samples_per_second": 15.654,
"eval_steps_per_second": 0.531,
"step": 232
},
{
"epoch": 58.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03743705153465271,
"eval_runtime": 4.1165,
"eval_samples_per_second": 14.333,
"eval_steps_per_second": 0.486,
"step": 236
},
{
"epoch": 59.94,
"learning_rate": 0.0,
"loss": 0.2362,
"step": 240
},
{
"epoch": 59.94,
"eval_accuracy": 0.9830508474576272,
"eval_loss": 0.03746996819972992,
"eval_runtime": 3.7404,
"eval_samples_per_second": 15.774,
"eval_steps_per_second": 0.535,
"step": 240
},
{
"epoch": 59.94,
"step": 240,
"total_flos": 7.88616702456404e+17,
"train_loss": 0.4937874893347422,
"train_runtime": 3820.3512,
"train_samples_per_second": 8.308,
"train_steps_per_second": 0.063
}
],
"max_steps": 240,
"num_train_epochs": 60,
"total_flos": 7.88616702456404e+17,
"trial_name": null,
"trial_params": null
}