delivery_truck_classification / trainer_state.json
JEdward7777's picture
End of training
9f4ff4f
raw
history blame
16.7 kB
{
"best_metric": 0.9846153846153847,
"best_model_checkpoint": "delivery_truck_classification/checkpoint-104",
"epoch": 59.8421052631579,
"global_step": 240,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.84,
"eval_accuracy": 0.3230769230769231,
"eval_loss": 1.819914698600769,
"eval_runtime": 4.4893,
"eval_samples_per_second": 14.479,
"eval_steps_per_second": 0.668,
"step": 4
},
{
"epoch": 1.84,
"eval_accuracy": 0.4153846153846154,
"eval_loss": 1.7274595499038696,
"eval_runtime": 5.1038,
"eval_samples_per_second": 12.736,
"eval_steps_per_second": 0.588,
"step": 8
},
{
"epoch": 2.84,
"eval_accuracy": 0.46153846153846156,
"eval_loss": 1.628129005432129,
"eval_runtime": 4.4017,
"eval_samples_per_second": 14.767,
"eval_steps_per_second": 0.682,
"step": 12
},
{
"epoch": 3.84,
"eval_accuracy": 0.46153846153846156,
"eval_loss": 1.5271515846252441,
"eval_runtime": 4.7528,
"eval_samples_per_second": 13.676,
"eval_steps_per_second": 0.631,
"step": 16
},
{
"epoch": 4.84,
"learning_rate": 4.166666666666667e-05,
"loss": 1.9537,
"step": 20
},
{
"epoch": 4.84,
"eval_accuracy": 0.5076923076923077,
"eval_loss": 1.3667770624160767,
"eval_runtime": 4.3866,
"eval_samples_per_second": 14.818,
"eval_steps_per_second": 0.684,
"step": 20
},
{
"epoch": 5.84,
"eval_accuracy": 0.6,
"eval_loss": 1.0963521003723145,
"eval_runtime": 4.7064,
"eval_samples_per_second": 13.811,
"eval_steps_per_second": 0.637,
"step": 24
},
{
"epoch": 6.84,
"eval_accuracy": 0.7846153846153846,
"eval_loss": 0.7691364884376526,
"eval_runtime": 4.2153,
"eval_samples_per_second": 15.42,
"eval_steps_per_second": 0.712,
"step": 28
},
{
"epoch": 7.84,
"eval_accuracy": 0.8307692307692308,
"eval_loss": 0.6369762420654297,
"eval_runtime": 4.7258,
"eval_samples_per_second": 13.754,
"eval_steps_per_second": 0.635,
"step": 32
},
{
"epoch": 8.84,
"eval_accuracy": 0.9076923076923077,
"eval_loss": 0.4328678548336029,
"eval_runtime": 4.7157,
"eval_samples_per_second": 13.784,
"eval_steps_per_second": 0.636,
"step": 36
},
{
"epoch": 9.84,
"learning_rate": 4.62962962962963e-05,
"loss": 1.0682,
"step": 40
},
{
"epoch": 9.84,
"eval_accuracy": 0.9076923076923077,
"eval_loss": 0.3517535626888275,
"eval_runtime": 4.7127,
"eval_samples_per_second": 13.792,
"eval_steps_per_second": 0.637,
"step": 40
},
{
"epoch": 10.84,
"eval_accuracy": 0.8923076923076924,
"eval_loss": 0.3229323625564575,
"eval_runtime": 4.2434,
"eval_samples_per_second": 15.318,
"eval_steps_per_second": 0.707,
"step": 44
},
{
"epoch": 11.84,
"eval_accuracy": 0.9384615384615385,
"eval_loss": 0.2324085831642151,
"eval_runtime": 4.734,
"eval_samples_per_second": 13.731,
"eval_steps_per_second": 0.634,
"step": 48
},
{
"epoch": 12.84,
"eval_accuracy": 0.9384615384615385,
"eval_loss": 0.23686641454696655,
"eval_runtime": 4.3354,
"eval_samples_per_second": 14.993,
"eval_steps_per_second": 0.692,
"step": 52
},
{
"epoch": 13.84,
"eval_accuracy": 0.9384615384615385,
"eval_loss": 0.21190524101257324,
"eval_runtime": 4.793,
"eval_samples_per_second": 13.561,
"eval_steps_per_second": 0.626,
"step": 56
},
{
"epoch": 14.84,
"learning_rate": 4.166666666666667e-05,
"loss": 0.6335,
"step": 60
},
{
"epoch": 14.84,
"eval_accuracy": 0.9384615384615385,
"eval_loss": 0.18046662211418152,
"eval_runtime": 4.2602,
"eval_samples_per_second": 15.257,
"eval_steps_per_second": 0.704,
"step": 60
},
{
"epoch": 15.84,
"eval_accuracy": 0.9076923076923077,
"eval_loss": 0.21350829303264618,
"eval_runtime": 4.7427,
"eval_samples_per_second": 13.705,
"eval_steps_per_second": 0.633,
"step": 64
},
{
"epoch": 16.84,
"eval_accuracy": 0.9230769230769231,
"eval_loss": 0.1889328807592392,
"eval_runtime": 4.2616,
"eval_samples_per_second": 15.253,
"eval_steps_per_second": 0.704,
"step": 68
},
{
"epoch": 17.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.16009008884429932,
"eval_runtime": 4.7629,
"eval_samples_per_second": 13.647,
"eval_steps_per_second": 0.63,
"step": 72
},
{
"epoch": 18.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.14124387502670288,
"eval_runtime": 4.3251,
"eval_samples_per_second": 15.029,
"eval_steps_per_second": 0.694,
"step": 76
},
{
"epoch": 19.84,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.5133,
"step": 80
},
{
"epoch": 19.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.14968368411064148,
"eval_runtime": 4.7085,
"eval_samples_per_second": 13.805,
"eval_steps_per_second": 0.637,
"step": 80
},
{
"epoch": 20.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.15449711680412292,
"eval_runtime": 4.2803,
"eval_samples_per_second": 15.186,
"eval_steps_per_second": 0.701,
"step": 84
},
{
"epoch": 21.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.12975920736789703,
"eval_runtime": 6.2107,
"eval_samples_per_second": 10.466,
"eval_steps_per_second": 0.483,
"step": 88
},
{
"epoch": 22.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.14153267443180084,
"eval_runtime": 4.2538,
"eval_samples_per_second": 15.28,
"eval_steps_per_second": 0.705,
"step": 92
},
{
"epoch": 23.84,
"eval_accuracy": 0.9230769230769231,
"eval_loss": 0.16845214366912842,
"eval_runtime": 4.6805,
"eval_samples_per_second": 13.888,
"eval_steps_per_second": 0.641,
"step": 96
},
{
"epoch": 24.84,
"learning_rate": 3.240740740740741e-05,
"loss": 0.4383,
"step": 100
},
{
"epoch": 24.84,
"eval_accuracy": 0.9384615384615385,
"eval_loss": 0.13808518648147583,
"eval_runtime": 4.2829,
"eval_samples_per_second": 15.177,
"eval_steps_per_second": 0.7,
"step": 100
},
{
"epoch": 25.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.1295621246099472,
"eval_runtime": 4.717,
"eval_samples_per_second": 13.78,
"eval_steps_per_second": 0.636,
"step": 104
},
{
"epoch": 26.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.1106828972697258,
"eval_runtime": 4.4246,
"eval_samples_per_second": 14.691,
"eval_steps_per_second": 0.678,
"step": 108
},
{
"epoch": 27.84,
"eval_accuracy": 0.9384615384615385,
"eval_loss": 0.12369797378778458,
"eval_runtime": 4.7653,
"eval_samples_per_second": 13.64,
"eval_steps_per_second": 0.63,
"step": 112
},
{
"epoch": 28.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.1366400122642517,
"eval_runtime": 4.3203,
"eval_samples_per_second": 15.045,
"eval_steps_per_second": 0.694,
"step": 116
},
{
"epoch": 29.84,
"learning_rate": 2.777777777777778e-05,
"loss": 0.4149,
"step": 120
},
{
"epoch": 29.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.13494354486465454,
"eval_runtime": 4.6686,
"eval_samples_per_second": 13.923,
"eval_steps_per_second": 0.643,
"step": 120
},
{
"epoch": 30.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.10458508133888245,
"eval_runtime": 4.2843,
"eval_samples_per_second": 15.172,
"eval_steps_per_second": 0.7,
"step": 124
},
{
"epoch": 31.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.0881725624203682,
"eval_runtime": 4.7053,
"eval_samples_per_second": 13.814,
"eval_steps_per_second": 0.638,
"step": 128
},
{
"epoch": 32.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.10219049453735352,
"eval_runtime": 4.3211,
"eval_samples_per_second": 15.042,
"eval_steps_per_second": 0.694,
"step": 132
},
{
"epoch": 33.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.12066025286912918,
"eval_runtime": 4.8023,
"eval_samples_per_second": 13.535,
"eval_steps_per_second": 0.625,
"step": 136
},
{
"epoch": 34.84,
"learning_rate": 2.314814814814815e-05,
"loss": 0.3657,
"step": 140
},
{
"epoch": 34.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.11678420007228851,
"eval_runtime": 4.4027,
"eval_samples_per_second": 14.764,
"eval_steps_per_second": 0.681,
"step": 140
},
{
"epoch": 35.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.09219826757907867,
"eval_runtime": 6.9593,
"eval_samples_per_second": 9.34,
"eval_steps_per_second": 0.431,
"step": 144
},
{
"epoch": 36.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.09314019978046417,
"eval_runtime": 4.3,
"eval_samples_per_second": 15.116,
"eval_steps_per_second": 0.698,
"step": 148
},
{
"epoch": 37.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.10055378824472427,
"eval_runtime": 4.7227,
"eval_samples_per_second": 13.763,
"eval_steps_per_second": 0.635,
"step": 152
},
{
"epoch": 38.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.09866410493850708,
"eval_runtime": 4.3725,
"eval_samples_per_second": 14.866,
"eval_steps_per_second": 0.686,
"step": 156
},
{
"epoch": 39.84,
"learning_rate": 1.8518518518518518e-05,
"loss": 0.3294,
"step": 160
},
{
"epoch": 39.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.11275947839021683,
"eval_runtime": 4.6903,
"eval_samples_per_second": 13.858,
"eval_steps_per_second": 0.64,
"step": 160
},
{
"epoch": 40.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.11520560085773468,
"eval_runtime": 4.3303,
"eval_samples_per_second": 15.01,
"eval_steps_per_second": 0.693,
"step": 164
},
{
"epoch": 41.84,
"eval_accuracy": 0.9538461538461539,
"eval_loss": 0.09974207729101181,
"eval_runtime": 4.7259,
"eval_samples_per_second": 13.754,
"eval_steps_per_second": 0.635,
"step": 168
},
{
"epoch": 42.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.09684933722019196,
"eval_runtime": 4.3525,
"eval_samples_per_second": 14.934,
"eval_steps_per_second": 0.689,
"step": 172
},
{
"epoch": 43.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.08187751471996307,
"eval_runtime": 4.6538,
"eval_samples_per_second": 13.967,
"eval_steps_per_second": 0.645,
"step": 176
},
{
"epoch": 44.84,
"learning_rate": 1.388888888888889e-05,
"loss": 0.3198,
"step": 180
},
{
"epoch": 44.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.07292691618204117,
"eval_runtime": 4.3483,
"eval_samples_per_second": 14.948,
"eval_steps_per_second": 0.69,
"step": 180
},
{
"epoch": 45.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.07438476383686066,
"eval_runtime": 4.8323,
"eval_samples_per_second": 13.451,
"eval_steps_per_second": 0.621,
"step": 184
},
{
"epoch": 46.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.09510225057601929,
"eval_runtime": 4.3498,
"eval_samples_per_second": 14.943,
"eval_steps_per_second": 0.69,
"step": 188
},
{
"epoch": 47.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.09657642990350723,
"eval_runtime": 4.7293,
"eval_samples_per_second": 13.744,
"eval_steps_per_second": 0.634,
"step": 192
},
{
"epoch": 48.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.08329986035823822,
"eval_runtime": 4.2989,
"eval_samples_per_second": 15.12,
"eval_steps_per_second": 0.698,
"step": 196
},
{
"epoch": 49.84,
"learning_rate": 9.259259259259259e-06,
"loss": 0.2936,
"step": 200
},
{
"epoch": 49.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.06941184401512146,
"eval_runtime": 4.7066,
"eval_samples_per_second": 13.811,
"eval_steps_per_second": 0.637,
"step": 200
},
{
"epoch": 50.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.06908843666315079,
"eval_runtime": 4.3338,
"eval_samples_per_second": 14.999,
"eval_steps_per_second": 0.692,
"step": 204
},
{
"epoch": 51.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.0735919326543808,
"eval_runtime": 4.7155,
"eval_samples_per_second": 13.784,
"eval_steps_per_second": 0.636,
"step": 208
},
{
"epoch": 52.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.08048100024461746,
"eval_runtime": 4.337,
"eval_samples_per_second": 14.987,
"eval_steps_per_second": 0.692,
"step": 212
},
{
"epoch": 53.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.08007017523050308,
"eval_runtime": 4.765,
"eval_samples_per_second": 13.641,
"eval_steps_per_second": 0.63,
"step": 216
},
{
"epoch": 54.84,
"learning_rate": 4.6296296296296296e-06,
"loss": 0.3127,
"step": 220
},
{
"epoch": 54.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.0826273187994957,
"eval_runtime": 4.2934,
"eval_samples_per_second": 15.139,
"eval_steps_per_second": 0.699,
"step": 220
},
{
"epoch": 55.84,
"eval_accuracy": 0.9692307692307692,
"eval_loss": 0.08565446734428406,
"eval_runtime": 4.7099,
"eval_samples_per_second": 13.801,
"eval_steps_per_second": 0.637,
"step": 224
},
{
"epoch": 56.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.0864274650812149,
"eval_runtime": 4.246,
"eval_samples_per_second": 15.309,
"eval_steps_per_second": 0.707,
"step": 228
},
{
"epoch": 57.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.08776658028364182,
"eval_runtime": 4.758,
"eval_samples_per_second": 13.661,
"eval_steps_per_second": 0.631,
"step": 232
},
{
"epoch": 58.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.08772400766611099,
"eval_runtime": 4.2874,
"eval_samples_per_second": 15.161,
"eval_steps_per_second": 0.7,
"step": 236
},
{
"epoch": 59.84,
"learning_rate": 0.0,
"loss": 0.285,
"step": 240
},
{
"epoch": 59.84,
"eval_accuracy": 0.9846153846153847,
"eval_loss": 0.08735792338848114,
"eval_runtime": 4.7501,
"eval_samples_per_second": 13.684,
"eval_steps_per_second": 0.632,
"step": 240
},
{
"epoch": 59.84,
"step": 240,
"total_flos": 8.648855308501955e+17,
"train_loss": 0.577343902985255,
"train_runtime": 4213.9216,
"train_samples_per_second": 8.273,
"train_steps_per_second": 0.057
}
],
"max_steps": 240,
"num_train_epochs": 60,
"total_flos": 8.648855308501955e+17,
"trial_name": null,
"trial_params": null
}