delivery_truck_classification / trainer_state.json
JEdward7777's picture
End of training
78b618f
raw
history blame
16.1 kB
{
"best_metric": 0.96875,
"best_model_checkpoint": "delivery_truck_classification/checkpoint-52",
"epoch": 59.888888888888886,
"global_step": 240,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.89,
"eval_accuracy": 0.15625,
"eval_loss": 2.007406234741211,
"eval_runtime": 4.1284,
"eval_samples_per_second": 15.502,
"eval_steps_per_second": 0.484,
"step": 4
},
{
"epoch": 1.89,
"eval_accuracy": 0.25,
"eval_loss": 1.8895925283432007,
"eval_runtime": 4.9483,
"eval_samples_per_second": 12.934,
"eval_steps_per_second": 0.404,
"step": 8
},
{
"epoch": 2.89,
"eval_accuracy": 0.40625,
"eval_loss": 1.7421282529830933,
"eval_runtime": 4.1039,
"eval_samples_per_second": 15.595,
"eval_steps_per_second": 0.487,
"step": 12
},
{
"epoch": 3.89,
"eval_accuracy": 0.4375,
"eval_loss": 1.5891958475112915,
"eval_runtime": 4.5489,
"eval_samples_per_second": 14.069,
"eval_steps_per_second": 0.44,
"step": 16
},
{
"epoch": 4.89,
"learning_rate": 4.166666666666667e-05,
"loss": 1.973,
"step": 20
},
{
"epoch": 4.89,
"eval_accuracy": 0.609375,
"eval_loss": 1.362261176109314,
"eval_runtime": 4.1743,
"eval_samples_per_second": 15.332,
"eval_steps_per_second": 0.479,
"step": 20
},
{
"epoch": 5.89,
"eval_accuracy": 0.609375,
"eval_loss": 1.1093113422393799,
"eval_runtime": 4.4702,
"eval_samples_per_second": 14.317,
"eval_steps_per_second": 0.447,
"step": 24
},
{
"epoch": 6.89,
"eval_accuracy": 0.78125,
"eval_loss": 0.7900974154472351,
"eval_runtime": 4.1973,
"eval_samples_per_second": 15.248,
"eval_steps_per_second": 0.476,
"step": 28
},
{
"epoch": 7.89,
"eval_accuracy": 0.84375,
"eval_loss": 0.5773038268089294,
"eval_runtime": 4.6009,
"eval_samples_per_second": 13.91,
"eval_steps_per_second": 0.435,
"step": 32
},
{
"epoch": 8.89,
"eval_accuracy": 0.890625,
"eval_loss": 0.38568082451820374,
"eval_runtime": 4.1614,
"eval_samples_per_second": 15.379,
"eval_steps_per_second": 0.481,
"step": 36
},
{
"epoch": 9.89,
"learning_rate": 4.62962962962963e-05,
"loss": 1.0433,
"step": 40
},
{
"epoch": 9.89,
"eval_accuracy": 0.90625,
"eval_loss": 0.32543647289276123,
"eval_runtime": 4.5756,
"eval_samples_per_second": 13.987,
"eval_steps_per_second": 0.437,
"step": 40
},
{
"epoch": 10.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.2461281269788742,
"eval_runtime": 4.2012,
"eval_samples_per_second": 15.234,
"eval_steps_per_second": 0.476,
"step": 44
},
{
"epoch": 11.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.2339743673801422,
"eval_runtime": 4.5321,
"eval_samples_per_second": 14.121,
"eval_steps_per_second": 0.441,
"step": 48
},
{
"epoch": 12.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.18353550136089325,
"eval_runtime": 4.3055,
"eval_samples_per_second": 14.865,
"eval_steps_per_second": 0.465,
"step": 52
},
{
"epoch": 13.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.17793762683868408,
"eval_runtime": 4.4643,
"eval_samples_per_second": 14.336,
"eval_steps_per_second": 0.448,
"step": 56
},
{
"epoch": 14.89,
"learning_rate": 4.166666666666667e-05,
"loss": 0.5842,
"step": 60
},
{
"epoch": 14.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.15445110201835632,
"eval_runtime": 4.1434,
"eval_samples_per_second": 15.446,
"eval_steps_per_second": 0.483,
"step": 60
},
{
"epoch": 15.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.14869830012321472,
"eval_runtime": 4.5456,
"eval_samples_per_second": 14.08,
"eval_steps_per_second": 0.44,
"step": 64
},
{
"epoch": 16.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.19956862926483154,
"eval_runtime": 4.0021,
"eval_samples_per_second": 15.992,
"eval_steps_per_second": 0.5,
"step": 68
},
{
"epoch": 17.89,
"eval_accuracy": 0.90625,
"eval_loss": 0.1619431972503662,
"eval_runtime": 4.478,
"eval_samples_per_second": 14.292,
"eval_steps_per_second": 0.447,
"step": 72
},
{
"epoch": 18.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.13495692610740662,
"eval_runtime": 4.1244,
"eval_samples_per_second": 15.517,
"eval_steps_per_second": 0.485,
"step": 76
},
{
"epoch": 19.89,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.4616,
"step": 80
},
{
"epoch": 19.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.17057114839553833,
"eval_runtime": 4.5586,
"eval_samples_per_second": 14.039,
"eval_steps_per_second": 0.439,
"step": 80
},
{
"epoch": 20.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.15793055295944214,
"eval_runtime": 4.126,
"eval_samples_per_second": 15.511,
"eval_steps_per_second": 0.485,
"step": 84
},
{
"epoch": 21.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.16296246647834778,
"eval_runtime": 4.5173,
"eval_samples_per_second": 14.168,
"eval_steps_per_second": 0.443,
"step": 88
},
{
"epoch": 22.89,
"eval_accuracy": 0.90625,
"eval_loss": 0.20802505314350128,
"eval_runtime": 4.0833,
"eval_samples_per_second": 15.674,
"eval_steps_per_second": 0.49,
"step": 92
},
{
"epoch": 23.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.14634451270103455,
"eval_runtime": 4.6059,
"eval_samples_per_second": 13.895,
"eval_steps_per_second": 0.434,
"step": 96
},
{
"epoch": 24.89,
"learning_rate": 3.240740740740741e-05,
"loss": 0.3898,
"step": 100
},
{
"epoch": 24.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.11846979707479477,
"eval_runtime": 4.1451,
"eval_samples_per_second": 15.44,
"eval_steps_per_second": 0.483,
"step": 100
},
{
"epoch": 25.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.14448919892311096,
"eval_runtime": 4.4782,
"eval_samples_per_second": 14.291,
"eval_steps_per_second": 0.447,
"step": 104
},
{
"epoch": 26.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.20514565706253052,
"eval_runtime": 4.0807,
"eval_samples_per_second": 15.683,
"eval_steps_per_second": 0.49,
"step": 108
},
{
"epoch": 27.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.19281229376792908,
"eval_runtime": 4.457,
"eval_samples_per_second": 14.36,
"eval_steps_per_second": 0.449,
"step": 112
},
{
"epoch": 28.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.13649864494800568,
"eval_runtime": 4.038,
"eval_samples_per_second": 15.849,
"eval_steps_per_second": 0.495,
"step": 116
},
{
"epoch": 29.89,
"learning_rate": 2.777777777777778e-05,
"loss": 0.3511,
"step": 120
},
{
"epoch": 29.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.10572843253612518,
"eval_runtime": 4.5443,
"eval_samples_per_second": 14.084,
"eval_steps_per_second": 0.44,
"step": 120
},
{
"epoch": 30.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.10910199582576752,
"eval_runtime": 4.2535,
"eval_samples_per_second": 15.046,
"eval_steps_per_second": 0.47,
"step": 124
},
{
"epoch": 31.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.1893911063671112,
"eval_runtime": 4.6955,
"eval_samples_per_second": 13.63,
"eval_steps_per_second": 0.426,
"step": 128
},
{
"epoch": 32.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.12075338512659073,
"eval_runtime": 4.1214,
"eval_samples_per_second": 15.529,
"eval_steps_per_second": 0.485,
"step": 132
},
{
"epoch": 33.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.11010686308145523,
"eval_runtime": 4.5267,
"eval_samples_per_second": 14.138,
"eval_steps_per_second": 0.442,
"step": 136
},
{
"epoch": 34.89,
"learning_rate": 2.314814814814815e-05,
"loss": 0.3286,
"step": 140
},
{
"epoch": 34.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.14093339443206787,
"eval_runtime": 4.119,
"eval_samples_per_second": 15.538,
"eval_steps_per_second": 0.486,
"step": 140
},
{
"epoch": 35.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.18304279446601868,
"eval_runtime": 4.4932,
"eval_samples_per_second": 14.244,
"eval_steps_per_second": 0.445,
"step": 144
},
{
"epoch": 36.89,
"eval_accuracy": 0.921875,
"eval_loss": 0.1518746018409729,
"eval_runtime": 4.1186,
"eval_samples_per_second": 15.539,
"eval_steps_per_second": 0.486,
"step": 148
},
{
"epoch": 37.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.10309180617332458,
"eval_runtime": 4.5179,
"eval_samples_per_second": 14.166,
"eval_steps_per_second": 0.443,
"step": 152
},
{
"epoch": 38.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.09621511399745941,
"eval_runtime": 4.2076,
"eval_samples_per_second": 15.211,
"eval_steps_per_second": 0.475,
"step": 156
},
{
"epoch": 39.89,
"learning_rate": 1.8518518518518518e-05,
"loss": 0.3095,
"step": 160
},
{
"epoch": 39.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.09031268954277039,
"eval_runtime": 4.5982,
"eval_samples_per_second": 13.919,
"eval_steps_per_second": 0.435,
"step": 160
},
{
"epoch": 40.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.08859497308731079,
"eval_runtime": 4.1937,
"eval_samples_per_second": 15.261,
"eval_steps_per_second": 0.477,
"step": 164
},
{
"epoch": 41.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.10331027209758759,
"eval_runtime": 4.5829,
"eval_samples_per_second": 13.965,
"eval_steps_per_second": 0.436,
"step": 168
},
{
"epoch": 42.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.11172451823949814,
"eval_runtime": 4.2291,
"eval_samples_per_second": 15.133,
"eval_steps_per_second": 0.473,
"step": 172
},
{
"epoch": 43.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.11921519041061401,
"eval_runtime": 4.595,
"eval_samples_per_second": 13.928,
"eval_steps_per_second": 0.435,
"step": 176
},
{
"epoch": 44.89,
"learning_rate": 1.388888888888889e-05,
"loss": 0.3056,
"step": 180
},
{
"epoch": 44.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.09840899705886841,
"eval_runtime": 4.2775,
"eval_samples_per_second": 14.962,
"eval_steps_per_second": 0.468,
"step": 180
},
{
"epoch": 45.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.08203314244747162,
"eval_runtime": 4.5543,
"eval_samples_per_second": 14.053,
"eval_steps_per_second": 0.439,
"step": 184
},
{
"epoch": 46.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.08574767410755157,
"eval_runtime": 4.1553,
"eval_samples_per_second": 15.402,
"eval_steps_per_second": 0.481,
"step": 188
},
{
"epoch": 47.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.10580457001924515,
"eval_runtime": 4.6204,
"eval_samples_per_second": 13.852,
"eval_steps_per_second": 0.433,
"step": 192
},
{
"epoch": 48.89,
"eval_accuracy": 0.9375,
"eval_loss": 0.11630271375179291,
"eval_runtime": 4.1519,
"eval_samples_per_second": 15.415,
"eval_steps_per_second": 0.482,
"step": 196
},
{
"epoch": 49.89,
"learning_rate": 9.259259259259259e-06,
"loss": 0.255,
"step": 200
},
{
"epoch": 49.89,
"eval_accuracy": 0.953125,
"eval_loss": 0.11214150488376617,
"eval_runtime": 4.4888,
"eval_samples_per_second": 14.258,
"eval_steps_per_second": 0.446,
"step": 200
},
{
"epoch": 50.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.10038581490516663,
"eval_runtime": 4.1624,
"eval_samples_per_second": 15.376,
"eval_steps_per_second": 0.48,
"step": 204
},
{
"epoch": 51.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.09537401050329208,
"eval_runtime": 4.5154,
"eval_samples_per_second": 14.174,
"eval_steps_per_second": 0.443,
"step": 208
},
{
"epoch": 52.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.0925481989979744,
"eval_runtime": 4.141,
"eval_samples_per_second": 15.455,
"eval_steps_per_second": 0.483,
"step": 212
},
{
"epoch": 53.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.08920943737030029,
"eval_runtime": 4.5736,
"eval_samples_per_second": 13.993,
"eval_steps_per_second": 0.437,
"step": 216
},
{
"epoch": 54.89,
"learning_rate": 4.6296296296296296e-06,
"loss": 0.2494,
"step": 220
},
{
"epoch": 54.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.08926128596067429,
"eval_runtime": 4.0979,
"eval_samples_per_second": 15.618,
"eval_steps_per_second": 0.488,
"step": 220
},
{
"epoch": 55.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.0900685042142868,
"eval_runtime": 4.5713,
"eval_samples_per_second": 14.001,
"eval_steps_per_second": 0.438,
"step": 224
},
{
"epoch": 56.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.08957040309906006,
"eval_runtime": 4.2031,
"eval_samples_per_second": 15.227,
"eval_steps_per_second": 0.476,
"step": 228
},
{
"epoch": 57.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.09029233455657959,
"eval_runtime": 4.5507,
"eval_samples_per_second": 14.064,
"eval_steps_per_second": 0.439,
"step": 232
},
{
"epoch": 58.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.09133943915367126,
"eval_runtime": 4.5211,
"eval_samples_per_second": 14.156,
"eval_steps_per_second": 0.442,
"step": 236
},
{
"epoch": 59.89,
"learning_rate": 0.0,
"loss": 0.2588,
"step": 240
},
{
"epoch": 59.89,
"eval_accuracy": 0.96875,
"eval_loss": 0.09184324741363525,
"eval_runtime": 4.5891,
"eval_samples_per_second": 13.946,
"eval_steps_per_second": 0.436,
"step": 240
},
{
"epoch": 59.89,
"step": 240,
"total_flos": 8.516851567051162e+17,
"train_loss": 0.5424989521503448,
"train_runtime": 4233.7913,
"train_samples_per_second": 8.106,
"train_steps_per_second": 0.057
}
],
"max_steps": 240,
"num_train_epochs": 60,
"total_flos": 8.516851567051162e+17,
"trial_name": null,
"trial_params": null
}