anirudhmu's picture
End of training
7a72c7b
{
"best_metric": 0.9525423728813559,
"best_model_checkpoint": "videomae-base-finetuned-soccer-action-recognitionx/checkpoint-733",
"epoch": 31.02843386627907,
"eval_steps": 500,
"global_step": 1376,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.03,
"eval_accuracy": 0.36610169491525424,
"eval_loss": 1.8151326179504395,
"eval_runtime": 140.7286,
"eval_samples_per_second": 2.096,
"eval_steps_per_second": 0.526,
"step": 43
},
{
"epoch": 1.03,
"learning_rate": 2.8985507246376814e-05,
"loss": 1.7589,
"step": 80
},
{
"epoch": 1.03,
"eval_accuracy": 0.6915254237288135,
"eval_loss": 0.9133387804031372,
"eval_runtime": 53.0805,
"eval_samples_per_second": 5.558,
"eval_steps_per_second": 1.394,
"step": 86
},
{
"epoch": 2.03,
"eval_accuracy": 0.7966101694915254,
"eval_loss": 0.502605676651001,
"eval_runtime": 51.9943,
"eval_samples_per_second": 5.674,
"eval_steps_per_second": 1.423,
"step": 129
},
{
"epoch": 3.02,
"learning_rate": 4.9111470113085624e-05,
"loss": 0.5494,
"step": 160
},
{
"epoch": 3.03,
"eval_accuracy": 0.8677966101694915,
"eval_loss": 0.3936995267868042,
"eval_runtime": 51.8695,
"eval_samples_per_second": 5.687,
"eval_steps_per_second": 1.427,
"step": 172
},
{
"epoch": 4.03,
"eval_accuracy": 0.8677966101694915,
"eval_loss": 0.3942561149597168,
"eval_runtime": 51.889,
"eval_samples_per_second": 5.685,
"eval_steps_per_second": 1.426,
"step": 215
},
{
"epoch": 5.02,
"learning_rate": 4.588045234248788e-05,
"loss": 0.2747,
"step": 240
},
{
"epoch": 5.03,
"eval_accuracy": 0.8677966101694915,
"eval_loss": 0.38759008049964905,
"eval_runtime": 51.6207,
"eval_samples_per_second": 5.715,
"eval_steps_per_second": 1.434,
"step": 258
},
{
"epoch": 6.03,
"eval_accuracy": 0.9084745762711864,
"eval_loss": 0.28025880455970764,
"eval_runtime": 51.769,
"eval_samples_per_second": 5.698,
"eval_steps_per_second": 1.429,
"step": 301
},
{
"epoch": 7.01,
"learning_rate": 4.264943457189014e-05,
"loss": 0.1731,
"step": 320
},
{
"epoch": 7.03,
"eval_accuracy": 0.911864406779661,
"eval_loss": 0.24141576886177063,
"eval_runtime": 51.5882,
"eval_samples_per_second": 5.718,
"eval_steps_per_second": 1.434,
"step": 345
},
{
"epoch": 8.03,
"eval_accuracy": 0.9288135593220339,
"eval_loss": 0.24339653551578522,
"eval_runtime": 52.5074,
"eval_samples_per_second": 5.618,
"eval_steps_per_second": 1.409,
"step": 388
},
{
"epoch": 9.01,
"learning_rate": 3.941841680129241e-05,
"loss": 0.1165,
"step": 400
},
{
"epoch": 9.03,
"eval_accuracy": 0.9457627118644067,
"eval_loss": 0.15595699846744537,
"eval_runtime": 51.5552,
"eval_samples_per_second": 5.722,
"eval_steps_per_second": 1.435,
"step": 431
},
{
"epoch": 10.03,
"eval_accuracy": 0.9254237288135593,
"eval_loss": 0.18938671052455902,
"eval_runtime": 51.3718,
"eval_samples_per_second": 5.742,
"eval_steps_per_second": 1.44,
"step": 474
},
{
"epoch": 11.0,
"learning_rate": 3.618739903069467e-05,
"loss": 0.07,
"step": 480
},
{
"epoch": 11.03,
"eval_accuracy": 0.9152542372881356,
"eval_loss": 0.2400982826948166,
"eval_runtime": 51.1883,
"eval_samples_per_second": 5.763,
"eval_steps_per_second": 1.446,
"step": 517
},
{
"epoch": 12.03,
"learning_rate": 3.295638126009693e-05,
"loss": 0.0417,
"step": 560
},
{
"epoch": 12.03,
"eval_accuracy": 0.9389830508474576,
"eval_loss": 0.18834476172924042,
"eval_runtime": 52.3816,
"eval_samples_per_second": 5.632,
"eval_steps_per_second": 1.413,
"step": 560
},
{
"epoch": 13.03,
"eval_accuracy": 0.9050847457627119,
"eval_loss": 0.2588905990123749,
"eval_runtime": 52.3591,
"eval_samples_per_second": 5.634,
"eval_steps_per_second": 1.413,
"step": 603
},
{
"epoch": 14.03,
"learning_rate": 2.9725363489499192e-05,
"loss": 0.0362,
"step": 640
},
{
"epoch": 14.03,
"eval_accuracy": 0.9491525423728814,
"eval_loss": 0.2125038504600525,
"eval_runtime": 52.038,
"eval_samples_per_second": 5.669,
"eval_steps_per_second": 1.422,
"step": 646
},
{
"epoch": 15.03,
"eval_accuracy": 0.9389830508474576,
"eval_loss": 0.22276653349399567,
"eval_runtime": 52.1385,
"eval_samples_per_second": 5.658,
"eval_steps_per_second": 1.419,
"step": 690
},
{
"epoch": 16.02,
"learning_rate": 2.6494345718901455e-05,
"loss": 0.0348,
"step": 720
},
{
"epoch": 16.03,
"eval_accuracy": 0.9525423728813559,
"eval_loss": 0.1796749383211136,
"eval_runtime": 51.9086,
"eval_samples_per_second": 5.683,
"eval_steps_per_second": 1.426,
"step": 733
},
{
"epoch": 17.03,
"eval_accuracy": 0.9389830508474576,
"eval_loss": 0.17283643782138824,
"eval_runtime": 54.9977,
"eval_samples_per_second": 5.364,
"eval_steps_per_second": 1.346,
"step": 776
},
{
"epoch": 18.02,
"learning_rate": 2.3263327948303717e-05,
"loss": 0.0129,
"step": 800
},
{
"epoch": 18.03,
"eval_accuracy": 0.9254237288135593,
"eval_loss": 0.22526715695858002,
"eval_runtime": 50.2328,
"eval_samples_per_second": 5.873,
"eval_steps_per_second": 1.473,
"step": 819
},
{
"epoch": 19.03,
"eval_accuracy": 0.9355932203389831,
"eval_loss": 0.1983296275138855,
"eval_runtime": 51.3454,
"eval_samples_per_second": 5.745,
"eval_steps_per_second": 1.441,
"step": 862
},
{
"epoch": 20.01,
"learning_rate": 2.003231017770598e-05,
"loss": 0.0112,
"step": 880
},
{
"epoch": 20.03,
"eval_accuracy": 0.9220338983050848,
"eval_loss": 0.28206783533096313,
"eval_runtime": 51.8364,
"eval_samples_per_second": 5.691,
"eval_steps_per_second": 1.428,
"step": 905
},
{
"epoch": 21.03,
"eval_accuracy": 0.9355932203389831,
"eval_loss": 0.2527361810207367,
"eval_runtime": 51.2851,
"eval_samples_per_second": 5.752,
"eval_steps_per_second": 1.443,
"step": 948
},
{
"epoch": 22.01,
"learning_rate": 1.6801292407108242e-05,
"loss": 0.0165,
"step": 960
},
{
"epoch": 22.03,
"eval_accuracy": 0.9288135593220339,
"eval_loss": 0.2598176896572113,
"eval_runtime": 51.1087,
"eval_samples_per_second": 5.772,
"eval_steps_per_second": 1.448,
"step": 991
},
{
"epoch": 23.03,
"eval_accuracy": 0.9288135593220339,
"eval_loss": 0.2689870595932007,
"eval_runtime": 52.0484,
"eval_samples_per_second": 5.668,
"eval_steps_per_second": 1.422,
"step": 1035
},
{
"epoch": 24.0,
"learning_rate": 1.3570274636510503e-05,
"loss": 0.0056,
"step": 1040
},
{
"epoch": 24.03,
"eval_accuracy": 0.9220338983050848,
"eval_loss": 0.2817440629005432,
"eval_runtime": 50.9874,
"eval_samples_per_second": 5.786,
"eval_steps_per_second": 1.451,
"step": 1078
},
{
"epoch": 25.03,
"learning_rate": 1.0339256865912764e-05,
"loss": 0.0026,
"step": 1120
},
{
"epoch": 25.03,
"eval_accuracy": 0.9423728813559322,
"eval_loss": 0.2038636952638626,
"eval_runtime": 51.3576,
"eval_samples_per_second": 5.744,
"eval_steps_per_second": 1.441,
"step": 1121
},
{
"epoch": 26.03,
"eval_accuracy": 0.9457627118644067,
"eval_loss": 0.21635624766349792,
"eval_runtime": 50.2612,
"eval_samples_per_second": 5.869,
"eval_steps_per_second": 1.472,
"step": 1164
},
{
"epoch": 27.03,
"learning_rate": 7.108239095315025e-06,
"loss": 0.0033,
"step": 1200
},
{
"epoch": 27.03,
"eval_accuracy": 0.9423728813559322,
"eval_loss": 0.20629702508449554,
"eval_runtime": 52.4013,
"eval_samples_per_second": 5.63,
"eval_steps_per_second": 1.412,
"step": 1207
},
{
"epoch": 28.03,
"eval_accuracy": 0.9525423728813559,
"eval_loss": 0.18356993794441223,
"eval_runtime": 51.9433,
"eval_samples_per_second": 5.679,
"eval_steps_per_second": 1.425,
"step": 1250
},
{
"epoch": 29.02,
"learning_rate": 3.877221324717286e-06,
"loss": 0.0038,
"step": 1280
},
{
"epoch": 29.03,
"eval_accuracy": 0.9457627118644067,
"eval_loss": 0.1899212896823883,
"eval_runtime": 50.6974,
"eval_samples_per_second": 5.819,
"eval_steps_per_second": 1.46,
"step": 1293
},
{
"epoch": 30.03,
"eval_accuracy": 0.9491525423728814,
"eval_loss": 0.18148240447044373,
"eval_runtime": 51.0875,
"eval_samples_per_second": 5.774,
"eval_steps_per_second": 1.448,
"step": 1336
},
{
"epoch": 31.02,
"learning_rate": 6.462035541195477e-07,
"loss": 0.0024,
"step": 1360
},
{
"epoch": 31.03,
"eval_accuracy": 0.9525423728813559,
"eval_loss": 0.1816376894712448,
"eval_runtime": 51.6789,
"eval_samples_per_second": 5.708,
"eval_steps_per_second": 1.432,
"step": 1376
},
{
"epoch": 31.03,
"step": 1376,
"total_flos": 5.4792880339785155e+19,
"train_loss": 0.18103733560920499,
"train_runtime": 13691.8843,
"train_samples_per_second": 3.216,
"train_steps_per_second": 0.1
},
{
"epoch": 31.03,
"eval_accuracy": 0.9281045751633987,
"eval_loss": 0.25746384263038635,
"eval_runtime": 158.37,
"eval_samples_per_second": 1.932,
"eval_steps_per_second": 0.486,
"step": 1376
},
{
"epoch": 31.03,
"eval_accuracy": 0.9281045751633987,
"eval_loss": 0.25746384263038635,
"eval_runtime": 53.448,
"eval_samples_per_second": 5.725,
"eval_steps_per_second": 1.441,
"step": 1376
}
],
"logging_steps": 80,
"max_steps": 1376,
"num_train_epochs": 9223372036854775807,
"save_steps": 500,
"total_flos": 5.4792880339785155e+19,
"trial_name": null,
"trial_params": null
}