elpv-vit / trainer_state.json
mjphayes's picture
mjphayes/vit-elpv-augmented
52b3af7
{
"best_metric": 0.733502538071066,
"best_model_checkpoint": "../results/elpv-vit/checkpoint-828",
"epoch": 14.0,
"eval_steps": 500,
"global_step": 966,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.5786802030456852,
"eval_loss": 1.1146228313446045,
"eval_runtime": 15.1595,
"eval_samples_per_second": 25.99,
"eval_steps_per_second": 1.649,
"step": 69
},
{
"epoch": 2.0,
"eval_accuracy": 0.5786802030456852,
"eval_loss": 0.9812496304512024,
"eval_runtime": 4.4653,
"eval_samples_per_second": 88.237,
"eval_steps_per_second": 5.599,
"step": 138
},
{
"epoch": 3.0,
"eval_accuracy": 0.6472081218274112,
"eval_loss": 0.8884502053260803,
"eval_runtime": 2.1388,
"eval_samples_per_second": 184.219,
"eval_steps_per_second": 11.689,
"step": 207
},
{
"epoch": 4.0,
"eval_accuracy": 0.7081218274111675,
"eval_loss": 0.7930060625076294,
"eval_runtime": 2.1153,
"eval_samples_per_second": 186.265,
"eval_steps_per_second": 11.819,
"step": 276
},
{
"epoch": 5.0,
"eval_accuracy": 0.6928934010152284,
"eval_loss": 0.8019062280654907,
"eval_runtime": 7.7818,
"eval_samples_per_second": 50.631,
"eval_steps_per_second": 3.213,
"step": 345
},
{
"epoch": 6.0,
"eval_accuracy": 0.6878172588832487,
"eval_loss": 0.8009192943572998,
"eval_runtime": 2.0611,
"eval_samples_per_second": 191.162,
"eval_steps_per_second": 12.13,
"step": 414
},
{
"epoch": 7.0,
"eval_accuracy": 0.6852791878172588,
"eval_loss": 0.7984281182289124,
"eval_runtime": 12.8592,
"eval_samples_per_second": 30.639,
"eval_steps_per_second": 1.944,
"step": 483
},
{
"epoch": 7.25,
"learning_rate": 2.6812428078250863e-05,
"loss": 0.8194,
"step": 500
},
{
"epoch": 8.0,
"eval_accuracy": 0.7106598984771574,
"eval_loss": 0.7714311480522156,
"eval_runtime": 2.123,
"eval_samples_per_second": 185.586,
"eval_steps_per_second": 11.776,
"step": 552
},
{
"epoch": 9.0,
"eval_accuracy": 0.7081218274111675,
"eval_loss": 0.7666618824005127,
"eval_runtime": 2.021,
"eval_samples_per_second": 194.952,
"eval_steps_per_second": 12.37,
"step": 621
},
{
"epoch": 10.0,
"eval_accuracy": 0.7233502538071066,
"eval_loss": 0.7302789688110352,
"eval_runtime": 14.4927,
"eval_samples_per_second": 27.186,
"eval_steps_per_second": 1.725,
"step": 690
},
{
"epoch": 11.0,
"eval_accuracy": 0.7284263959390863,
"eval_loss": 0.7321494817733765,
"eval_runtime": 2.2455,
"eval_samples_per_second": 175.465,
"eval_steps_per_second": 11.134,
"step": 759
},
{
"epoch": 12.0,
"eval_accuracy": 0.733502538071066,
"eval_loss": 0.7373437285423279,
"eval_runtime": 5.5421,
"eval_samples_per_second": 71.092,
"eval_steps_per_second": 4.511,
"step": 828
},
{
"epoch": 13.0,
"eval_accuracy": 0.6903553299492385,
"eval_loss": 0.8051439523696899,
"eval_runtime": 12.7177,
"eval_samples_per_second": 30.98,
"eval_steps_per_second": 1.966,
"step": 897
},
{
"epoch": 14.0,
"eval_accuracy": 0.7258883248730964,
"eval_loss": 0.7687421441078186,
"eval_runtime": 4.2192,
"eval_samples_per_second": 93.382,
"eval_steps_per_second": 5.925,
"step": 966
},
{
"epoch": 14.0,
"step": 966,
"total_flos": 4.790950643943604e+18,
"train_loss": 0.63200661163646,
"train_runtime": 1457.5958,
"train_samples_per_second": 42.415,
"train_steps_per_second": 0.663
}
],
"logging_steps": 500,
"max_steps": 966,
"num_train_epochs": 14,
"save_steps": 500,
"total_flos": 4.790950643943604e+18,
"trial_name": null,
"trial_params": null
}