djbp's picture
End of training
25f05a6 verified
raw
history blame
6.21 kB
{
"best_metric": 0.6666666666666666,
"best_model_checkpoint": "swin-base-patch4-window7-224-in22k-cons_Classification_base_V10/checkpoint-2",
"epoch": 7.0,
"eval_steps": 500,
"global_step": 7,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"step": 1,
"train_accuracy": 0.6,
"train_auc_class_0": 0.36,
"train_auc_class_1": 0.8,
"train_auc_class_2": 0.8400000000000001,
"train_auc_overall": 0.6666666666666666,
"train_loss": 0.9687549471855164,
"train_runtime": 1.665,
"train_samples_per_second": 9.009,
"train_steps_per_second": 0.601
},
{
"epoch": 1.0,
"eval_accuracy": 0.5,
"eval_auc_class_0": 0.625,
"eval_auc_class_1": 0.75,
"eval_auc_class_2": 0.75,
"eval_auc_overall": 0.7083333333333334,
"eval_loss": 1.028936505317688,
"eval_runtime": 0.6838,
"eval_samples_per_second": 8.774,
"eval_steps_per_second": 1.462,
"step": 1
},
{
"epoch": 2.0,
"step": 2,
"train_accuracy": 0.8,
"train_auc_class_0": 0.98,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 0.9933333333333333,
"train_loss": 0.6606505513191223,
"train_runtime": 1.7751,
"train_samples_per_second": 8.45,
"train_steps_per_second": 0.563
},
{
"epoch": 2.0,
"eval_accuracy": 0.6666666666666666,
"eval_auc_class_0": 0.625,
"eval_auc_class_1": 0.75,
"eval_auc_class_2": 0.875,
"eval_auc_overall": 0.75,
"eval_loss": 0.9276485443115234,
"eval_runtime": 0.7125,
"eval_samples_per_second": 8.421,
"eval_steps_per_second": 1.404,
"step": 2
},
{
"epoch": 3.0,
"step": 3,
"train_accuracy": 1.0,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.5248541831970215,
"train_runtime": 1.627,
"train_samples_per_second": 9.219,
"train_steps_per_second": 0.615
},
{
"epoch": 3.0,
"eval_accuracy": 0.6666666666666666,
"eval_auc_class_0": 0.625,
"eval_auc_class_1": 1.0,
"eval_auc_class_2": 0.875,
"eval_auc_overall": 0.8333333333333334,
"eval_loss": 0.8520984053611755,
"eval_runtime": 0.7245,
"eval_samples_per_second": 8.281,
"eval_steps_per_second": 1.38,
"step": 3
},
{
"epoch": 4.0,
"step": 4,
"train_accuracy": 1.0,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.36024707555770874,
"train_runtime": 1.7829,
"train_samples_per_second": 8.413,
"train_steps_per_second": 0.561
},
{
"epoch": 4.0,
"eval_accuracy": 0.6666666666666666,
"eval_auc_class_0": 0.875,
"eval_auc_class_1": 1.0,
"eval_auc_class_2": 1.0,
"eval_auc_overall": 0.9583333333333334,
"eval_loss": 0.7887496948242188,
"eval_runtime": 0.8054,
"eval_samples_per_second": 7.45,
"eval_steps_per_second": 1.242,
"step": 4
},
{
"epoch": 5.0,
"step": 5,
"train_accuracy": 1.0,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.31448933482170105,
"train_runtime": 1.9887,
"train_samples_per_second": 7.543,
"train_steps_per_second": 0.503
},
{
"epoch": 5.0,
"eval_accuracy": 0.6666666666666666,
"eval_auc_class_0": 1.0,
"eval_auc_class_1": 1.0,
"eval_auc_class_2": 1.0,
"eval_auc_overall": 1.0,
"eval_loss": 0.7302556037902832,
"eval_runtime": 0.719,
"eval_samples_per_second": 8.345,
"eval_steps_per_second": 1.391,
"step": 5
},
{
"epoch": 6.0,
"step": 6,
"train_accuracy": 0.9333333333333333,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.31753572821617126,
"train_runtime": 1.8048,
"train_samples_per_second": 8.311,
"train_steps_per_second": 0.554
},
{
"epoch": 6.0,
"eval_accuracy": 0.6666666666666666,
"eval_auc_class_0": 1.0,
"eval_auc_class_1": 1.0,
"eval_auc_class_2": 1.0,
"eval_auc_overall": 1.0,
"eval_loss": 0.688157320022583,
"eval_runtime": 0.719,
"eval_samples_per_second": 8.345,
"eval_steps_per_second": 1.391,
"step": 6
},
{
"epoch": 7.0,
"step": 7,
"train_accuracy": 1.0,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.27592089772224426,
"train_runtime": 2.0142,
"train_samples_per_second": 7.447,
"train_steps_per_second": 0.496
},
{
"epoch": 7.0,
"eval_accuracy": 0.6666666666666666,
"eval_auc_class_0": 1.0,
"eval_auc_class_1": 1.0,
"eval_auc_class_2": 1.0,
"eval_auc_overall": 1.0,
"eval_loss": 0.6634145379066467,
"eval_runtime": 0.7768,
"eval_samples_per_second": 7.724,
"eval_steps_per_second": 1.287,
"step": 7
},
{
"epoch": 7.0,
"step": 7,
"total_flos": 8226380544399360.0,
"train_loss": 0.14502547468457902,
"train_runtime": 156.7549,
"train_samples_per_second": 0.67,
"train_steps_per_second": 0.045
}
],
"logging_steps": 10,
"max_steps": 7,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 8226380544399360.0,
"train_batch_size": 128,
"trial_name": null,
"trial_params": null
}