|
{ |
|
"best_metric": 0.8974358974358975, |
|
"best_model_checkpoint": "swin-large-patch4-window7-224-in22k-finetuned-lora-medmnistv2/checkpoint-35", |
|
"epoch": 9.142857142857142, |
|
"eval_steps": 500, |
|
"global_step": 80, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.9142857142857143, |
|
"eval_accuracy": 0.7435897435897436, |
|
"eval_f1": 0.47082767978290374, |
|
"eval_loss": 0.506903886795044, |
|
"eval_precision": 0.8701298701298701, |
|
"eval_recall": 0.5238095238095238, |
|
"eval_runtime": 1.0819, |
|
"eval_samples_per_second": 72.096, |
|
"eval_steps_per_second": 4.622, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 1.1428571428571428, |
|
"grad_norm": 1.5360957384109497, |
|
"learning_rate": 0.004375, |
|
"loss": 0.6976, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 1.9428571428571428, |
|
"eval_accuracy": 0.8589743589743589, |
|
"eval_f1": 0.8234204568841326, |
|
"eval_loss": 0.4591017961502075, |
|
"eval_precision": 0.8189935064935066, |
|
"eval_recall": 0.8283208020050126, |
|
"eval_runtime": 0.8911, |
|
"eval_samples_per_second": 87.528, |
|
"eval_steps_per_second": 5.611, |
|
"step": 17 |
|
}, |
|
{ |
|
"epoch": 2.2857142857142856, |
|
"grad_norm": 0.8164573311805725, |
|
"learning_rate": 0.00375, |
|
"loss": 0.5351, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 2.9714285714285715, |
|
"eval_accuracy": 0.8846153846153846, |
|
"eval_f1": 0.8461538461538461, |
|
"eval_loss": 0.37451839447021484, |
|
"eval_precision": 0.8666666666666667, |
|
"eval_recall": 0.8308270676691729, |
|
"eval_runtime": 0.9058, |
|
"eval_samples_per_second": 86.111, |
|
"eval_steps_per_second": 5.52, |
|
"step": 26 |
|
}, |
|
{ |
|
"epoch": 3.4285714285714284, |
|
"grad_norm": 0.974304735660553, |
|
"learning_rate": 0.003125, |
|
"loss": 0.4998, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8974358974358975, |
|
"eval_f1": 0.8696741854636592, |
|
"eval_loss": 0.32434844970703125, |
|
"eval_precision": 0.8696741854636592, |
|
"eval_recall": 0.8696741854636592, |
|
"eval_runtime": 0.9239, |
|
"eval_samples_per_second": 84.422, |
|
"eval_steps_per_second": 5.412, |
|
"step": 35 |
|
}, |
|
{ |
|
"epoch": 4.571428571428571, |
|
"grad_norm": 0.9340265989303589, |
|
"learning_rate": 0.0025, |
|
"loss": 0.4569, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 4.914285714285715, |
|
"eval_accuracy": 0.8589743589743589, |
|
"eval_f1": 0.811965811965812, |
|
"eval_loss": 0.40701231360435486, |
|
"eval_precision": 0.8305555555555555, |
|
"eval_recall": 0.7982456140350878, |
|
"eval_runtime": 0.8814, |
|
"eval_samples_per_second": 88.5, |
|
"eval_steps_per_second": 5.673, |
|
"step": 43 |
|
}, |
|
{ |
|
"epoch": 5.714285714285714, |
|
"grad_norm": 1.012099266052246, |
|
"learning_rate": 0.001875, |
|
"loss": 0.4182, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 5.942857142857143, |
|
"eval_accuracy": 0.8717948717948718, |
|
"eval_f1": 0.831896551724138, |
|
"eval_loss": 0.3801339566707611, |
|
"eval_precision": 0.8438893844781445, |
|
"eval_recall": 0.8220551378446115, |
|
"eval_runtime": 0.8409, |
|
"eval_samples_per_second": 92.758, |
|
"eval_steps_per_second": 5.946, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 6.857142857142857, |
|
"grad_norm": 0.7531532645225525, |
|
"learning_rate": 0.00125, |
|
"loss": 0.4432, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 6.9714285714285715, |
|
"eval_accuracy": 0.8717948717948718, |
|
"eval_f1": 0.8370927318295739, |
|
"eval_loss": 0.3070574402809143, |
|
"eval_precision": 0.8370927318295739, |
|
"eval_recall": 0.8370927318295739, |
|
"eval_runtime": 0.856, |
|
"eval_samples_per_second": 91.124, |
|
"eval_steps_per_second": 5.841, |
|
"step": 61 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 1.1633806228637695, |
|
"learning_rate": 0.000625, |
|
"loss": 0.3988, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8717948717948718, |
|
"eval_f1": 0.8417207792207791, |
|
"eval_loss": 0.320502907037735, |
|
"eval_precision": 0.833201581027668, |
|
"eval_recall": 0.8521303258145363, |
|
"eval_runtime": 0.8567, |
|
"eval_samples_per_second": 91.048, |
|
"eval_steps_per_second": 5.836, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 8.914285714285715, |
|
"eval_accuracy": 0.8846153846153846, |
|
"eval_f1": 0.8555258283597448, |
|
"eval_loss": 0.3238745331764221, |
|
"eval_precision": 0.8506493506493507, |
|
"eval_recall": 0.8609022556390977, |
|
"eval_runtime": 0.8616, |
|
"eval_samples_per_second": 90.526, |
|
"eval_steps_per_second": 5.803, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 9.142857142857142, |
|
"grad_norm": 0.8995063900947571, |
|
"learning_rate": 0.0, |
|
"loss": 0.3993, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 9.142857142857142, |
|
"eval_accuracy": 0.8846153846153846, |
|
"eval_f1": 0.8555258283597448, |
|
"eval_loss": 0.32138964533805847, |
|
"eval_precision": 0.8506493506493507, |
|
"eval_recall": 0.8609022556390977, |
|
"eval_runtime": 0.8772, |
|
"eval_samples_per_second": 88.917, |
|
"eval_steps_per_second": 5.7, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 9.142857142857142, |
|
"step": 80, |
|
"total_flos": 8.847492793597624e+17, |
|
"train_loss": 0.48110649585723875, |
|
"train_runtime": 140.8237, |
|
"train_samples_per_second": 38.772, |
|
"train_steps_per_second": 0.568 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 80, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 8.847492793597624e+17, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|