{ "best_metric": 0.9982142857142857, "best_model_checkpoint": "vit-large-patch16-224-dungeon-geo-morphs-0-4-30Nov24-006/checkpoint-60", "epoch": 35.45454545454545, "eval_steps": 10, "global_step": 80, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 4.363636363636363, "grad_norm": 24.64277458190918, "learning_rate": 9.861111111111112e-06, "loss": 1.5574, "step": 10 }, { "epoch": 4.363636363636363, "eval_accuracy": 0.6017857142857143, "eval_loss": 1.2378439903259277, "eval_runtime": 7.5027, "eval_samples_per_second": 74.64, "eval_steps_per_second": 9.33, "step": 10 }, { "epoch": 8.727272727272727, "grad_norm": 23.63115119934082, "learning_rate": 8.472222222222223e-06, "loss": 0.9431, "step": 20 }, { "epoch": 8.727272727272727, "eval_accuracy": 0.8892857142857142, "eval_loss": 0.6701930165290833, "eval_runtime": 7.7778, "eval_samples_per_second": 72.0, "eval_steps_per_second": 9.0, "step": 20 }, { "epoch": 13.272727272727273, "grad_norm": 14.12543773651123, "learning_rate": 7.083333333333335e-06, "loss": 0.4807, "step": 30 }, { "epoch": 13.272727272727273, "eval_accuracy": 0.95, "eval_loss": 0.38032934069633484, "eval_runtime": 7.2067, "eval_samples_per_second": 77.706, "eval_steps_per_second": 9.713, "step": 30 }, { "epoch": 17.636363636363637, "grad_norm": 13.682252883911133, "learning_rate": 5.694444444444445e-06, "loss": 0.2673, "step": 40 }, { "epoch": 17.636363636363637, "eval_accuracy": 0.9732142857142857, "eval_loss": 0.22460468113422394, "eval_runtime": 8.2781, "eval_samples_per_second": 67.648, "eval_steps_per_second": 8.456, "step": 40 }, { "epoch": 22.181818181818183, "grad_norm": 21.752925872802734, "learning_rate": 4.305555555555556e-06, "loss": 0.1501, "step": 50 }, { "epoch": 22.181818181818183, "eval_accuracy": 0.975, "eval_loss": 0.15731294453144073, "eval_runtime": 7.5746, "eval_samples_per_second": 73.931, "eval_steps_per_second": 9.241, "step": 50 }, { "epoch": 26.545454545454547, "grad_norm": 8.0554838180542, "learning_rate": 2.916666666666667e-06, "loss": 0.0962, "step": 60 }, { "epoch": 26.545454545454547, "eval_accuracy": 0.9982142857142857, "eval_loss": 0.10373682528734207, "eval_runtime": 8.3878, "eval_samples_per_second": 66.764, "eval_steps_per_second": 8.346, "step": 60 }, { "epoch": 31.09090909090909, "grad_norm": 6.769862651824951, "learning_rate": 1.527777777777778e-06, "loss": 0.0629, "step": 70 }, { "epoch": 31.09090909090909, "eval_accuracy": 0.9964285714285714, "eval_loss": 0.08421190828084946, "eval_runtime": 8.3691, "eval_samples_per_second": 66.913, "eval_steps_per_second": 8.364, "step": 70 }, { "epoch": 35.45454545454545, "grad_norm": 5.019294738769531, "learning_rate": 1.3888888888888888e-07, "loss": 0.049, "step": 80 }, { "epoch": 35.45454545454545, "eval_accuracy": 0.9964285714285714, "eval_loss": 0.07256519049406052, "eval_runtime": 8.7265, "eval_samples_per_second": 64.172, "eval_steps_per_second": 8.022, "step": 80 }, { "epoch": 35.45454545454545, "step": 80, "total_flos": 7.012786101918106e+17, "train_loss": 0.4508287474513054, "train_runtime": 460.7942, "train_samples_per_second": 7.031, "train_steps_per_second": 0.174 } ], "logging_steps": 10, "max_steps": 80, "num_input_tokens_seen": 0, "num_train_epochs": 40, "save_steps": 10, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 7.012786101918106e+17, "train_batch_size": 8, "trial_name": null, "trial_params": null }