|
{ |
|
"best_metric": 0.9695078031212484, |
|
"best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-111", |
|
"epoch": 9.887640449438202, |
|
"eval_steps": 500, |
|
"global_step": 220, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.449438202247191, |
|
"grad_norm": 6.729045391082764, |
|
"learning_rate": 2.272727272727273e-05, |
|
"loss": 0.6016, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.898876404494382, |
|
"grad_norm": 5.153387546539307, |
|
"learning_rate": 4.545454545454546e-05, |
|
"loss": 0.2262, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.9887640449438202, |
|
"eval_accuracy": 0.9365079365079365, |
|
"eval_f1": 0.9058027582617746, |
|
"eval_loss": 0.20612730085849762, |
|
"eval_precision": 0.8770471151423532, |
|
"eval_recall": 0.9365079365079365, |
|
"eval_runtime": 29.0895, |
|
"eval_samples_per_second": 10.829, |
|
"eval_steps_per_second": 0.344, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 1.348314606741573, |
|
"grad_norm": 2.6891238689422607, |
|
"learning_rate": 4.797979797979798e-05, |
|
"loss": 0.1932, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 1.797752808988764, |
|
"grad_norm": 10.437292098999023, |
|
"learning_rate": 4.545454545454546e-05, |
|
"loss": 0.1666, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 1.9775280898876404, |
|
"eval_accuracy": 0.9333333333333333, |
|
"eval_f1": 0.9042145593869733, |
|
"eval_loss": 0.12735532224178314, |
|
"eval_precision": 0.8768577494692145, |
|
"eval_recall": 0.9333333333333333, |
|
"eval_runtime": 28.9476, |
|
"eval_samples_per_second": 10.882, |
|
"eval_steps_per_second": 0.345, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 2.247191011235955, |
|
"grad_norm": 13.23202896118164, |
|
"learning_rate": 4.292929292929293e-05, |
|
"loss": 0.1408, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 2.696629213483146, |
|
"grad_norm": 13.037389755249023, |
|
"learning_rate": 4.0404040404040405e-05, |
|
"loss": 0.1168, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 2.966292134831461, |
|
"eval_accuracy": 0.9523809523809523, |
|
"eval_f1": 0.9437855353283663, |
|
"eval_loss": 0.10540811717510223, |
|
"eval_precision": 0.9461043676729951, |
|
"eval_recall": 0.9523809523809523, |
|
"eval_runtime": 28.9757, |
|
"eval_samples_per_second": 10.871, |
|
"eval_steps_per_second": 0.345, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 3.146067415730337, |
|
"grad_norm": 13.592888832092285, |
|
"learning_rate": 3.787878787878788e-05, |
|
"loss": 0.132, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 3.595505617977528, |
|
"grad_norm": 4.916988849639893, |
|
"learning_rate": 3.535353535353535e-05, |
|
"loss": 0.0984, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9619047619047619, |
|
"eval_f1": 0.9599166265832932, |
|
"eval_loss": 0.08242347091436386, |
|
"eval_precision": 0.9590699155916548, |
|
"eval_recall": 0.9619047619047619, |
|
"eval_runtime": 29.2105, |
|
"eval_samples_per_second": 10.784, |
|
"eval_steps_per_second": 0.342, |
|
"step": 89 |
|
}, |
|
{ |
|
"epoch": 4.044943820224719, |
|
"grad_norm": 5.384190082550049, |
|
"learning_rate": 3.282828282828283e-05, |
|
"loss": 0.0997, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 4.49438202247191, |
|
"grad_norm": 6.7096028327941895, |
|
"learning_rate": 3.0303030303030306e-05, |
|
"loss": 0.1319, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 4.943820224719101, |
|
"grad_norm": 3.9921090602874756, |
|
"learning_rate": 2.777777777777778e-05, |
|
"loss": 0.1028, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 4.98876404494382, |
|
"eval_accuracy": 0.9714285714285714, |
|
"eval_f1": 0.9695078031212484, |
|
"eval_loss": 0.08143213391304016, |
|
"eval_precision": 0.9696825396825397, |
|
"eval_recall": 0.9714285714285714, |
|
"eval_runtime": 29.3091, |
|
"eval_samples_per_second": 10.748, |
|
"eval_steps_per_second": 0.341, |
|
"step": 111 |
|
}, |
|
{ |
|
"epoch": 5.393258426966292, |
|
"grad_norm": 7.567589282989502, |
|
"learning_rate": 2.5252525252525256e-05, |
|
"loss": 0.0806, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 5.842696629213483, |
|
"grad_norm": 3.001021385192871, |
|
"learning_rate": 2.272727272727273e-05, |
|
"loss": 0.1082, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 5.97752808988764, |
|
"eval_accuracy": 0.9492063492063492, |
|
"eval_f1": 0.9329456755199329, |
|
"eval_loss": 0.08350013196468353, |
|
"eval_precision": 0.9518195273822283, |
|
"eval_recall": 0.9492063492063492, |
|
"eval_runtime": 28.3828, |
|
"eval_samples_per_second": 11.098, |
|
"eval_steps_per_second": 0.352, |
|
"step": 133 |
|
}, |
|
{ |
|
"epoch": 6.292134831460674, |
|
"grad_norm": 3.2272369861602783, |
|
"learning_rate": 2.0202020202020203e-05, |
|
"loss": 0.0914, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 6.741573033707866, |
|
"grad_norm": 11.393094062805176, |
|
"learning_rate": 1.7676767676767676e-05, |
|
"loss": 0.0962, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 6.966292134831461, |
|
"eval_accuracy": 0.9587301587301588, |
|
"eval_f1": 0.9582359734643997, |
|
"eval_loss": 0.08720001578330994, |
|
"eval_precision": 0.9578027275395696, |
|
"eval_recall": 0.9587301587301588, |
|
"eval_runtime": 28.5518, |
|
"eval_samples_per_second": 11.033, |
|
"eval_steps_per_second": 0.35, |
|
"step": 155 |
|
}, |
|
{ |
|
"epoch": 7.191011235955056, |
|
"grad_norm": 3.3998546600341797, |
|
"learning_rate": 1.5151515151515153e-05, |
|
"loss": 0.1013, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 7.640449438202247, |
|
"grad_norm": 2.875291109085083, |
|
"learning_rate": 1.2626262626262628e-05, |
|
"loss": 0.0799, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9587301587301588, |
|
"eval_f1": 0.9545950048462611, |
|
"eval_loss": 0.08030053973197937, |
|
"eval_precision": 0.9543377887748749, |
|
"eval_recall": 0.9587301587301588, |
|
"eval_runtime": 28.171, |
|
"eval_samples_per_second": 11.182, |
|
"eval_steps_per_second": 0.355, |
|
"step": 178 |
|
}, |
|
{ |
|
"epoch": 8.089887640449438, |
|
"grad_norm": 3.642427682876587, |
|
"learning_rate": 1.0101010101010101e-05, |
|
"loss": 0.0703, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 8.539325842696629, |
|
"grad_norm": 11.242568016052246, |
|
"learning_rate": 7.5757575757575764e-06, |
|
"loss": 0.0869, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 8.98876404494382, |
|
"grad_norm": 11.542448997497559, |
|
"learning_rate": 5.050505050505051e-06, |
|
"loss": 0.0954, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 8.98876404494382, |
|
"eval_accuracy": 0.9619047619047619, |
|
"eval_f1": 0.9587351719211175, |
|
"eval_loss": 0.06851905584335327, |
|
"eval_precision": 0.9583926593893372, |
|
"eval_recall": 0.9619047619047619, |
|
"eval_runtime": 28.2782, |
|
"eval_samples_per_second": 11.139, |
|
"eval_steps_per_second": 0.354, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 9.438202247191011, |
|
"grad_norm": 4.964309215545654, |
|
"learning_rate": 2.5252525252525253e-06, |
|
"loss": 0.0806, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 9.887640449438202, |
|
"grad_norm": 3.8892452716827393, |
|
"learning_rate": 0.0, |
|
"loss": 0.0771, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 9.887640449438202, |
|
"eval_accuracy": 0.9619047619047619, |
|
"eval_f1": 0.9587351719211175, |
|
"eval_loss": 0.07111740857362747, |
|
"eval_precision": 0.9583926593893372, |
|
"eval_recall": 0.9619047619047619, |
|
"eval_runtime": 28.6883, |
|
"eval_samples_per_second": 10.98, |
|
"eval_steps_per_second": 0.349, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 9.887640449438202, |
|
"step": 220, |
|
"total_flos": 6.968127952294871e+17, |
|
"train_loss": 0.13535271666266702, |
|
"train_runtime": 2769.4739, |
|
"train_samples_per_second": 10.233, |
|
"train_steps_per_second": 0.079 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 220, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 6.968127952294871e+17, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|