|
{ |
|
"best_metric": 0.7862407862407862, |
|
"best_model_checkpoint": "finetune_results/omarmomen/structformer_s1_final_with_pos/qnli/checkpoint-2000", |
|
"epoch": 5.46448087431694, |
|
"global_step": 2000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.09, |
|
"eval_accuracy": 0.6736658215522766, |
|
"eval_f1": 0.7146136189747514, |
|
"eval_loss": 0.5989475250244141, |
|
"eval_mcc": 0.3425894886466018, |
|
"eval_runtime": 4.4241, |
|
"eval_samples_per_second": 516.72, |
|
"eval_steps_per_second": 64.646, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"learning_rate": 4.316939890710383e-05, |
|
"loss": 0.6481, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.19, |
|
"eval_accuracy": 0.7349081635475159, |
|
"eval_f1": 0.72579185520362, |
|
"eval_loss": 0.5559495091438293, |
|
"eval_mcc": 0.4829898982899456, |
|
"eval_runtime": 4.4215, |
|
"eval_samples_per_second": 517.013, |
|
"eval_steps_per_second": 64.683, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.73, |
|
"learning_rate": 3.633879781420765e-05, |
|
"loss": 0.5099, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"eval_accuracy": 0.751968502998352, |
|
"eval_f1": 0.7618647627047459, |
|
"eval_loss": 0.555103063583374, |
|
"eval_mcc": 0.5037717283176012, |
|
"eval_runtime": 4.4181, |
|
"eval_samples_per_second": 517.421, |
|
"eval_steps_per_second": 64.734, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 4.1, |
|
"learning_rate": 2.9508196721311478e-05, |
|
"loss": 0.3245, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.37, |
|
"eval_accuracy": 0.7755905389785767, |
|
"eval_f1": 0.7782101167315174, |
|
"eval_loss": 0.6722451448440552, |
|
"eval_mcc": 0.5551932955703639, |
|
"eval_runtime": 4.4196, |
|
"eval_samples_per_second": 517.245, |
|
"eval_steps_per_second": 64.712, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 5.46, |
|
"learning_rate": 2.2677595628415303e-05, |
|
"loss": 0.1577, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.46, |
|
"eval_accuracy": 0.7716535329818726, |
|
"eval_f1": 0.7862407862407862, |
|
"eval_loss": 0.8745389580726624, |
|
"eval_mcc": 0.5412131716827608, |
|
"eval_runtime": 4.4197, |
|
"eval_samples_per_second": 517.228, |
|
"eval_steps_per_second": 64.71, |
|
"step": 2000 |
|
} |
|
], |
|
"max_steps": 3660, |
|
"num_train_epochs": 10, |
|
"total_flos": 2.003243376727296e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|