Omar
update
abe8798
{
"best_metric": 0.7862407862407862,
"best_model_checkpoint": "finetune_results/omarmomen/structformer_s1_final_with_pos/qnli/checkpoint-2000",
"epoch": 5.46448087431694,
"global_step": 2000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.09,
"eval_accuracy": 0.6736658215522766,
"eval_f1": 0.7146136189747514,
"eval_loss": 0.5989475250244141,
"eval_mcc": 0.3425894886466018,
"eval_runtime": 4.4241,
"eval_samples_per_second": 516.72,
"eval_steps_per_second": 64.646,
"step": 400
},
{
"epoch": 1.37,
"learning_rate": 4.316939890710383e-05,
"loss": 0.6481,
"step": 500
},
{
"epoch": 2.19,
"eval_accuracy": 0.7349081635475159,
"eval_f1": 0.72579185520362,
"eval_loss": 0.5559495091438293,
"eval_mcc": 0.4829898982899456,
"eval_runtime": 4.4215,
"eval_samples_per_second": 517.013,
"eval_steps_per_second": 64.683,
"step": 800
},
{
"epoch": 2.73,
"learning_rate": 3.633879781420765e-05,
"loss": 0.5099,
"step": 1000
},
{
"epoch": 3.28,
"eval_accuracy": 0.751968502998352,
"eval_f1": 0.7618647627047459,
"eval_loss": 0.555103063583374,
"eval_mcc": 0.5037717283176012,
"eval_runtime": 4.4181,
"eval_samples_per_second": 517.421,
"eval_steps_per_second": 64.734,
"step": 1200
},
{
"epoch": 4.1,
"learning_rate": 2.9508196721311478e-05,
"loss": 0.3245,
"step": 1500
},
{
"epoch": 4.37,
"eval_accuracy": 0.7755905389785767,
"eval_f1": 0.7782101167315174,
"eval_loss": 0.6722451448440552,
"eval_mcc": 0.5551932955703639,
"eval_runtime": 4.4196,
"eval_samples_per_second": 517.245,
"eval_steps_per_second": 64.712,
"step": 1600
},
{
"epoch": 5.46,
"learning_rate": 2.2677595628415303e-05,
"loss": 0.1577,
"step": 2000
},
{
"epoch": 5.46,
"eval_accuracy": 0.7716535329818726,
"eval_f1": 0.7862407862407862,
"eval_loss": 0.8745389580726624,
"eval_mcc": 0.5412131716827608,
"eval_runtime": 4.4197,
"eval_samples_per_second": 517.228,
"eval_steps_per_second": 64.71,
"step": 2000
}
],
"max_steps": 3660,
"num_train_epochs": 10,
"total_flos": 2.003243376727296e+16,
"trial_name": null,
"trial_params": null
}