|
{ |
|
"best_metric": 0.9588719153936546, |
|
"best_model_checkpoint": "experiments_results/cometa/outputs/xlm-roberta-large-output/cometa_8_0.01_0.00002_02-26-24_12-34/checkpoint-1452", |
|
"epoch": 3.998624484181568, |
|
"global_step": 1452, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.596774193548387e-05, |
|
"loss": 0.1244, |
|
"step": 363 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.988247268052282, |
|
"eval_f1": 0.6509704104358893, |
|
"eval_loss": 0.03377820923924446, |
|
"eval_precision": 0.7153846153846154, |
|
"eval_recall": 0.5971978984238179, |
|
"eval_runtime": 18.9255, |
|
"eval_samples_per_second": 153.602, |
|
"eval_steps_per_second": 19.233, |
|
"step": 363 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 1.0645161290322582e-05, |
|
"loss": 0.0355, |
|
"step": 726 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9933040497107349, |
|
"eval_f1": 0.7906197654941373, |
|
"eval_loss": 0.018763022497296333, |
|
"eval_precision": 0.9276729559748428, |
|
"eval_recall": 0.688849970811442, |
|
"eval_runtime": 18.9192, |
|
"eval_samples_per_second": 153.653, |
|
"eval_steps_per_second": 19.24, |
|
"step": 726 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 5.322580645161291e-06, |
|
"loss": 0.0196, |
|
"step": 1089 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9973966145275337, |
|
"eval_f1": 0.9279573080343908, |
|
"eval_loss": 0.00810301024466753, |
|
"eval_precision": 0.9427710843373494, |
|
"eval_recall": 0.9136018680677175, |
|
"eval_runtime": 19.0179, |
|
"eval_samples_per_second": 152.856, |
|
"eval_steps_per_second": 19.14, |
|
"step": 1089 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.0111, |
|
"step": 1452 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9985001071352047, |
|
"eval_f1": 0.9588719153936546, |
|
"eval_loss": 0.005104937590658665, |
|
"eval_precision": 0.9651094027202839, |
|
"eval_recall": 0.9527145359019265, |
|
"eval_runtime": 18.9209, |
|
"eval_samples_per_second": 153.64, |
|
"eval_steps_per_second": 19.238, |
|
"step": 1452 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"step": 1452, |
|
"total_flos": 1523924460800142.0, |
|
"train_loss": 0.047672507848293, |
|
"train_runtime": 706.4241, |
|
"train_samples_per_second": 16.46, |
|
"train_steps_per_second": 2.055 |
|
} |
|
], |
|
"max_steps": 1452, |
|
"num_train_epochs": 4, |
|
"total_flos": 1523924460800142.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|