roberta-base-ca-cased-pos / trainer_state.json
ccasimiro's picture
upload model
bbde5db
{
"best_metric": 0.9909600298841987,
"best_model_checkpoint": "/home/shared/dt01/temutauro/ccasimiro/berta/src/finetuning/pos/roberta-base-ca-cased-pos/checkpoint-1230",
"epoch": 9.99878197320341,
"global_step": 4100,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.9902717208990272,
"eval_f1": 0.9884402778815269,
"eval_loss": 0.04564520716667175,
"eval_precision": 0.9881081282903335,
"eval_recall": 0.9887726508499907,
"eval_runtime": 13.2852,
"eval_samples_per_second": 128.639,
"step": 410
},
{
"epoch": 1.22,
"learning_rate": 4.390243902439025e-05,
"loss": 0.1804,
"step": 500
},
{
"epoch": 2.0,
"eval_accuracy": 0.9918077649676018,
"eval_f1": 0.9899899152130878,
"eval_loss": 0.036869727075099945,
"eval_precision": 0.9896941861767671,
"eval_recall": 0.9902858210349337,
"eval_runtime": 13.3317,
"eval_samples_per_second": 128.191,
"step": 820
},
{
"epoch": 2.44,
"learning_rate": 3.780487804878049e-05,
"loss": 0.0303,
"step": 1000
},
{
"epoch": 3.0,
"eval_accuracy": 0.992355091015025,
"eval_f1": 0.9909600298841987,
"eval_loss": 0.03579937666654587,
"eval_precision": 0.9907749766573296,
"eval_recall": 0.9911451522510741,
"eval_runtime": 13.2482,
"eval_samples_per_second": 128.999,
"step": 1230
},
{
"epoch": 3.66,
"learning_rate": 3.170731707317073e-05,
"loss": 0.0194,
"step": 1500
},
{
"epoch": 4.0,
"eval_accuracy": 0.9921079115097371,
"eval_f1": 0.9907175675170894,
"eval_loss": 0.037922825664281845,
"eval_precision": 0.9904955745602569,
"eval_recall": 0.9909396600037362,
"eval_runtime": 13.1871,
"eval_samples_per_second": 129.596,
"step": 1640
},
{
"epoch": 4.88,
"learning_rate": 2.5609756097560977e-05,
"loss": 0.0133,
"step": 2000
},
{
"epoch": 5.0,
"eval_accuracy": 0.992231501262381,
"eval_f1": 0.9908294577986965,
"eval_loss": 0.03801530599594116,
"eval_precision": 0.9906259336719451,
"eval_recall": 0.991033065570708,
"eval_runtime": 13.3822,
"eval_samples_per_second": 127.707,
"step": 2050
},
{
"epoch": 6.0,
"eval_accuracy": 0.9916841752149579,
"eval_f1": 0.9903335170120761,
"eval_loss": 0.04094540327787399,
"eval_precision": 0.9902317849872061,
"eval_recall": 0.9904352699420885,
"eval_runtime": 13.2046,
"eval_samples_per_second": 129.424,
"step": 2460
},
{
"epoch": 6.1,
"learning_rate": 1.9512195121951222e-05,
"loss": 0.0085,
"step": 2500
},
{
"epoch": 7.0,
"eval_accuracy": 0.9918430763255001,
"eval_f1": 0.9904548426263192,
"eval_loss": 0.04267619550228119,
"eval_precision": 0.9903623459096003,
"eval_recall": 0.9905473566224547,
"eval_runtime": 13.3294,
"eval_samples_per_second": 128.212,
"step": 2870
},
{
"epoch": 7.32,
"learning_rate": 1.3414634146341466e-05,
"loss": 0.0059,
"step": 3000
},
{
"epoch": 8.0,
"eval_accuracy": 0.9922668126202793,
"eval_f1": 0.9909512826019965,
"eval_loss": 0.04542930796742439,
"eval_precision": 0.9907014956028157,
"eval_recall": 0.9912011955912572,
"eval_runtime": 13.2987,
"eval_samples_per_second": 128.508,
"step": 3280
},
{
"epoch": 8.54,
"learning_rate": 7.317073170731707e-06,
"loss": 0.0037,
"step": 3500
},
{
"epoch": 9.0,
"eval_accuracy": 0.991966666078144,
"eval_f1": 0.9906329090280827,
"eval_loss": 0.04698851332068443,
"eval_precision": 0.9904756568995462,
"eval_recall": 0.9907902110965814,
"eval_runtime": 13.2254,
"eval_samples_per_second": 129.221,
"step": 3690
},
{
"epoch": 9.76,
"learning_rate": 1.2195121951219514e-06,
"loss": 0.0028,
"step": 4000
},
{
"epoch": 10.0,
"eval_accuracy": 0.9919843217570932,
"eval_f1": 0.9906423354937522,
"eval_loss": 0.04776829481124878,
"eval_precision": 0.9904758347650706,
"eval_recall": 0.9908088922099757,
"eval_runtime": 13.2102,
"eval_samples_per_second": 129.37,
"step": 4100
},
{
"epoch": 10.0,
"step": 4100,
"total_flos": 0,
"train_runtime": 3867.6486,
"train_samples_per_second": 1.06
}
],
"max_steps": 4100,
"num_train_epochs": 10,
"total_flos": 0,
"trial_name": null,
"trial_params": null
}