|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 8.0, |
|
"global_step": 5056, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.79, |
|
"learning_rate": 5e-05, |
|
"loss": 0.324, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9792203149081317, |
|
"eval_f1": 0.9060294526257294, |
|
"eval_loss": 0.10194244235754013, |
|
"eval_precision": 0.9077614045506849, |
|
"eval_recall": 0.904304097027067, |
|
"eval_runtime": 12.6479, |
|
"eval_samples_per_second": 217.348, |
|
"step": 632 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"learning_rate": 4.451273046532046e-05, |
|
"loss": 0.0599, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9832931525115832, |
|
"eval_f1": 0.9250188602866763, |
|
"eval_loss": 0.08270899951457977, |
|
"eval_precision": 0.9206314324433212, |
|
"eval_recall": 0.9294483064635409, |
|
"eval_runtime": 12.8104, |
|
"eval_samples_per_second": 214.592, |
|
"step": 1264 |
|
}, |
|
{ |
|
"epoch": 2.37, |
|
"learning_rate": 3.902546093064092e-05, |
|
"loss": 0.0414, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9813122943651833, |
|
"eval_f1": 0.9174662014827737, |
|
"eval_loss": 0.09249694645404816, |
|
"eval_precision": 0.9019937115906818, |
|
"eval_recall": 0.9334787753290933, |
|
"eval_runtime": 12.6986, |
|
"eval_samples_per_second": 216.48, |
|
"step": 1896 |
|
}, |
|
{ |
|
"epoch": 3.16, |
|
"learning_rate": 3.353819139596137e-05, |
|
"loss": 0.03, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 3.96, |
|
"learning_rate": 2.8050921861281827e-05, |
|
"loss": 0.0203, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9827810282103189, |
|
"eval_f1": 0.9226777565140586, |
|
"eval_loss": 0.09510081261396408, |
|
"eval_precision": 0.9183516483516484, |
|
"eval_recall": 0.9270448158556427, |
|
"eval_runtime": 12.7912, |
|
"eval_samples_per_second": 214.913, |
|
"step": 2528 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"learning_rate": 2.256365232660228e-05, |
|
"loss": 0.0139, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9840951584928085, |
|
"eval_f1": 0.9295437821927889, |
|
"eval_loss": 0.09760858118534088, |
|
"eval_precision": 0.9249158002635818, |
|
"eval_recall": 0.9342183109007544, |
|
"eval_runtime": 12.7478, |
|
"eval_samples_per_second": 215.645, |
|
"step": 3160 |
|
}, |
|
{ |
|
"epoch": 5.54, |
|
"learning_rate": 1.707638279192274e-05, |
|
"loss": 0.01, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9842159425261255, |
|
"eval_f1": 0.9298436262501611, |
|
"eval_loss": 0.10052050650119781, |
|
"eval_precision": 0.9263459209512276, |
|
"eval_recall": 0.9333678449933441, |
|
"eval_runtime": 12.7445, |
|
"eval_samples_per_second": 215.702, |
|
"step": 3792 |
|
}, |
|
{ |
|
"epoch": 6.33, |
|
"learning_rate": 1.1589113257243196e-05, |
|
"loss": 0.0067, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.984558969180746, |
|
"eval_f1": 0.9318746892093487, |
|
"eval_loss": 0.11000438034534454, |
|
"eval_precision": 0.9283014713976443, |
|
"eval_recall": 0.9354755213725781, |
|
"eval_runtime": 12.8711, |
|
"eval_samples_per_second": 213.579, |
|
"step": 4424 |
|
}, |
|
{ |
|
"epoch": 7.12, |
|
"learning_rate": 6.101843722563653e-06, |
|
"loss": 0.0049, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 7.91, |
|
"learning_rate": 6.145741878841089e-07, |
|
"loss": 0.0033, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9842642561394525, |
|
"eval_f1": 0.9308433246772383, |
|
"eval_loss": 0.11643598228693008, |
|
"eval_precision": 0.9272740615712032, |
|
"eval_recall": 0.9344401715722527, |
|
"eval_runtime": 12.7915, |
|
"eval_samples_per_second": 214.908, |
|
"step": 5056 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"step": 5056, |
|
"total_flos": 1.2033636864613164e+16, |
|
"train_runtime": 1294.9862, |
|
"train_samples_per_second": 3.904 |
|
} |
|
], |
|
"max_steps": 5056, |
|
"num_train_epochs": 8, |
|
"total_flos": 1.2033636864613164e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|