|
{ |
|
"best_metric": 0.9776214833759592, |
|
"best_model_checkpoint": "test/model\\checkpoint-1500", |
|
"epoch": 9.146341463414634, |
|
"global_step": 1500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.61, |
|
"eval_accuracy": 0.9168925867065533, |
|
"eval_f1": 0.531752104055088, |
|
"eval_loss": 0.2909819185733795, |
|
"eval_precision": 0.6453110492107706, |
|
"eval_recall": 0.4521795705920625, |
|
"eval_runtime": 7.6557, |
|
"eval_samples_per_second": 19.332, |
|
"eval_steps_per_second": 9.666, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"eval_accuracy": 0.9672805459474619, |
|
"eval_f1": 0.8156667702828723, |
|
"eval_loss": 0.1369905024766922, |
|
"eval_precision": 0.780952380952381, |
|
"eval_recall": 0.8536109303838647, |
|
"eval_runtime": 7.6461, |
|
"eval_samples_per_second": 19.356, |
|
"eval_steps_per_second": 9.678, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"eval_accuracy": 0.9770028980087875, |
|
"eval_f1": 0.87900466562986, |
|
"eval_loss": 0.0756949633359909, |
|
"eval_precision": 0.8420738974970202, |
|
"eval_recall": 0.9193233571893299, |
|
"eval_runtime": 7.6257, |
|
"eval_samples_per_second": 19.408, |
|
"eval_steps_per_second": 9.704, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.44, |
|
"eval_accuracy": 0.9902776479386743, |
|
"eval_f1": 0.9516539440203563, |
|
"eval_loss": 0.04403918609023094, |
|
"eval_precision": 0.9309271935283137, |
|
"eval_recall": 0.9733246584255042, |
|
"eval_runtime": 7.6305, |
|
"eval_samples_per_second": 19.396, |
|
"eval_steps_per_second": 9.698, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.05, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.2309, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.05, |
|
"eval_accuracy": 0.9855099560624474, |
|
"eval_f1": 0.9462231893068076, |
|
"eval_loss": 0.047688089311122894, |
|
"eval_precision": 0.905952380952381, |
|
"eval_recall": 0.9902407286922577, |
|
"eval_runtime": 7.6227, |
|
"eval_samples_per_second": 19.416, |
|
"eval_steps_per_second": 9.708, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.66, |
|
"eval_accuracy": 0.9955127605870805, |
|
"eval_f1": 0.982028241335045, |
|
"eval_loss": 0.022968417033553123, |
|
"eval_precision": 0.9689677010766308, |
|
"eval_recall": 0.9954456733897202, |
|
"eval_runtime": 7.6581, |
|
"eval_samples_per_second": 19.326, |
|
"eval_steps_per_second": 9.663, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.27, |
|
"eval_accuracy": 0.9834533046648593, |
|
"eval_f1": 0.9442905509387505, |
|
"eval_loss": 0.04970035329461098, |
|
"eval_precision": 0.8960280373831776, |
|
"eval_recall": 0.9980481457384516, |
|
"eval_runtime": 7.634, |
|
"eval_samples_per_second": 19.387, |
|
"eval_steps_per_second": 9.693, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 4.88, |
|
"eval_accuracy": 0.9912124894830326, |
|
"eval_f1": 0.969046114971573, |
|
"eval_loss": 0.03323974087834358, |
|
"eval_precision": 0.941682013505218, |
|
"eval_recall": 0.9980481457384516, |
|
"eval_runtime": 7.674, |
|
"eval_samples_per_second": 19.286, |
|
"eval_steps_per_second": 9.643, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 5.49, |
|
"eval_accuracy": 0.9900906796298028, |
|
"eval_f1": 0.9653870358716173, |
|
"eval_loss": 0.031032076105475426, |
|
"eval_precision": 0.9347958561852528, |
|
"eval_recall": 0.9980481457384516, |
|
"eval_runtime": 7.6489, |
|
"eval_samples_per_second": 19.349, |
|
"eval_steps_per_second": 9.675, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 6.1, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0211, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 6.1, |
|
"eval_accuracy": 0.9921473310273908, |
|
"eval_f1": 0.9724072312083729, |
|
"eval_loss": 0.02703050896525383, |
|
"eval_precision": 0.9486386138613861, |
|
"eval_recall": 0.9973975276512687, |
|
"eval_runtime": 7.623, |
|
"eval_samples_per_second": 19.415, |
|
"eval_steps_per_second": 9.707, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 6.71, |
|
"eval_accuracy": 0.9914929419463401, |
|
"eval_f1": 0.9699652228896617, |
|
"eval_loss": 0.03206472471356392, |
|
"eval_precision": 0.9434194341943419, |
|
"eval_recall": 0.9980481457384516, |
|
"eval_runtime": 7.6405, |
|
"eval_samples_per_second": 19.37, |
|
"eval_steps_per_second": 9.685, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 7.32, |
|
"eval_accuracy": 0.9970085070580537, |
|
"eval_f1": 0.9877181641887525, |
|
"eval_loss": 0.016345446929335594, |
|
"eval_precision": 0.9813744380218369, |
|
"eval_recall": 0.9941444372153546, |
|
"eval_runtime": 7.742, |
|
"eval_samples_per_second": 19.117, |
|
"eval_steps_per_second": 9.558, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 7.93, |
|
"eval_accuracy": 0.9908385528652893, |
|
"eval_f1": 0.9684542586750788, |
|
"eval_loss": 0.031482577323913574, |
|
"eval_precision": 0.939987752602572, |
|
"eval_recall": 0.9986987638256344, |
|
"eval_runtime": 7.6808, |
|
"eval_samples_per_second": 19.269, |
|
"eval_steps_per_second": 9.634, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 8.54, |
|
"eval_accuracy": 0.9920538468729551, |
|
"eval_f1": 0.9720989220038045, |
|
"eval_loss": 0.029911138117313385, |
|
"eval_precision": 0.948051948051948, |
|
"eval_recall": 0.9973975276512687, |
|
"eval_runtime": 7.6156, |
|
"eval_samples_per_second": 19.434, |
|
"eval_steps_per_second": 9.717, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 9.15, |
|
"learning_rate": 8.5e-06, |
|
"loss": 0.0158, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 9.15, |
|
"eval_accuracy": 0.993643077498364, |
|
"eval_f1": 0.9776214833759592, |
|
"eval_loss": 0.025822490453720093, |
|
"eval_precision": 0.9610307982401005, |
|
"eval_recall": 0.9947950553025374, |
|
"eval_runtime": 7.6981, |
|
"eval_samples_per_second": 19.226, |
|
"eval_steps_per_second": 9.613, |
|
"step": 1500 |
|
} |
|
], |
|
"max_steps": 10000, |
|
"num_train_epochs": 61, |
|
"total_flos": 793919609690112.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|