|
{ |
|
"best_metric": 0.14741940796375275, |
|
"best_model_checkpoint": "./trained_models/twitter-emotion-deberta-v3-base/checkpoint-500", |
|
"epoch": 6.0, |
|
"global_step": 1200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.5, |
|
"eval_accuracy": 0.8405, |
|
"eval_loss": 0.5359936952590942, |
|
"eval_runtime": 4.1757, |
|
"eval_samples_per_second": 478.965, |
|
"eval_steps_per_second": 5.987, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.915, |
|
"eval_loss": 0.28240880370140076, |
|
"eval_runtime": 4.2049, |
|
"eval_samples_per_second": 475.638, |
|
"eval_steps_per_second": 5.945, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_accuracy": 0.93, |
|
"eval_loss": 0.19999809563159943, |
|
"eval_runtime": 4.2283, |
|
"eval_samples_per_second": 473.002, |
|
"eval_steps_per_second": 5.913, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.936, |
|
"eval_loss": 0.13397051393985748, |
|
"eval_runtime": 4.2488, |
|
"eval_samples_per_second": 470.716, |
|
"eval_steps_per_second": 5.884, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"learning_rate": 2.916666666666667e-05, |
|
"loss": 0.4142, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"eval_accuracy": 0.937, |
|
"eval_loss": 0.14741940796375275, |
|
"eval_runtime": 4.2278, |
|
"eval_samples_per_second": 473.054, |
|
"eval_steps_per_second": 5.913, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.936, |
|
"eval_loss": 0.15366272628307343, |
|
"eval_runtime": 4.2318, |
|
"eval_samples_per_second": 472.612, |
|
"eval_steps_per_second": 5.908, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 3.5, |
|
"eval_accuracy": 0.939, |
|
"eval_loss": 0.13712549209594727, |
|
"eval_runtime": 4.2434, |
|
"eval_samples_per_second": 471.315, |
|
"eval_steps_per_second": 5.891, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.941, |
|
"eval_loss": 0.13440823554992676, |
|
"eval_runtime": 4.2389, |
|
"eval_samples_per_second": 471.816, |
|
"eval_steps_per_second": 5.898, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 4.5, |
|
"eval_accuracy": 0.939, |
|
"eval_loss": 0.13154806196689606, |
|
"eval_runtime": 4.244, |
|
"eval_samples_per_second": 471.257, |
|
"eval_steps_per_second": 5.891, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 8.333333333333334e-06, |
|
"loss": 0.1013, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.936, |
|
"eval_loss": 0.15716207027435303, |
|
"eval_runtime": 4.2453, |
|
"eval_samples_per_second": 471.109, |
|
"eval_steps_per_second": 5.889, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 5.5, |
|
"eval_accuracy": 0.938, |
|
"eval_loss": 0.15671509504318237, |
|
"eval_runtime": 4.2362, |
|
"eval_samples_per_second": 472.124, |
|
"eval_steps_per_second": 5.902, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.939, |
|
"eval_loss": 0.15347838401794434, |
|
"eval_runtime": 4.2428, |
|
"eval_samples_per_second": 471.385, |
|
"eval_steps_per_second": 5.892, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"step": 1200, |
|
"total_flos": 6907037114880000.0, |
|
"train_loss": 0.2273927664756775, |
|
"train_runtime": 627.7316, |
|
"train_samples_per_second": 152.932, |
|
"train_steps_per_second": 1.912 |
|
} |
|
], |
|
"max_steps": 1200, |
|
"num_train_epochs": 6, |
|
"total_flos": 6907037114880000.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|