nguyen1207's picture
add model adapter
fe20bea verified
{
"best_metric": 0.3467291593551636,
"best_model_checkpoint": "./models/e5_weighted_3\\checkpoint-21170",
"epoch": 10.0,
"eval_steps": 4234,
"global_step": 21170,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 2.0,
"grad_norm": 0.6739985346794128,
"learning_rate": 1.8e-05,
"loss": 0.4895,
"step": 4234
},
{
"epoch": 2.0,
"eval_accuracy": 0.6055607917059378,
"eval_f1_0: ": 0.0,
"eval_f1_1: ": 0.7543293219841503,
"eval_loss": 0.4801671504974365,
"eval_precision_0: ": 0.0,
"eval_precision_1: ": 0.6055607917059378,
"eval_recall_0: ": 0.0,
"eval_recall_1: ": 1.0,
"eval_runtime": 695.7116,
"eval_samples_per_second": 3.05,
"eval_steps_per_second": 3.05,
"step": 4234
},
{
"epoch": 4.0,
"grad_norm": 1.520650863647461,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.474,
"step": 8468
},
{
"epoch": 4.0,
"eval_accuracy": 0.6710650329877474,
"eval_f1_0: ": 0.3102766798418972,
"eval_f1_1: ": 0.7840346534653465,
"eval_loss": 0.4519682228565216,
"eval_precision_0: ": 0.8971428571428571,
"eval_precision_1: ": 0.6507447354904982,
"eval_recall_0: ": 0.1875746714456392,
"eval_recall_1: ": 0.9859922178988327,
"eval_runtime": 685.0371,
"eval_samples_per_second": 3.098,
"eval_steps_per_second": 3.098,
"step": 8468
},
{
"epoch": 6.0,
"grad_norm": 0.5096299648284912,
"learning_rate": 1.4e-05,
"loss": 0.4505,
"step": 12702
},
{
"epoch": 6.0,
"eval_accuracy": 0.7445805843543827,
"eval_f1_0: ": 0.5505804311774462,
"eval_f1_1: ": 0.8215931533903884,
"eval_loss": 0.42401960492134094,
"eval_precision_0: ": 0.8997289972899729,
"eval_precision_1: ": 0.7119224187107815,
"eval_recall_0: ": 0.3966547192353644,
"eval_recall_1: ": 0.9712062256809338,
"eval_runtime": 684.6385,
"eval_samples_per_second": 3.099,
"eval_steps_per_second": 3.099,
"step": 12702
},
{
"epoch": 8.0,
"grad_norm": 0.8480051755905151,
"learning_rate": 1.2e-05,
"loss": 0.418,
"step": 16936
},
{
"epoch": 8.0,
"eval_accuracy": 0.8044297832233742,
"eval_f1_0: ": 0.7182620502376104,
"eval_f1_1: ": 0.85023457235655,
"eval_loss": 0.37760457396507263,
"eval_precision_0: ": 0.8317610062893082,
"eval_precision_1: ": 0.7927321668909825,
"eval_recall_0: ": 0.6320191158900836,
"eval_recall_1: ": 0.9167315175097276,
"eval_runtime": 680.6302,
"eval_samples_per_second": 3.118,
"eval_steps_per_second": 3.118,
"step": 16936
},
{
"epoch": 10.0,
"grad_norm": 0.9994410872459412,
"learning_rate": 1e-05,
"loss": 0.3911,
"step": 21170
},
{
"epoch": 10.0,
"eval_accuracy": 0.8185673892554194,
"eval_f1_0: ": 0.752411575562701,
"eval_f1_1: ": 0.8568240981777613,
"eval_loss": 0.3467291593551636,
"eval_precision_0: ": 0.8147632311977716,
"eval_precision_1: ": 0.8205128205128205,
"eval_recall_0: ": 0.6989247311827957,
"eval_recall_1: ": 0.8964980544747082,
"eval_runtime": 673.4114,
"eval_samples_per_second": 3.151,
"eval_steps_per_second": 3.151,
"step": 21170
}
],
"logging_steps": 4234,
"max_steps": 42340,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 4234,
"total_flos": 2.448451500060672e+16,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}