File size: 2,567 Bytes
1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 bc63d9b 1e36d27 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"eval_steps": 500,
"global_step": 2815,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 1.6000000000000003e-05,
"loss": 3.3692,
"step": 563
},
{
"epoch": 1.0,
"eval_accuracy": 0.872,
"eval_f1": 0.856009752654711,
"eval_loss": 3.21221923828125,
"eval_runtime": 16.3666,
"eval_samples_per_second": 61.1,
"eval_steps_per_second": 3.849,
"step": 563
},
{
"epoch": 2.0,
"learning_rate": 1.2e-05,
"loss": 3.0963,
"step": 1126
},
{
"epoch": 2.0,
"eval_accuracy": 0.866,
"eval_f1": 0.8624612482571968,
"eval_loss": 3.1044771671295166,
"eval_runtime": 16.3224,
"eval_samples_per_second": 61.265,
"eval_steps_per_second": 3.86,
"step": 1126
},
{
"epoch": 3.0,
"learning_rate": 8.000000000000001e-06,
"loss": 2.8698,
"step": 1689
},
{
"epoch": 3.0,
"eval_accuracy": 0.882,
"eval_f1": 0.8755033031176542,
"eval_loss": 3.1409871578216553,
"eval_runtime": 16.3796,
"eval_samples_per_second": 61.051,
"eval_steps_per_second": 3.846,
"step": 1689
},
{
"epoch": 4.0,
"learning_rate": 4.000000000000001e-06,
"loss": 2.6212,
"step": 2252
},
{
"epoch": 4.0,
"eval_accuracy": 0.876,
"eval_f1": 0.8701998582565557,
"eval_loss": 3.2119336128234863,
"eval_runtime": 16.3349,
"eval_samples_per_second": 61.219,
"eval_steps_per_second": 3.857,
"step": 2252
},
{
"epoch": 5.0,
"learning_rate": 0.0,
"loss": 2.407,
"step": 2815
},
{
"epoch": 5.0,
"eval_accuracy": 0.885,
"eval_f1": 0.8788301734570391,
"eval_loss": 3.269321918487549,
"eval_runtime": 16.3269,
"eval_samples_per_second": 61.249,
"eval_steps_per_second": 3.859,
"step": 2815
},
{
"epoch": 5.0,
"step": 2815,
"total_flos": 4.169197960165814e+16,
"train_loss": 2.8726869085118785,
"train_runtime": 3265.1327,
"train_samples_per_second": 13.782,
"train_steps_per_second": 0.862
}
],
"logging_steps": 500,
"max_steps": 2815,
"num_train_epochs": 5,
"save_steps": 500,
"total_flos": 4.169197960165814e+16,
"trial_name": null,
"trial_params": null
}
|