File size: 2,324 Bytes
bbc4d64 ca209f5 1790f07 ca209f5 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 1790f07 bbc4d64 ca209f5 bbc4d64 ca209f5 bbc4d64 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 |
{
"best_metric": 0.7435600757598877,
"best_model_checkpoint": "output/queen/checkpoint-69",
"epoch": 1.0,
"global_step": 69,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 0.00013537785052914348,
"loss": 0.8946,
"step": 5
},
{
"epoch": 0.15,
"learning_rate": 0.0001300082017869573,
"loss": 1.1571,
"step": 10
},
{
"epoch": 0.22,
"learning_rate": 0.00012137631040942562,
"loss": 1.0891,
"step": 15
},
{
"epoch": 0.29,
"learning_rate": 0.00010994073605561692,
"loss": 1.0026,
"step": 20
},
{
"epoch": 0.37,
"learning_rate": 9.63089809342121e-05,
"loss": 0.8956,
"step": 25
},
{
"epoch": 0.44,
"learning_rate": 8.120521692221655e-05,
"loss": 1.0037,
"step": 30
},
{
"epoch": 0.51,
"learning_rate": 6.543181473690228e-05,
"loss": 0.9259,
"step": 35
},
{
"epoch": 0.59,
"learning_rate": 4.982671888105533e-05,
"loss": 0.9391,
"step": 40
},
{
"epoch": 0.66,
"learning_rate": 3.52189327703136e-05,
"loss": 0.897,
"step": 45
},
{
"epoch": 0.74,
"learning_rate": 2.2384478845846266e-05,
"loss": 0.969,
"step": 50
},
{
"epoch": 0.81,
"learning_rate": 1.2005173242556645e-05,
"loss": 0.9795,
"step": 55
},
{
"epoch": 0.88,
"learning_rate": 4.632405062861206e-06,
"loss": 1.0966,
"step": 60
},
{
"epoch": 0.96,
"learning_rate": 6.578444419609618e-07,
"loss": 0.9097,
"step": 65
},
{
"epoch": 1.0,
"eval_loss": 0.9767317771911621,
"eval_runtime": 2.0747,
"eval_samples_per_second": 46.272,
"eval_steps_per_second": 5.784,
"step": 68
},
{
"epoch": 1.0,
"eval_loss": 0.7435600757598877,
"eval_runtime": 1.811,
"eval_samples_per_second": 48.039,
"eval_steps_per_second": 6.074,
"step": 69
}
],
"max_steps": 138,
"num_train_epochs": 2,
"total_flos": 70418202624000.0,
"trial_name": null,
"trial_params": null
}
|