File size: 2,247 Bytes
53fc0f2 579cd93 6b08339 148c01d 6b08339 53fc0f2 148c01d cef001b 148c01d cef001b 5abe211 5d65a7b cef001b 5d65a7b cef001b 5d65a7b 579cd93 e3d98d9 6b08339 4ea6138 53fc0f2 148c01d 6789a54 a353654 6789a54 148c01d 6b08339 a353654 53fc0f2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 |
{
"best_metric": 4.924107074737549,
"best_model_checkpoint": "ner-bert-ingredients/checkpoint-20",
"epoch": 50.0,
"eval_steps": 10,
"global_step": 50,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 10.0,
"learning_rate": 4e-05,
"loss": 0.0466,
"step": 10
},
{
"epoch": 10.0,
"eval_loss": 4.74609375,
"eval_runtime": 0.0189,
"eval_samples_per_second": 52.922,
"eval_steps_per_second": 52.922,
"step": 10
},
{
"epoch": 20.0,
"learning_rate": 4e-05,
"loss": 0.0213,
"step": 20
},
{
"epoch": 20.0,
"eval_loss": 4.924107074737549,
"eval_runtime": 0.0183,
"eval_samples_per_second": 54.52,
"eval_steps_per_second": 54.52,
"step": 20
},
{
"epoch": 30.0,
"learning_rate": 3e-05,
"loss": 0.01,
"step": 30
},
{
"epoch": 30.0,
"eval_loss": 5.040736675262451,
"eval_runtime": 0.0178,
"eval_samples_per_second": 56.023,
"eval_steps_per_second": 56.023,
"step": 30
},
{
"epoch": 40.0,
"learning_rate": 2e-05,
"loss": 0.0063,
"step": 40
},
{
"epoch": 40.0,
"eval_loss": 5.1612725257873535,
"eval_runtime": 0.0185,
"eval_samples_per_second": 54.098,
"eval_steps_per_second": 54.098,
"step": 40
},
{
"epoch": 50.0,
"learning_rate": 4e-05,
"loss": 0.0043,
"step": 50
},
{
"epoch": 50.0,
"eval_loss": 5.35546875,
"eval_runtime": 0.0182,
"eval_samples_per_second": 55.091,
"eval_steps_per_second": 55.091,
"step": 50
},
{
"epoch": 50.0,
"step": 50,
"total_flos": 32856154788600.0,
"train_loss": 0.0008505997806787491,
"train_runtime": 23.3473,
"train_samples_per_second": 19.274,
"train_steps_per_second": 2.142
}
],
"logging_steps": 10,
"max_steps": 50,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 10,
"total_flos": 32856154788600.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}
|