|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 2.998504843008516, |
|
"global_step": 1440, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.42351716961498437, |
|
"eval_accuracy_0": 0.7588532883642496, |
|
"eval_accuracy_1": 0.046094750320102434, |
|
"eval_accuracy_2": 0.5985401459854015, |
|
"eval_loss": 0.80291348695755, |
|
"eval_runtime": 24.8435, |
|
"eval_samples_per_second": 77.364, |
|
"eval_steps_per_second": 77.364, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.4011446409989594, |
|
"eval_accuracy_0": 0.7470489038785835, |
|
"eval_accuracy_1": 0.18309859154929578, |
|
"eval_accuracy_2": 0.3375912408759124, |
|
"eval_loss": 0.7574263215065002, |
|
"eval_runtime": 24.6349, |
|
"eval_samples_per_second": 78.019, |
|
"eval_steps_per_second": 78.019, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.40790842872008326, |
|
"eval_accuracy_0": 0.8026981450252951, |
|
"eval_accuracy_1": 0.18693982074263765, |
|
"eval_accuracy_2": 0.2956204379562044, |
|
"eval_loss": 0.7730965614318848, |
|
"eval_runtime": 24.5617, |
|
"eval_samples_per_second": 78.252, |
|
"eval_steps_per_second": 78.252, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"step": 1440, |
|
"total_flos": 2507409848941452.0, |
|
"train_loss": 0.7177374945746527, |
|
"train_runtime": 2670.6543, |
|
"train_samples_per_second": 17.28, |
|
"train_steps_per_second": 0.539 |
|
} |
|
], |
|
"max_steps": 1440, |
|
"num_train_epochs": 3, |
|
"total_flos": 2507409848941452.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|