{
    "epoch": 2.995008319467554,
    "eval_accuracy": 0.6832919793707865,
    "eval_loss": 0.5938892960548401,
    "eval_runtime": 94.4623,
    "eval_samples": 921,
    "eval_samples_per_second": 9.75,
    "eval_steps_per_second": 4.88,
    "perplexity": 1.8110183222577882,
    "total_flos": 5.0830773065036595e+17,
    "train_loss": 0.6010428385822861,
    "train_runtime": 4607.4026,
    "train_samples": 7211,
    "train_samples_per_second": 4.695,
    "train_steps_per_second": 0.293
}