{
"epoch": 0.9989786886362089,
"eval_loss": 0.8981775641441345,
"eval_runtime": 2707.4811,
"eval_samples": 459267,
"eval_samples_per_second": 169.629,
"eval_steps_per_second": 0.663,
"perplexity": 2.455124724281883,
"total_flos": 6.402304001609564e+17,
"train_loss": 17.88196479689204,
"train_runtime": 28909.2161,
"train_samples": 1879858,
"train_samples_per_second": 65.026,
"train_steps_per_second": 0.032
}