{
"epoch": 6.7809745229100065,
"eval_accuracy": 0.364555259244386,
"eval_loss": 3.7116007804870605,
"eval_runtime": 273.6863,
"eval_samples": 33767,
"eval_samples_per_second": 123.378,
"eval_steps_per_second": 3.858,
"perplexity": 40.919256875144555,
"total_flos": 5.861064073050849e+17,
"train_loss": 4.399306026785714,
"train_runtime": 93598.1238,
"train_samples": 660643,
"train_samples_per_second": 705.829,
"train_steps_per_second": 22.058
}