{ "epoch": 3.0, "eval_accuracy": 0.8641530412656662, "eval_loss": 0.627652108669281, "eval_runtime": 2741.9492, "eval_samples": 533443, "eval_samples_per_second": 194.549, "eval_steps_per_second": 6.08, "perplexity": 1.8732073248670145, "train_loss": 0.7972901372973573, "train_runtime": 334073.6243, "train_samples": 10071323, "train_samples_per_second": 90.441, "train_steps_per_second": 2.826 }