{ "epoch": 3.0, "eval_accuracy": 0.6240879264443259, "eval_loss": 1.9968321323394775, "eval_runtime": 5913.1596, "eval_samples": 2812170, "eval_samples_per_second": 475.578, "eval_steps_per_second": 1.858, "perplexity": 7.365685583966684, "train_loss": 2.243077999982859, "train_runtime": 411193.7405, "train_samples": 25309522, "train_samples_per_second": 184.654, "train_steps_per_second": 0.721 }