{ "epoch": 3.0, "eval_accuracy": 0.4858960641696518, "eval_loss": 3.0558760166168213, "eval_runtime": 5966.6425, "eval_samples": 2812170, "eval_samples_per_second": 471.315, "eval_steps_per_second": 1.841, "perplexity": 21.239783783063608, "train_loss": 3.505743960671732, "train_runtime": 1074369.6431, "train_samples": 25309522, "train_samples_per_second": 70.673, "train_steps_per_second": 0.276 }