{ "epoch": 3.0, "eval_loss": 1.202375054359436, "eval_runtime": 3381.3728, "eval_samples": 132344, "eval_samples_per_second": 39.139, "eval_steps_per_second": 4.892, "perplexity": 3.3280117525215283, "train_loss": 1.3875968830903724, "train_runtime": 695161.7821, "train_samples": 2486745, "train_samples_per_second": 10.732, "train_steps_per_second": 0.335 }