{ "epoch": 1.0, "eval_loss": 2.014606237411499, "eval_runtime": 107.9002, "eval_samples_per_second": 13.679, "eval_steps_per_second": 1.715, "perplexity": 7.497774456787433, "total_flos": 1.594701201408e+17, "train_loss": 2.1740849319013575, "train_runtime": 2909.2573, "train_samples_per_second": 6.019, "train_steps_per_second": 3.009 }