{ "epoch": 3.0, "eval_loss": 1.3419121503829956, "eval_runtime": 10.6724, "eval_samples_per_second": 14.055, "eval_steps_per_second": 1.78, "perplexity": 3.826353077140856, "train_loss": 1.3472231076148138, "train_runtime": 10021.615, "train_samples_per_second": 4.42, "train_steps_per_second": 0.276 }