{ "epoch": 1.0, "eval_loss": 1.5753202438354492, "eval_runtime": 30.3994, "eval_samples_per_second": 15.461, "eval_steps_per_second": 1.941, "perplexity": 4.832288881071616, "total_flos": 3.505428283392e+16, "train_loss": 1.8155303717278815, "train_runtime": 577.5445, "train_samples_per_second": 6.664, "train_steps_per_second": 3.333 }