{ "epoch": 1.0, "eval_loss": 2.0460915565490723, "eval_runtime": 9.9781, "eval_samples_per_second": 21.848, "eval_steps_per_second": 2.806, "perplexity": 7.7375999578361965, "total_flos": 2.4464433119232e+16, "train_loss": 2.247535785515151, "train_runtime": 357.9632, "train_samples_per_second": 7.462, "train_steps_per_second": 3.732 }