{ "epoch": 1.0, "eval_loss": 1.9683517217636108, "eval_runtime": 30.1976, "eval_samples_per_second": 22.088, "eval_steps_per_second": 2.782, "perplexity": 7.158866953723834, "total_flos": 7.54868493877248e+16, "train_loss": 2.153304632613963, "train_runtime": 1112.8562, "train_samples_per_second": 7.456, "train_steps_per_second": 3.728 }