{ "epoch": 3.0, "eval_loss": 1.202345371246338, "eval_runtime": 73.2928, "eval_samples": 177, "eval_samples_per_second": 2.415, "eval_steps_per_second": 0.164, "perplexity": 3.3279129682384063, "total_flos": 4.846865511470285e+16, "train_loss": 1.5912532506997346, "train_runtime": 107034.0122, "train_samples": 17322, "train_samples_per_second": 0.486, "train_steps_per_second": 0.061 }