{ "epoch": 1.0, "eval_loss": 1.9124690294265747, "eval_runtime": 23.4799, "eval_samples_per_second": 40.332, "eval_steps_per_second": 5.068, "perplexity": 6.769782974219858, "total_flos": 9.539063611392e+16, "train_loss": 2.0977558706333466, "train_runtime": 845.4487, "train_samples_per_second": 12.389, "train_steps_per_second": 6.194 }