{ "epoch": 5.0, "total_flos": 3.11005644392448e+16, "train_loss": 0.03944617702703827, "train_runtime": 23402.751, "train_samples_per_second": 10.101, "train_steps_per_second": 0.316 }