{ "epoch": 40.0, "total_flos": 6.164974248394752e+16, "train_loss": 0.3415180742740631, "train_runtime": 367.0026, "train_samples_per_second": 6.757, "train_steps_per_second": 0.109 }