{ "epoch": 2.64, "total_flos": 5.125448142246298e+16, "train_loss": 2.5212928454081216, "train_runtime": 93.9881, "train_samples_per_second": 24.737, "train_steps_per_second": 0.192 }