{ "epoch": 3.0, "eval_loss": 0.06556913256645203, "eval_mse": 0.06556913494220615, "eval_runtime": 13.1744, "eval_samples": 10000, "eval_samples_per_second": 759.049, "eval_steps_per_second": 94.881, "total_flos": 6357984788759040.0, "train_loss": 0.07220485827706652, "train_runtime": 846.782, "train_samples": 128690, "train_samples_per_second": 455.926, "train_steps_per_second": 7.125 }