{ "epoch": 0.045454545454545456, "total_flos": 280583108296704.0, "train_loss": 2.258466958999634, "train_runtime": 267.1515, "train_samples_per_second": 0.06, "train_steps_per_second": 0.007 }