{ "epoch": 91.0, "learning_rate": 1.0000000000000002e-07, "total_flos": 1.1760993126572918e+21, "train_loss": 0.1412498749900842, "train_runtime": 170277.6523, "train_samples_per_second": 7.678, "train_steps_per_second": 0.24 }