{ "epoch": 1.0, "eval_accuracy": 0.5606630977618748, "eval_loss": 2.634730815887451, "eval_runtime": 407.3409, "eval_samples": 36612, "eval_samples_per_second": 89.88, "eval_steps_per_second": 11.236, "perplexity": 13.939559650092963, "total_flos": 4.634223291773338e+16, "train_loss": 3.132497888326312, "train_runtime": 20429.0413, "train_samples": 699309, "train_samples_per_second": 34.231, "train_steps_per_second": 4.279 }