{
"epoch": 1.0,
"eval_accuracy": 0.5387296045953106,
"eval_loss": 2.923440933227539,
"eval_runtime": 126.5222,
"eval_samples": 11620,
"eval_samples_per_second": 91.842,
"eval_steps_per_second": 11.484,
"perplexity": 18.60519668247528,
"total_flos": 1.5038202327662592e+16,
"train_loss": 3.3210895868885175,
"train_runtime": 6630.0799,
"train_samples": 226928,
"train_samples_per_second": 34.227,
"train_steps_per_second": 4.278
}