{
  "epoch": 0.4,
  "eval_loss": 0.5791521668434143,
  "eval_runtime": 501.8375,
  "eval_samples": 1000,
  "eval_samples_per_second": 9.401,
  "eval_steps_per_second": 4.701,
  "perplexity": 1.784524809889192,
  "train_loss": 0.6467895458984375,
  "train_runtime": 73141.1233,
  "train_samples": 100000,
  "train_samples_per_second": 2.734,
  "train_steps_per_second": 0.342
}