{ | |
"epoch": 1.0, | |
"eval_accuracy": 0.5606630977618748, | |
"eval_loss": 2.634730815887451, | |
"eval_runtime": 407.3409, | |
"eval_samples": 36612, | |
"eval_samples_per_second": 89.88, | |
"eval_steps_per_second": 11.236, | |
"perplexity": 13.939559650092963, | |
"total_flos": 4.634223291773338e+16, | |
"train_loss": 3.132497888326312, | |
"train_runtime": 20429.0413, | |
"train_samples": 699309, | |
"train_samples_per_second": 34.231, | |
"train_steps_per_second": 4.279 | |
} |