{ | |
"epoch": 0.9999939379610938, | |
"eval_accuracy": 0.4560332193453835, | |
"eval_loss": 2.741572141647339, | |
"eval_runtime": 5.7613, | |
"eval_samples": 300, | |
"eval_samples_per_second": 52.072, | |
"eval_steps_per_second": 6.596, | |
"num_input_tokens_seen": 10810818560, | |
"perplexity": 15.511351979678839, | |
"total_flos": 1.199767969182253e+19, | |
"train_loss": 2.7848671950609445, | |
"train_runtime": 243040.2706, | |
"train_samples": 5278746, | |
"train_samples_per_second": 21.72, | |
"train_steps_per_second": 0.085 | |
} |