hogru's picture
Update tokenizer, bump hf versions
ce10699
raw
history blame contribute delete
422 Bytes
{
"epoch": 31.0,
"test_accuracy": 0.5044041304365378,
"test_loss": 0.3887753188610077,
"test_perplexity": 1.4751730705300097,
"test_runtime": 1.9728,
"test_samples_per_second": 1184.637,
"test_steps_per_second": 74.515,
"train_loss": 0.7912082670869731,
"train_runtime": 664.7096,
"train_samples": 7878,
"train_samples_per_second": 592.59,
"train_steps_per_second": 18.504
}