gemma2b-summarize-gpt4o-256k / all_results.json
chansung's picture
End of training
a217bd8 verified
raw
history blame
415 Bytes
{
"epoch": 14.961571306575577,
"eval_loss": 2.482285976409912,
"eval_runtime": 0.5289,
"eval_samples": 25,
"eval_samples_per_second": 18.909,
"eval_steps_per_second": 1.891,
"total_flos": 5.145390446595277e+18,
"train_loss": 1.0581742508226333,
"train_runtime": 45587.0719,
"train_samples": 258442,
"train_samples_per_second": 9.241,
"train_steps_per_second": 0.096
}