yakazimir's picture
End of training
aeebb44 verified
raw
history blame contribute delete
782 Bytes
{
"epoch": 0.9989071038251366,
"eval_logits/chosen": -1.4181982278823853,
"eval_logits/rejected": -1.3836873769760132,
"eval_logps/chosen": -1.1345627307891846,
"eval_logps/rejected": -1.5455946922302246,
"eval_loss": 2.404977321624756,
"eval_rewards/accuracies": 0.8102409839630127,
"eval_rewards/chosen": -11.345626831054688,
"eval_rewards/margins": 4.110320091247559,
"eval_rewards/rejected": -15.45594596862793,
"eval_runtime": 33.5188,
"eval_samples": 1318,
"eval_samples_per_second": 39.321,
"eval_steps_per_second": 2.476,
"total_flos": 0.0,
"train_loss": 3.252214796955267,
"train_runtime": 5969.5229,
"train_samples": 58558,
"train_samples_per_second": 9.809,
"train_steps_per_second": 0.077
}