Llama-3.1-8B-Instruct-SAA-600 / eval_results.json
chchen's picture
End of training
680afe0 verified
raw
history blame contribute delete
657 Bytes
{
"epoch": 9.777777777777779,
"eval_logits/chosen": -0.34323057532310486,
"eval_logits/rejected": -0.4047623574733734,
"eval_logps/chosen": -0.07215116173028946,
"eval_logps/rejected": -0.6233159303665161,
"eval_loss": 0.09428545832633972,
"eval_odds_ratio_loss": 0.8242944478988647,
"eval_rewards/accuracies": 0.8833333253860474,
"eval_rewards/chosen": -0.0072151171043515205,
"eval_rewards/margins": 0.05511648207902908,
"eval_rewards/rejected": -0.06233159825205803,
"eval_runtime": 2.331,
"eval_samples_per_second": 25.74,
"eval_sft_loss": 0.01185599621385336,
"eval_steps_per_second": 12.87
}