zephyr-7b-wpo-lora / eval_results.json
Wenboz's picture
End of training
6c03901 verified
raw
history blame contribute delete
622 Bytes
{
"epoch": 0.8,
"eval_logits/chosen": -0.5457379221916199,
"eval_logits/rejected": -0.5458806753158569,
"eval_logps/chosen": -317.97125244140625,
"eval_logps/ref_response": -0.5449998378753662,
"eval_logps/rejected": -331.12335205078125,
"eval_loss": 0.6931814551353455,
"eval_rewards/accuracies": 0.484375,
"eval_rewards/chosen": -0.001830391469411552,
"eval_rewards/margins": -0.000241550849750638,
"eval_rewards/rejected": -0.0015888408524915576,
"eval_runtime": 54.0012,
"eval_samples": 240,
"eval_samples_per_second": 4.444,
"eval_steps_per_second": 0.148
}