zephyr-7b-dpo-full / all_results.json
weijie210's picture
Model save
ae6db7b verified
raw
history blame contribute delete
742 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": -2.484065532684326,
"eval_logits/rejected": -2.4274542331695557,
"eval_logps/chosen": -305.43212890625,
"eval_logps/rejected": -294.2740783691406,
"eval_loss": 0.5714402198791504,
"eval_rewards/accuracies": 0.761904776096344,
"eval_rewards/chosen": -0.4765053391456604,
"eval_rewards/margins": 1.3102855682373047,
"eval_rewards/rejected": -1.7867907285690308,
"eval_runtime": 613.7286,
"eval_samples": 2000,
"eval_samples_per_second": 3.259,
"eval_steps_per_second": 0.103,
"train_loss": 0.5469513680846325,
"train_runtime": 31987.9403,
"train_samples": 61135,
"train_samples_per_second": 1.911,
"train_steps_per_second": 0.06
}