{
  "epoch": 0.9999197753710389,
  "eval_logits/chosen": -2.79840087890625,
  "eval_logits/rejected": -2.752188205718994,
  "eval_logps/chosen": -378.4407043457031,
  "eval_logps/rejected": -260.23724365234375,
  "eval_loss": 0.45464351773262024,
  "eval_rewards/accuracies": 0.7863636612892151,
  "eval_rewards/chosen": -1.0035351514816284,
  "eval_rewards/margins": 1.364441156387329,
  "eval_rewards/rejected": -2.367976188659668,
  "eval_runtime": 2783.2579,
  "eval_samples": 10555,
  "eval_samples_per_second": 3.792,
  "eval_steps_per_second": 0.474
}