zephyr-gemma-2-9b-dpo-4k / eval_results.json
tanliboy's picture
End of training
aebef63 verified
raw
history blame contribute delete
586 Bytes
{
"epoch": 0.998691442030882,
"eval_logits/chosen": -11.360100746154785,
"eval_logits/rejected": -11.085914611816406,
"eval_logps/chosen": -459.7269592285156,
"eval_logps/rejected": -488.03009033203125,
"eval_loss": 0.5439372658729553,
"eval_rewards/accuracies": 0.671999990940094,
"eval_rewards/chosen": -0.9089793562889099,
"eval_rewards/margins": 0.5084334015846252,
"eval_rewards/rejected": -1.4174127578735352,
"eval_runtime": 223.5785,
"eval_samples": 2000,
"eval_samples_per_second": 8.945,
"eval_steps_per_second": 1.118
}