zephyr-7b-dpo-qlora / eval_results.json
jikaixuan's picture
Model save
44e3e84 verified
raw
history blame
569 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": -2.0918362140655518,
"eval_logits/rejected": -2.03544020652771,
"eval_logps/chosen": -271.2979431152344,
"eval_logps/rejected": -267.2720642089844,
"eval_loss": 1721.1201171875,
"eval_rewards/accuracies": 0.773809552192688,
"eval_rewards/chosen": -0.06273359060287476,
"eval_rewards/margins": 0.16227789223194122,
"eval_rewards/rejected": -0.22501146793365479,
"eval_runtime": 548.8776,
"eval_samples": 2000,
"eval_samples_per_second": 3.644,
"eval_steps_per_second": 0.115
}