zephyr0-7b-ultra-p-0.05 / all_results.json
tongliuphysics's picture
Model save
02b30b9 verified
raw
history blame contribute delete
545 Bytes
{
"epoch": 0.9989701338825953,
"eval_logits/chosen": -2.065095901489258,
"eval_logits/rejected": -1.9689290523529053,
"eval_logps/chosen": -335.3676452636719,
"eval_logps/rejected": -427.32891845703125,
"eval_loss": 0.5029041767120361,
"eval_rewards/accuracies": 0.75,
"eval_rewards/chosen": -1.1300084590911865,
"eval_rewards/margins": 0.865437388420105,
"eval_rewards/rejected": -1.995445728302002,
"eval_runtime": 65.1127,
"eval_samples_per_second": 15.358,
"eval_steps_per_second": 0.246
}