zephyr-7b-dpo-full / all_results.json
lewtun's picture
lewtun HF staff
Model save
b227adb
raw
history blame
730 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": 0.6529867053031921,
"eval_logits/rejected": 1.5730761289596558,
"eval_logps/chosen": -357.2324523925781,
"eval_logps/rejected": -451.466064453125,
"eval_loss": 0.5028161406517029,
"eval_rewards/accuracies": 0.765625,
"eval_rewards/chosen": -0.9468507170677185,
"eval_rewards/margins": 0.946345865726471,
"eval_rewards/rejected": -1.8931965827941895,
"eval_runtime": 89.0083,
"eval_samples": 2000,
"eval_samples_per_second": 22.47,
"eval_steps_per_second": 0.36,
"train_loss": 0.5366686437918052,
"train_runtime": 5328.4749,
"train_samples": 61135,
"train_samples_per_second": 11.473,
"train_steps_per_second": 0.09
}