phi-2-dpo-ultrachat-lora / eval_results.json
lole25's picture
Model save
b80f3e8 verified
raw
history blame
574 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": 0.7827913761138916,
"eval_logits/rejected": 0.8020623326301575,
"eval_logps/chosen": -92.44380187988281,
"eval_logps/rejected": -95.30902099609375,
"eval_loss": 0.6912217736244202,
"eval_rewards/accuracies": 0.3179999887943268,
"eval_rewards/chosen": -0.00716440798714757,
"eval_rewards/margins": 0.00395576748996973,
"eval_rewards/rejected": -0.011120175942778587,
"eval_runtime": 273.2522,
"eval_samples": 2000,
"eval_samples_per_second": 7.319,
"eval_steps_per_second": 0.457
}