{ "epoch": 1.995276334435522, "eval_dpo_loss": 1.8786616325378418, "eval_logits": -0.8508970141410828, "eval_logps": -81.16841125488281, "eval_loss": 1.9399291276931763, "eval_objective": 1.8786616325378418, "eval_ranking_simple": 0.534679114818573, "eval_runtime": 616.6991, "eval_samples": 5790, "eval_samples_per_second": 9.389, "eval_steps_per_second": 0.783 }