{ "epoch": 3.689182805857345, "eval_dpo_loss": 2703.03125, "eval_logits": -0.4645061194896698, "eval_logps": -85.19200134277344, "eval_loss": 5280.861328125, "eval_objective": 5329.05712890625, "eval_ranking_idealized": 0.5212215185165405, "eval_ranking_idealized_expo": 0.5212215185165405, "eval_ranking_simple": 0.5263975262641907, "eval_regularize": 5329.05712890625, "eval_runtime": 308.7203, "eval_samples": 5790, "eval_samples_per_second": 18.755, "eval_steps_per_second": 1.565, "eval_wo_beta": 14.025749206542969 }