{ "epoch": 3.0, "eval_loss": 1.334074854850769, "eval_runtime": 4.3825, "eval_samples": 153, "eval_samples_per_second": 34.912, "eval_steps_per_second": 4.564, "perplexity": 3.7964820242969743, "total_flos": 1.1730479287894016e+16, "train_loss": 1.7010253453222524, "train_runtime": 4017.837, "train_samples": 14818, "train_samples_per_second": 11.064, "train_steps_per_second": 2.766 }