{ "epoch": 1.0, "eval_loss": 1.7925077676773071, "eval_runtime": 19.1715, "eval_samples_per_second": 184.076, "eval_steps_per_second": 5.79, "perplexity": 6.004491470966308, "total_flos": 2.0294485407275418e+17, "train_loss": 3.4696031336514457, "train_runtime": 269.8562, "train_samples_per_second": 50.256, "train_steps_per_second": 1.571 }