{ "epoch": 1.0, "eval_loss": 1.9547652006149292, "eval_runtime": 29.9421, "eval_samples_per_second": 22.276, "eval_steps_per_second": 2.805, "perplexity": 7.0622606145625975, "total_flos": 7.557299011584e+16, "train_loss": 2.140284038331314, "train_runtime": 1100.1009, "train_samples_per_second": 7.543, "train_steps_per_second": 3.771 }