{ "epoch": 1.0, "eval_loss": 1.9494917392730713, "eval_runtime": 54.4179, "eval_samples_per_second": 22.125, "eval_steps_per_second": 2.775, "perplexity": 7.025116082433238, "total_flos": 1.17399030595584e+17, "train_loss": 2.1091008744372672, "train_runtime": 1734.4968, "train_samples_per_second": 7.449, "train_steps_per_second": 3.724 }