{ "epoch": 1.0, "eval_loss": 1.8459237813949585, "eval_runtime": 73.2243, "eval_samples_per_second": 79.782, "eval_steps_per_second": 9.983, "perplexity": 6.333948272197309, "total_flos": 3.478541817358582e+17, "train_loss": 2.9001881553825744, "train_runtime": 774.5812, "train_samples_per_second": 30.024, "train_steps_per_second": 3.753 }