{ "epoch": 10.11, "eval_loss": 1.9157038927078247, "eval_runtime": 467.8394, "eval_samples": 400000, "eval_samples_per_second": 854.994, "eval_steps_per_second": 53.437, "perplexity": 6.791717755466664, "train_loss": 2.0669708544921876, "train_runtime": 368218.0367, "train_samples": 7600002, "train_samples_per_second": 208.572, "train_steps_per_second": 6.518 }