{ "epoch": 4.18, "eval_accuracy": 0.46381721409003707, "eval_loss": 3.0280144214630127, "eval_runtime": 1032.3382, "eval_samples": 308356, "eval_samples_per_second": 298.697, "eval_steps_per_second": 3.112, "perplexity": 20.656177381243463, "train_loss": 4.755463555369041, "train_runtime": 197998.775, "train_samples": 5858758, "train_samples_per_second": 2958.987, "train_steps_per_second": 30.823 }