{ "epoch": 6.11, "eval_accuracy": 0.4312818008502973, "eval_loss": 3.2895166873931885, "eval_runtime": 812.9497, "eval_samples": 308356, "eval_samples_per_second": 379.305, "eval_steps_per_second": 3.449, "perplexity": 26.829893296112427, "train_loss": 5.144133388285963, "train_runtime": 197998.8021, "train_samples": 5858758, "train_samples_per_second": 2958.987, "train_steps_per_second": 26.9 }