{ "epoch": 1.0, "eval_loss": 2.1312263011932373, "eval_runtime": 2.6837, "eval_samples_per_second": 13.787, "eval_steps_per_second": 1.863, "perplexity": 8.425192302438928, "total_flos": 4161668422041600.0, "train_loss": 2.3460041029484513, "train_runtime": 71.1285, "train_samples_per_second": 6.439, "train_steps_per_second": 3.22 }