{ "epoch": 1.0, "eval_loss": 1.9266319274902344, "eval_runtime": 63.6699, "eval_samples_per_second": 15.549, "eval_steps_per_second": 1.948, "perplexity": 6.866344904696836, "total_flos": 1.5640093507584e+17, "train_loss": 2.1807824082961527, "train_runtime": 2484.8584, "train_samples_per_second": 6.911, "train_steps_per_second": 3.456 }