{ "epoch": 1.0, "eval_loss": 2.0819287300109863, "eval_runtime": 170.7493, "eval_samples_per_second": 10.893, "eval_steps_per_second": 1.365, "perplexity": 8.019922271599825, "total_flos": 1.3987105112064e+17, "train_loss": 2.1709037589008475, "train_runtime": 4004.8154, "train_samples_per_second": 3.835, "train_steps_per_second": 1.917 }