{ "epoch": 3.0, "eval_loss": 0.9941670894622803, "eval_runtime": 97.2481, "eval_samples": 22063, "eval_samples_per_second": 226.873, "eval_steps_per_second": 28.36, "perplexity": 2.7024724858012354, "total_flos": 1.29759190843392e+17, "train_loss": 1.2568308499351457, "train_runtime": 14727.5851, "train_samples": 250048, "train_samples_per_second": 50.935, "train_steps_per_second": 0.796 }