{ "epoch": 1.0, "eval_loss": 2.029616117477417, "eval_runtime": 17.8752, "eval_samples_per_second": 21.706, "eval_steps_per_second": 2.741, "perplexity": 7.611164005057549, "total_flos": 4.1045168553984e+16, "train_loss": 2.2167040354207086, "train_runtime": 618.2687, "train_samples_per_second": 7.269, "train_steps_per_second": 3.634 }