{ "epoch": 1.0, "eval_loss": 1.9218220710754395, "eval_runtime": 62.1945, "eval_samples_per_second": 22.269, "eval_steps_per_second": 2.798, "perplexity": 6.833398069901086, "total_flos": 1.1351431053312e+17, "train_loss": 2.079003376893422, "train_runtime": 1659.922, "train_samples_per_second": 7.509, "train_steps_per_second": 3.754 }