{ "epoch": 4.0, "total_flos": 9299872197181440.0, "train_loss": 2.19787335395813, "train_runtime": 9.6458, "train_samples_per_second": 12.441, "train_steps_per_second": 1.659 }