{ "epoch": 2.0, "total_flos": 1.0833412255308841e+18, "train_loss": 0.5169055745715186, "train_runtime": 771.9486, "train_samples_per_second": 55.962, "train_steps_per_second": 0.435 }