{ "epoch": 3.0, "total_flos": 4.559176483209216e+16, "train_loss": 0.70023385491034, "train_runtime": 1270.7835, "train_samples_per_second": 3.116, "train_steps_per_second": 0.779 }