{ "epoch": 59.0, "learning_rate": 1.0000000000000002e-06, "total_flos": 2.151593295698903e+20, "train_loss": 0.11777938241923686, "train_runtime": 108362.28, "train_samples_per_second": 12.065, "train_steps_per_second": 0.378 }