{ "epoch": 37.0, "learning_rate": 1e-05, "total_flos": 1.318896404308369e+20, "train_loss": 0.4464974437295797, "train_runtime": 4164.1679, "train_samples_per_second": 86.596, "train_steps_per_second": 2.738 }