epoch = 3.0 train_loss = 1.3765672623247966 train_runtime = 7341.0199 train_samples_per_second = 99.099 train_steps_per_second = 12.388