{ "epoch": 3.0, "eval_accuracy": 0.8481199261869228, "eval_loss": 0.678066611289978, "eval_runtime": 15544.5436, "eval_samples": 2374416, "eval_samples_per_second": 152.749, "eval_steps_per_second": 1.193, "perplexity": 1.9700651461010967, "total_flos": 7.501219159976442e+18, "train_loss": 0.20371022846941, "train_runtime": 62599.538, "train_samples": 9497662, "train_samples_per_second": 455.163, "train_steps_per_second": 3.556 }