{ | |
"epoch": 3.0, | |
"eval_accuracy": 0.8481199261869228, | |
"eval_loss": 0.678066611289978, | |
"eval_runtime": 15544.5436, | |
"eval_samples": 2374416, | |
"eval_samples_per_second": 152.749, | |
"eval_steps_per_second": 1.193, | |
"perplexity": 1.9700651461010967, | |
"total_flos": 7.501219159976442e+18, | |
"train_loss": 0.20371022846941, | |
"train_runtime": 62599.538, | |
"train_samples": 9497662, | |
"train_samples_per_second": 455.163, | |
"train_steps_per_second": 3.556 | |
} |