{
  "epoch": 5.0,
  "eval_accuracy": 0.9053223443951083,
  "eval_loss": 0.45334097743034363,
  "eval_runtime": 83.1276,
  "eval_samples": 12451,
  "eval_samples_per_second": 149.782,
  "eval_steps_per_second": 1.564,
  "perplexity": 1.573560643713862,
  "total_flos": 2.898276322152499e+17,
  "train_loss": 0.5986486167209296,
  "train_runtime": 10447.1842,
  "train_samples": 220179,
  "train_samples_per_second": 105.377,
  "train_steps_per_second": 1.098
}