{
  "epoch": 19.999721059972106,
  "eval_accuracy": 0.47825513461811886,
  "eval_loss": 2.6862878799438477,
  "eval_runtime": 71.7425,
  "eval_samples": 60680,
  "eval_samples_per_second": 845.803,
  "eval_steps_per_second": 13.228,
  "perplexity": 14.677091545354612,
  "total_flos": 1.498591326633984e+18,
  "train_loss": 2.8105185209001813,
  "train_runtime": 30265.3714,
  "train_samples": 573595,
  "train_samples_per_second": 379.044,
  "train_steps_per_second": 1.48
}