{
  "epoch": 1.0,
  "eval_loss": 2.448012590408325,
  "eval_runtime": 1408.7239,
  "eval_samples_per_second": 8.454,
  "eval_steps_per_second": 0.529,
  "perplexity": 11.56533879845621,
  "total_flos": 8.45892909419987e+17,
  "train_loss": 2.683517217184325,
  "train_runtime": 1637.9851,
  "train_samples_per_second": 56.701,
  "train_steps_per_second": 3.544
}