{ | |
"epoch": 6.74, | |
"eval_loss": 2.268062114715576, | |
"eval_runtime": 340.6941, | |
"eval_samples": 300000, | |
"eval_samples_per_second": 880.555, | |
"eval_steps_per_second": 55.035, | |
"perplexity": 9.660661408946421, | |
"train_loss": 2.4076748518880207, | |
"train_runtime": 247856.7094, | |
"train_samples": 5700001, | |
"train_samples_per_second": 154.928, | |
"train_steps_per_second": 9.683 | |
} |