{ | |
"epoch": 20.0, | |
"eval_accuracy": 0.5309790230016276, | |
"eval_loss": 2.4374380111694336, | |
"eval_runtime": 124.2703, | |
"eval_samples": 46951, | |
"eval_samples_per_second": 377.813, | |
"eval_steps_per_second": 5.906, | |
"perplexity": 11.443684561720477, | |
"total_flos": 1.19390876011008e+18, | |
"train_loss": 2.0466036078604977, | |
"train_runtime": 62067.1587, | |
"train_samples": 453383, | |
"train_samples_per_second": 146.094, | |
"train_steps_per_second": 4.566 | |
} |