{
  "epoch": 1.0,
  "eval_accuracy": 0.4675585581782436,
  "eval_loss": 3.0689306259155273,
  "eval_runtime": 87.4789,
  "eval_samples": 37878,
  "eval_samples_per_second": 432.996,
  "eval_steps_per_second": 54.127,
  "perplexity": 21.518878635401286,
  "total_flos": 2.4124793739319296e+16,
  "train_loss": 3.571538051929227,
  "train_runtime": 3663.4284,
  "train_samples": 725349,
  "train_samples_per_second": 197.997,
  "train_steps_per_second": 24.75
}