{
  "epoch": 1.0,
  "eval_loss": 1.5488653182983398,
  "eval_runtime": 48.6887,
  "eval_samples_per_second": 10.906,
  "eval_steps_per_second": 1.376,
  "perplexity": 4.706127195454765,
  "total_flos": 4.381557669888e+16,
  "train_loss": 1.8077541630365208,
  "train_runtime": 1256.4921,
  "train_samples_per_second": 3.829,
  "train_steps_per_second": 1.915
}