{ "epoch": 1.0, "eval_loss": 1.8229724168777466, "eval_runtime": 65.6293, "eval_samples_per_second": 10.895, "eval_steps_per_second": 1.371, "perplexity": 6.190231078134954, "total_flos": 7.717588795392e+16, "train_loss": 1.9823122004278713, "train_runtime": 2216.0595, "train_samples_per_second": 3.824, "train_steps_per_second": 1.912 }