smolm-autoreg-bpe-seed_555 / all_results.json
kanishka's picture
End of training
67d5a5d
raw
history blame
442 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.5416644525230297,
"eval_loss": 2.2877631187438965,
"eval_runtime": 4.555,
"eval_samples": 5038,
"eval_samples_per_second": 1106.038,
"eval_steps_per_second": 2.195,
"perplexity": 9.852873305063827,
"train_loss": 2.5528629182903297,
"train_runtime": 747.7642,
"train_samples": 52812,
"train_samples_per_second": 706.265,
"train_steps_per_second": 11.046
}