smolm-autoreg-bpe-seed_888 / all_results.json
kanishka's picture
End of training
25633b5
raw
history blame
443 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.5425975187003966,
"eval_loss": 2.2831156253814697,
"eval_runtime": 4.4985,
"eval_samples": 5038,
"eval_samples_per_second": 1119.928,
"eval_steps_per_second": 2.223,
"perplexity": 9.807188384190734,
"train_loss": 2.5465449372446276,
"train_runtime": 743.7716,
"train_samples": 52812,
"train_samples_per_second": 710.057,
"train_steps_per_second": 11.106
}