1b_distill_width_prune / all_results.json
friendshipkim's picture
End of training
ea77953 verified
raw
history blame contribute delete
411 Bytes
{
"epoch": 0.08267797093601252,
"eval_loss": 1.5711677074432373,
"eval_runtime": 394.1141,
"eval_samples": 4096,
"eval_samples_per_second": 10.393,
"eval_steps_per_second": 2.598,
"total_flos": 0.0,
"train_loss": 6.551032936291113e-05,
"train_runtime": 86.8457,
"train_samples": 15482525,
"train_samples_per_second": 14738.777,
"train_steps_per_second": 230.293
}