super-mistral-bros-alpha / trainer_log.jsonl
DaertML's picture
Upload 12 files
672b46a verified
{"current_steps": 5, "total_steps": 459, "loss": 4.5464, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9985361990992455e-05, "epoch": 0.03, "percentage": 1.09, "elapsed_time": "0:01:44", "remaining_time": "2:38:37"}
{"current_steps": 10, "total_steps": 459, "loss": 3.5691, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9941465105674435e-05, "epoch": 0.07, "percentage": 2.18, "elapsed_time": "0:03:35", "remaining_time": "2:41:25"}
{"current_steps": 15, "total_steps": 459, "loss": 2.6628, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.986836074908616e-05, "epoch": 0.1, "percentage": 3.27, "elapsed_time": "0:05:28", "remaining_time": "2:41:57"}
{"current_steps": 20, "total_steps": 459, "loss": 1.6234, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.976613452940604e-05, "epoch": 0.13, "percentage": 4.36, "elapsed_time": "0:07:25", "remaining_time": "2:42:53"}
{"current_steps": 25, "total_steps": 459, "loss": 0.4965, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9634906157700036e-05, "epoch": 0.16, "percentage": 5.45, "elapsed_time": "0:09:18", "remaining_time": "2:41:33"}
{"current_steps": 30, "total_steps": 459, "loss": 0.2314, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9474829307735115e-05, "epoch": 0.2, "percentage": 6.54, "elapsed_time": "0:11:08", "remaining_time": "2:39:18"}
{"current_steps": 35, "total_steps": 459, "loss": 0.2109, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9286091436021015e-05, "epoch": 0.23, "percentage": 7.63, "elapsed_time": "0:12:58", "remaining_time": "2:37:06"}
{"current_steps": 40, "total_steps": 459, "loss": 0.243, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.906891356229103e-05, "epoch": 0.26, "percentage": 8.71, "elapsed_time": "0:14:47", "remaining_time": "2:34:54"}
{"current_steps": 45, "total_steps": 459, "loss": 0.1753, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.882355001067892e-05, "epoch": 0.29, "percentage": 9.8, "elapsed_time": "0:16:41", "remaining_time": "2:33:33"}
{"current_steps": 50, "total_steps": 459, "loss": 0.2237, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.855028811189496e-05, "epoch": 0.33, "percentage": 10.89, "elapsed_time": "0:18:31", "remaining_time": "2:31:34"}
{"current_steps": 55, "total_steps": 459, "loss": 0.1995, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.8249447866750025e-05, "epoch": 0.36, "percentage": 11.98, "elapsed_time": "0:20:24", "remaining_time": "2:29:52"}
{"current_steps": 60, "total_steps": 459, "loss": 0.259, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.792138157142158e-05, "epoch": 0.39, "percentage": 13.07, "elapsed_time": "0:22:13", "remaining_time": "2:27:48"}
{"current_steps": 60, "total_steps": 459, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.39, "percentage": 13.07, "elapsed_time": "0:22:13", "remaining_time": "2:27:48"}