{ "best_metric": 0.021361960098147392, "best_model_checkpoint": "gpt3_finetuned_model/checkpoint-15024", "epoch": 1.0, "eval_steps": 500, "global_step": 15024, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.03, "learning_rate": 1.966719914802982e-05, "loss": 0.0219, "step": 500 }, { "epoch": 0.07, "learning_rate": 1.933439829605964e-05, "loss": 0.012, "step": 1000 }, { "epoch": 0.1, "learning_rate": 1.900159744408946e-05, "loss": 0.0141, "step": 1500 }, { "epoch": 0.13, "learning_rate": 1.866879659211928e-05, "loss": 0.0096, "step": 2000 }, { "epoch": 0.17, "learning_rate": 1.8335995740149097e-05, "loss": 0.0135, "step": 2500 }, { "epoch": 0.2, "learning_rate": 1.8003194888178915e-05, "loss": 0.021, "step": 3000 }, { "epoch": 0.23, "learning_rate": 1.7670394036208734e-05, "loss": 0.0125, "step": 3500 }, { "epoch": 0.27, "learning_rate": 1.7337593184238552e-05, "loss": 0.0084, "step": 4000 }, { "epoch": 0.3, "learning_rate": 1.700479233226837e-05, "loss": 0.0128, "step": 4500 }, { "epoch": 0.33, "learning_rate": 1.6671991480298192e-05, "loss": 0.0142, "step": 5000 }, { "epoch": 0.37, "learning_rate": 1.633919062832801e-05, "loss": 0.0143, "step": 5500 }, { "epoch": 0.4, "learning_rate": 1.600638977635783e-05, "loss": 0.0087, "step": 6000 }, { "epoch": 0.43, "learning_rate": 1.5673588924387647e-05, "loss": 0.0085, "step": 6500 }, { "epoch": 0.47, "learning_rate": 1.5340788072417466e-05, "loss": 0.0122, "step": 7000 }, { "epoch": 0.5, "learning_rate": 1.5007987220447286e-05, "loss": 0.0126, "step": 7500 }, { "epoch": 0.53, "learning_rate": 1.4675186368477104e-05, "loss": 0.014, "step": 8000 }, { "epoch": 0.57, "learning_rate": 1.4342385516506923e-05, "loss": 0.0086, "step": 8500 }, { "epoch": 0.6, "learning_rate": 1.4009584664536741e-05, "loss": 0.0094, "step": 9000 }, { "epoch": 0.63, "learning_rate": 1.3676783812566561e-05, "loss": 0.0136, "step": 9500 }, { "epoch": 0.67, "learning_rate": 1.334398296059638e-05, "loss": 0.0057, "step": 10000 }, { "epoch": 0.7, "learning_rate": 1.30111821086262e-05, "loss": 0.0126, "step": 10500 }, { "epoch": 0.73, "learning_rate": 1.2678381256656018e-05, "loss": 0.013, "step": 11000 }, { "epoch": 0.77, "learning_rate": 1.2345580404685838e-05, "loss": 0.0096, "step": 11500 }, { "epoch": 0.8, "learning_rate": 1.2012779552715656e-05, "loss": 0.0068, "step": 12000 }, { "epoch": 0.83, "learning_rate": 1.1679978700745476e-05, "loss": 0.0057, "step": 12500 }, { "epoch": 0.87, "learning_rate": 1.1347177848775295e-05, "loss": 0.0062, "step": 13000 }, { "epoch": 0.9, "learning_rate": 1.1014376996805112e-05, "loss": 0.0138, "step": 13500 }, { "epoch": 0.93, "learning_rate": 1.0681576144834932e-05, "loss": 0.007, "step": 14000 }, { "epoch": 0.97, "learning_rate": 1.034877529286475e-05, "loss": 0.0054, "step": 14500 }, { "epoch": 1.0, "learning_rate": 1.0015974440894568e-05, "loss": 0.0061, "step": 15000 }, { "epoch": 1.0, "eval_accuracy": 0.9955404685835996, "eval_loss": 0.021361960098147392, "eval_runtime": 198.8868, "eval_samples_per_second": 302.162, "eval_steps_per_second": 18.885, "step": 15024 } ], "logging_steps": 500, "max_steps": 30048, "num_train_epochs": 2, "save_steps": 500, "total_flos": 2.288794378322357e+16, "trial_name": null, "trial_params": null }