Training in progress, step 362, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8095535d287a5363ea56d6e1a990b793651e0842f91f0e62b2cde7ad796e3c97
 size 100198584

 version https://git-lfs.github.com/spec/v1
+oid sha256:d8c0d97e659bc4443647ca4bb5214a3fd172de8cb97b76926060afaa1ce02b68
 size 100198584

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:165bc7411b625ca298d13e3c88f8745dc09872293291b602919d21265ad0ba3b
 size 50675604

 version https://git-lfs.github.com/spec/v1
+oid sha256:86c43689ac0cec244a4d403549cfe7f198290515d01fcc3fc5c91fcfe4ca6318
 size 50675604

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:84cd725a97db95f8de6db3eaffde1002a056efc831c1635a52e2a74854a937e4
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:ddd284836fe01fb8da0367ba9e958c4168cceec88a256cdb9badb53073d3392b
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.5274404164003287,
   "eval_steps": 500,
-  "global_step": 361,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2534,6 +2534,13 @@
       "learning_rate": 1.1061643835616441e-05,
       "loss": 1.1788,
       "step": 361
     }
   ],
   "logging_steps": 1,
@@ -2553,7 +2560,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 4.0655166024812544e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.5289014701853711,
   "eval_steps": 500,
+  "global_step": 362,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.1061643835616441e-05,
       "loss": 1.1788,
       "step": 361
+    },
+    {
+      "epoch": 0.5289014701853711,
+      "grad_norm": 0.12005290389060974,
+      "learning_rate": 1.1027397260273974e-05,
+      "loss": 1.1608,
+      "step": 362
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 4.077009720080179e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null