Training in progress, step 789, checkpoint

Browse files

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +45 -3

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1d209977df9813fed44fad624e5fb58dc1e5b15c5b51940ed1468e7c3dfe5fd9
 size 100198584

 version https://git-lfs.github.com/spec/v1
+oid sha256:31b0837275cc5f11270651e4afa09e46d066ac962dab68f2dc813068f170d69a
 size 100198584

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a853076cce04170a9efa4aba119013888999f2ac0422fb5d16b39458831a719
 size 50675604

 version https://git-lfs.github.com/spec/v1
+oid sha256:07a002c9cb506fad059bebbe67c0737c9f684d39d8a96d697d7f947c812a25b3
 size 50675604

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ca9fb85c447c86084528e309b6c6989260de379c269ae99f82548ef6b07c4e0
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:4d054cb5b5973f365f853a3e5809ff93e1f3146a44706d0ea9814bf12ba99652
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8592592592592593,
   "eval_steps": 500,
-  "global_step": 783,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5488,6 +5488,48 @@
       "learning_rate": 3.1565967940813812e-06,
       "loss": 1.0938,
       "step": 783
     }
   ],
   "logging_steps": 1,
@@ -5507,7 +5549,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 8.117704792212849e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.8658436213991769,
   "eval_steps": 500,
+  "global_step": 789,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 3.1565967940813812e-06,
       "loss": 1.0938,
       "step": 783
+    },
+    {
+      "epoch": 0.8603566529492456,
+      "grad_norm": 0.12630558013916016,
+      "learning_rate": 3.1319358816276206e-06,
+      "loss": 1.1672,
+      "step": 784
+    },
+    {
+      "epoch": 0.8614540466392319,
+      "grad_norm": 0.14046333730220795,
+      "learning_rate": 3.1072749691738595e-06,
+      "loss": 1.1078,
+      "step": 785
+    },
+    {
+      "epoch": 0.8625514403292182,
+      "grad_norm": 0.13367818295955658,
+      "learning_rate": 3.0826140567200992e-06,
+      "loss": 1.1097,
+      "step": 786
+    },
+    {
+      "epoch": 0.8636488340192043,
+      "grad_norm": 0.14946097135543823,
+      "learning_rate": 3.057953144266338e-06,
+      "loss": 1.0131,
+      "step": 787
+    },
+    {
+      "epoch": 0.8647462277091906,
+      "grad_norm": 0.1397130787372589,
+      "learning_rate": 3.0332922318125775e-06,
+      "loss": 1.1225,
+      "step": 788
+    },
+    {
+      "epoch": 0.8658436213991769,
+      "grad_norm": 0.13838127255439758,
+      "learning_rate": 3.0086313193588164e-06,
+      "loss": 1.0598,
+      "step": 789
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 8.180270209825137e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null