farmery commited on
Commit
3a4a391
·
verified ·
1 Parent(s): fbe37c7

Training in progress, step 63, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbaf1ed57b17e15838d7ba427275c71e5239abd01fce75f2b8831fac26d5aba5
3
  size 645975704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e784acdeea8251a6336500366d312e683bd14e3b97f10fae082fa3d6941ae7c
3
  size 645975704
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33281a030601722e6e5833c52b1e422fe1559d066595f17c423831e4db7eafe0
3
  size 328468404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec526be729fc00766aa465a00eb2bf0692f28ce23edb3bf18d27f8d70b8a5d6c
3
  size 328468404
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d1e322d844019667efd77005c343afd5a843933d60a6d377f0cac5bb77cb19
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4021ac42541c732a9edf05da0035fae77d4a41abb574781ede4fe889417988ba
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6db846ff2ee419b9368c374e099a2c577a7103459c8f15233032b76636eccd21
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41670b12d55b8b5e00e1702187eaf19a951a106909295e3bdb88a154dad660d3
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:346c719b46ba2add08db3614f24dfa501356aff6bef89984c3850b171d54a423
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:357fa8adc33d4c6287c5a582578b54604c4e2ff77e822b43c331fe6a4113b76a
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac6abe539c42e12e554dbb33ca0979eacce661411ac7da2a82a07086d592ab60
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1523cad77aebbc5c93094a08e19a912cbf5e034a61c053725fea450338236ccb
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:882cbcdafabe936edc086ed06911378377212c19ac6648379eaecef2ba03d21c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e56d433c056f847cd62894fdc7d2cfac435f2db58e37ae7dede3f4334c0f5d0
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.217821782178218,
5
  "eval_steps": 7,
6
- "global_step": 56,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -205,6 +205,35 @@
205
  "eval_samples_per_second": 66.094,
206
  "eval_steps_per_second": 4.665,
207
  "step": 56
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
208
  }
209
  ],
210
  "logging_steps": 3,
@@ -224,7 +253,7 @@
224
  "attributes": {}
225
  }
226
  },
227
- "total_flos": 1.5925152900028826e+17,
228
  "train_batch_size": 4,
229
  "trial_name": null,
230
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.495049504950495,
5
  "eval_steps": 7,
6
+ "global_step": 63,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
205
  "eval_samples_per_second": 66.094,
206
  "eval_steps_per_second": 4.665,
207
  "step": 56
208
+ },
209
+ {
210
+ "epoch": 2.2574257425742577,
211
+ "grad_norm": 0.8602892160415649,
212
+ "learning_rate": 1.9092050688969738e-05,
213
+ "loss": 1.0049,
214
+ "step": 57
215
+ },
216
+ {
217
+ "epoch": 2.376237623762376,
218
+ "grad_norm": 0.8723423480987549,
219
+ "learning_rate": 1.3813298094746491e-05,
220
+ "loss": 1.0431,
221
+ "step": 60
222
+ },
223
+ {
224
+ "epoch": 2.495049504950495,
225
+ "grad_norm": 0.8783928155899048,
226
+ "learning_rate": 9.271202397483215e-06,
227
+ "loss": 0.9437,
228
+ "step": 63
229
+ },
230
+ {
231
+ "epoch": 2.495049504950495,
232
+ "eval_loss": 1.3786593675613403,
233
+ "eval_runtime": 1.3013,
234
+ "eval_samples_per_second": 65.322,
235
+ "eval_steps_per_second": 4.611,
236
+ "step": 63
237
  }
238
  ],
239
  "logging_steps": 3,
 
253
  "attributes": {}
254
  }
255
  },
256
+ "total_flos": 1.791579701253243e+17,
257
  "train_batch_size": 4,
258
  "trial_name": null,
259
  "trial_params": null