nttx committed on
Commit
9250f3e
·
verified ·
1 Parent(s): 24a7c9d

Training in progress, epoch 1, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1d8713e24e0a2f94a7fa3c1df73f52efbcf67457e75b20fae89d8ad45288815
3
  size 83945296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebe623c4f0421e7ade1f6e462e536afeb966e2f658717fd8883892f128e15a00
3
  size 83945296
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:146e018abda0d6337f700c3bcf2a2b283c676b153c2f613d377a7ff760740c6f
3
  size 43122580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb75492d6eb59ef1e49f1622c9665ff0f66f0a9f7c935ead5d03f6d081dae52
3
  size 43122580
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93886abc560ab3f8e7355c260a01e990e2bbd10433fe8df95b9f0f689e05abda
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4355423124dfcce7575820455724cb582682f7533e5e61cb41b391b7c0372bdf
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:493ce52bbbeb9b20008dd6d239fd04fb544278ea5f81325aad420ff05398af7b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:735fcde948207403fdbfb47bb37bfc58c52e261d01a785aeb293a35e042e5b40
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9973190348525469,
5
  "eval_steps": 24,
6
- "global_step": 93,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -179,12 +179,12 @@
179
  "should_evaluate": false,
180
  "should_log": false,
181
  "should_save": true,
182
- "should_training_stop": false
183
  },
184
  "attributes": {}
185
  }
186
  },
187
- "total_flos": 3.449437322792141e+16,
188
  "train_batch_size": 2,
189
  "trial_name": null,
190
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0080428954423593,
5
  "eval_steps": 24,
6
+ "global_step": 94,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
179
  "should_evaluate": false,
180
  "should_log": false,
181
  "should_save": true,
182
+ "should_training_stop": true
183
  },
184
  "attributes": {}
185
  }
186
  },
187
+ "total_flos": 3.4771807865143296e+16,
188
  "train_batch_size": 2,
189
  "trial_name": null,
190
  "trial_params": null