farmery commited on
Commit
ba79dcd
·
verified ·
1 Parent(s): 5f67cd5

Training in progress, step 49, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be04c9972e630958da8e44f9e4c9f9dcc16a03ca8ed2f4a5769d950bd0776ae2
3
  size 645975704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3a249c8004081b9004e69983f978e119b5bf2063bc16bae03b87b6c29ca74a0
3
  size 645975704
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b84d2d470a3f640e4b2cc4ce5ce8e6839289bdc697bdd545f7d7c8dd8c51b39
3
  size 328468404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d155b28f5e7ed79a50ef3a32a655a17e7d9d4a06d622aba236d8bd6b5b6c0883
3
  size 328468404
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abd2a2f2b84ec4af4de6e78c117101bf220fbb0d23f8d3186fde1f407aca376f
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9be25ff62256a472fa1f448e3d453c1943f4c5ebc354b49207e62f20236deb6a
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd5de8cc5f988a2c3a2846ee47dd1b1c807c4b36aee9e6556e2dd8a5d0ef776a
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41f415cc44747810bca05c75d13f5253fa09a627c8a57f4da3e109dd0e1d508c
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3a3a3147e9469653998f2b1fc733e316bbebf9c0ef7c13d269390e72efd2c6b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4dff8eb55605cbb8ac33421a282c2a3344fd33ccc979ba253b9e98ac353951c
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcb24ecc1303aadd1770afee5c5d48c535ac4827ae4531643a669c0d145e5db0
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16dedcb8131c0bf718453558c27ee6713605b2e55751923de748d81e923d0f55
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fabed08622e08b27f1841ea221cb1eb063940b7a5bf0e62bf1a780665944540
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab4a9e4ef073c8d05cbd3393b8f5e2be7efebf8d31894ffbc118b030a35e18a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.6633663366336635,
5
  "eval_steps": 7,
6
- "global_step": 42,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -161,6 +161,28 @@
161
  "eval_samples_per_second": 65.965,
162
  "eval_steps_per_second": 4.656,
163
  "step": 42
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
164
  }
165
  ],
166
  "logging_steps": 3,
@@ -180,7 +202,7 @@
180
  "attributes": {}
181
  }
182
  },
183
- "total_flos": 1.194386467502162e+17,
184
  "train_batch_size": 4,
185
  "trial_name": null,
186
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.9405940594059405,
5
  "eval_steps": 7,
6
+ "global_step": 49,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
161
  "eval_samples_per_second": 65.965,
162
  "eval_steps_per_second": 4.656,
163
  "step": 42
164
+ },
165
+ {
166
+ "epoch": 1.7821782178217822,
167
+ "grad_norm": 0.8776001930236816,
168
+ "learning_rate": 4.5247197834790876e-05,
169
+ "loss": 1.1555,
170
+ "step": 45
171
+ },
172
+ {
173
+ "epoch": 1.900990099009901,
174
+ "grad_norm": 0.8503000140190125,
175
+ "learning_rate": 3.821205322452863e-05,
176
+ "loss": 1.2638,
177
+ "step": 48
178
+ },
179
+ {
180
+ "epoch": 1.9405940594059405,
181
+ "eval_loss": 1.384788155555725,
182
+ "eval_runtime": 1.2856,
183
+ "eval_samples_per_second": 66.119,
184
+ "eval_steps_per_second": 4.667,
185
+ "step": 49
186
  }
187
  ],
188
  "logging_steps": 3,
 
202
  "attributes": {}
203
  }
204
  },
205
+ "total_flos": 1.3934508787525222e+17,
206
  "train_batch_size": 4,
207
  "trial_name": null,
208
  "trial_params": null