farmery committed on
Commit
cdfa075
·
verified ·
1 Parent(s): 511e30c

Training in progress, step 56, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3a249c8004081b9004e69983f978e119b5bf2063bc16bae03b87b6c29ca74a0
3
  size 645975704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbaf1ed57b17e15838d7ba427275c71e5239abd01fce75f2b8831fac26d5aba5
3
  size 645975704
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d155b28f5e7ed79a50ef3a32a655a17e7d9d4a06d622aba236d8bd6b5b6c0883
3
  size 328468404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33281a030601722e6e5833c52b1e422fe1559d066595f17c423831e4db7eafe0
3
  size 328468404
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9be25ff62256a472fa1f448e3d453c1943f4c5ebc354b49207e62f20236deb6a
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18d1e322d844019667efd77005c343afd5a843933d60a6d377f0cac5bb77cb19
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41f415cc44747810bca05c75d13f5253fa09a627c8a57f4da3e109dd0e1d508c
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6db846ff2ee419b9368c374e099a2c577a7103459c8f15233032b76636eccd21
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4dff8eb55605cbb8ac33421a282c2a3344fd33ccc979ba253b9e98ac353951c
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:346c719b46ba2add08db3614f24dfa501356aff6bef89984c3850b171d54a423
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16dedcb8131c0bf718453558c27ee6713605b2e55751923de748d81e923d0f55
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac6abe539c42e12e554dbb33ca0979eacce661411ac7da2a82a07086d592ab60
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aab4a9e4ef073c8d05cbd3393b8f5e2be7efebf8d31894ffbc118b030a35e18a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:882cbcdafabe936edc086ed06911378377212c19ac6648379eaecef2ba03d21c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.9405940594059405,
5
  "eval_steps": 7,
6
- "global_step": 49,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -183,6 +183,28 @@
183
  "eval_samples_per_second": 66.119,
184
  "eval_steps_per_second": 4.667,
185
  "step": 49
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
186
  }
187
  ],
188
  "logging_steps": 3,
@@ -202,7 +224,7 @@
202
  "attributes": {}
203
  }
204
  },
205
- "total_flos": 1.3934508787525222e+17,
206
  "train_batch_size": 4,
207
  "trial_name": null,
208
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.217821782178218,
5
  "eval_steps": 7,
6
+ "global_step": 56,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
183
  "eval_samples_per_second": 66.119,
184
  "eval_steps_per_second": 4.667,
185
  "step": 49
186
+ },
187
+ {
188
+ "epoch": 2.01980198019802,
189
+ "grad_norm": 1.8872629404067993,
190
+ "learning_rate": 3.141687721698363e-05,
191
+ "loss": 1.4865,
192
+ "step": 51
193
+ },
194
+ {
195
+ "epoch": 2.1386138613861387,
196
+ "grad_norm": 0.8172866106033325,
197
+ "learning_rate": 2.500000000000001e-05,
198
+ "loss": 0.9957,
199
+ "step": 54
200
+ },
201
+ {
202
+ "epoch": 2.217821782178218,
203
+ "eval_loss": 1.3781214952468872,
204
+ "eval_runtime": 1.286,
205
+ "eval_samples_per_second": 66.094,
206
+ "eval_steps_per_second": 4.665,
207
+ "step": 56
208
  }
209
  ],
210
  "logging_steps": 3,
 
224
  "attributes": {}
225
  }
226
  },
227
+ "total_flos": 1.5925152900028826e+17,
228
  "train_batch_size": 4,
229
  "trial_name": null,
230
  "trial_params": null