FooJiaYin committed on
Commit
c0ff440
1 Parent(s): e140e83

Step 30500

Browse files
Files changed (4) hide show
  1. optimizer.pt +2 -2
  2. pytorch_model.bin +1 -1
  3. scheduler.pt +1 -1
  4. trainer_state.json +21 -3
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc0b6f9ede25848b4440e3a3b75ae481910266027a76a6f6d4ccfceaf2cbcbc4
3
- size 114425856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b76cb150609c83406500033daf1401c3c869b1bbd2c657924d34b64ef4f18a0a
3
+ size 124020431
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26aa43a71ef20ec5338c4fdde9142dfd63ea5b4748f0718dc9c1adadc2356b50
3
  size 62015575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8b719ac98622aa5081e4588d32365a424b51442f0dc89d51634ec657d9dda47
3
  size 62015575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55379860d5993322de7e50bc90fdcc01f8bd3b79ab77cc4a24298562169a1da1
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dde91353e8e873fc6f08fb03c6a05a606a2fb1188c39a2cef816921a1d0a448
3
  size 623
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 9.122365523749608,
5
- "global_step": 29000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -354,11 +354,29 @@
354
  "learning_rate": 1.631645171437559e-05,
355
  "loss": 0.0455,
356
  "step": 29000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
357
  }
358
  ],
359
  "max_steps": 63580,
360
  "num_train_epochs": 20,
361
- "total_flos": 1.020599417048832e+16,
362
  "trial_name": null,
363
  "trial_params": null
364
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 9.594212016357345,
5
+ "global_step": 30500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
354
  "learning_rate": 1.631645171437559e-05,
355
  "loss": 0.0455,
356
  "step": 29000
357
+ },
358
+ {
359
+ "epoch": 9.28,
360
+ "learning_rate": 1.608052846807172e-05,
361
+ "loss": 0.0437,
362
+ "step": 29500
363
+ },
364
+ {
365
+ "epoch": 9.44,
366
+ "learning_rate": 1.5844605221767853e-05,
367
+ "loss": 0.0667,
368
+ "step": 30000
369
+ },
370
+ {
371
+ "epoch": 9.59,
372
+ "learning_rate": 1.5608681975463986e-05,
373
+ "loss": 0.0472,
374
+ "step": 30500
375
  }
376
  ],
377
  "max_steps": 63580,
378
  "num_train_epochs": 20,
379
+ "total_flos": 1.073395869196032e+16,
380
  "trial_name": null,
381
  "trial_params": null
382
  }