k4black commited on
Commit
8f72d1c
1 Parent(s): fad991b

Training in progress, step 12500

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc1f7c55c8f8c0d40f4dd00c60e2187aa0a8aa139514c1b33817125b3fbdcc6f
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e65cf37678993fe3f18088679da537fa01d85da9d152deaa0f44810aeb323ce0
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01450b005a0c07927774367baf2df85370addf1ae358bb986bedd6b750669cba
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48589b74cc0dd9aca7fabf6af7fbebeded924f02e75c01d4b186662817a3fc93
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67e94701ea26738e0c3e8924fcfb0f3afba7ae6c7118b9610924cd0ffeaf567c
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f177c85bdffc6c35bccc14f5fae42f9fa475b3565690a355cfcb00cbcbaca2b
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3947d449c9f4d1e0c9eb97a6f1405b24f0cb52a87ee412118f0b3e92dad7ac68
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e0411b19d02a684abea10135971df618e10478843b4b273e508440d8c839ca4
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c17de809b895c3bd271032fe901af5531aab205f74c2d6adac3868824296045a
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:772a71df90a23cf1d15b47f710ae6706f64dace0a85b2ffc76c96757f3ee319e
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.7575966715812683,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-12000",
4
- "epoch": 3.84,
5
- "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -462,11 +462,30 @@
462
  "eval_samples_per_second": 82.46,
463
  "eval_steps_per_second": 2.597,
464
  "step": 12000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
465
  }
466
  ],
467
  "max_steps": 31250,
468
  "num_train_epochs": 10,
469
- "total_flos": 4.334845641621504e+16,
470
  "trial_name": null,
471
  "trial_params": null
472
  }
 
1
  {
2
  "best_metric": 0.7575966715812683,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-12000",
4
+ "epoch": 4.0,
5
+ "global_step": 12500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
462
  "eval_samples_per_second": 82.46,
463
  "eval_steps_per_second": 2.597,
464
  "step": 12000
465
+ },
466
+ {
467
+ "epoch": 4.0,
468
+ "learning_rate": 6.317916933337825e-05,
469
+ "loss": 0.4723,
470
+ "step": 12500
471
+ },
472
+ {
473
+ "epoch": 4.0,
474
+ "eval_bleu": 0.13724470187361304,
475
+ "eval_exact_match": 0.1605,
476
+ "eval_loss": 0.7616467475891113,
477
+ "eval_rouge1": 0.5756965634335589,
478
+ "eval_rouge2": 0.4100511997403594,
479
+ "eval_rougeL": 0.559460669435164,
480
+ "eval_runtime": 23.0958,
481
+ "eval_samples_per_second": 86.596,
482
+ "eval_steps_per_second": 2.728,
483
+ "step": 12500
484
  }
485
  ],
486
  "max_steps": 31250,
487
  "num_train_epochs": 10,
488
+ "total_flos": 4.515048174963917e+16,
489
  "trial_name": null,
490
  "trial_params": null
491
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01450b005a0c07927774367baf2df85370addf1ae358bb986bedd6b750669cba
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48589b74cc0dd9aca7fabf6af7fbebeded924f02e75c01d4b186662817a3fc93
3
  size 242019067