k4black committed on
Commit
24c72f3
1 Parent(s): 5e224e3

Training in progress, step 16000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b67a585ad731edfd3190139c2048716d1ef0cd5c4e23c5d039753733beb85292
3
  size 1135685
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a963e17d63c5311d4177c813a94a2aef757d599b9e54238d21dc7910cea8d38
3
  size 1135685
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:593e18bc3c456f313a1af17bb6a97030aabe3dfbde4c59f3e4ae0a040049cb77
3
  size 307910149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ffb6cb62074cb556e4605433d13ffd9119d9af77cd667c007bfe11a29bc9c8a
3
  size 307910149
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82960f07cae3e568bb93b45888fd2b6a63f1fd9b319bf6f6dda39789df0fc6a6
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e64fd0c22b4f678e997dcb527fccba5e7f7f0718a533bfc0e960d81e6c062ad4
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a9379299cb036bee8563adb6a6941350bd1a2187d737827bca0ce7b889d9885
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3c7bfd871284a6faa92f94aee9c5ea71a9bdcdd13ee2b820e7d8b41939b332d
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 1.7180376052856445,
3
- "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/google-flan-t5-small-e-snli-generation-explanation_use_prompt_label-selected-b64/checkpoint-12000",
4
- "epoch": 1.6309412861136998,
5
- "global_step": 14000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -160,11 +160,33 @@
160
  "eval_samples_per_second": 60.37,
161
  "eval_steps_per_second": 0.945,
162
  "step": 14000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
163
  }
164
  ],
165
  "max_steps": 85840,
166
  "num_train_epochs": 10,
167
- "total_flos": 2.1150083559346176e+16,
168
  "trial_name": null,
169
  "trial_params": null
170
  }
 
1
  {
2
+ "best_metric": 1.692925214767456,
3
+ "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/google-flan-t5-small-e-snli-generation-explanation_use_prompt_label-selected-b64/checkpoint-16000",
4
+ "epoch": 1.8639328984156571,
5
+ "global_step": 16000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
160
  "eval_samples_per_second": 60.37,
161
  "eval_steps_per_second": 0.945,
162
  "step": 14000
163
+ },
164
+ {
165
+ "epoch": 1.86,
166
+ "learning_rate": 0.0008564281159562467,
167
+ "loss": 1.2367,
168
+ "step": 16000
169
+ },
170
+ {
171
+ "epoch": 1.86,
172
+ "eval_accuracy": null,
173
+ "eval_bertscore_f1": 0.9367065161642227,
174
+ "eval_bleu": 0.4269002075734853,
175
+ "eval_f1": null,
176
+ "eval_loss": 1.692925214767456,
177
+ "eval_rouge1": 0.6232036846315818,
178
+ "eval_rouge2": 0.4180000668098338,
179
+ "eval_rougeL": 0.5680648753273818,
180
+ "eval_rougeLsum": 0.570113733783007,
181
+ "eval_runtime": 165.5988,
182
+ "eval_samples_per_second": 59.433,
183
+ "eval_steps_per_second": 0.93,
184
+ "step": 16000
185
  }
186
  ],
187
  "max_steps": 85840,
188
  "num_train_epochs": 10,
189
+ "total_flos": 2.417528886921216e+16,
190
  "trial_name": null,
191
  "trial_params": null
192
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:593e18bc3c456f313a1af17bb6a97030aabe3dfbde4c59f3e4ae0a040049cb77
3
  size 307910149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ffb6cb62074cb556e4605433d13ffd9119d9af77cd667c007bfe11a29bc9c8a
3
  size 307910149