booksouls commited on
Commit
607c73e
·
verified ·
1 Parent(s): 1aecf15

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60afd84760802444ae58550d1896fc22db404e1b9ac0fead40f9c30c6e047045
3
  size 1625422896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8201f18535a29f04f89563cbe35511097be9afba3b01a1e701eb8781948a7e3
3
  size 1625422896
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4c7f41b4b79b88ffeb95e5eeb7ba629814254d8304f6658c89cbc116aa6db8f
3
  size 3250751759
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1abcae7ab0e3b9ac6edbd28550a312b42a9c47fdf907f89ba856c5bf3237c056
3
  size 3250751759
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de1bfc2d268cf7923378b9b2e0fe99c311d8b932bea99f486a350f50ffd9e101
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df39f38db37f6701456fe0a4817ff33122927ab7938b1eea653c5a371678f4e6
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:426dcb52d1996a4c433b718765d7d5084e38f73a5d455b904f91da402171e701
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83abdcd16b2b9b2191fd1f05501acfc5e3cc7f2d27d51fac1f0aca438433a1b0
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.9896907216494846,
5
  "eval_steps": 500,
6
- "global_step": 252,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -87,6 +87,26 @@
87
  "eval_samples_per_second": 0.36,
88
  "eval_steps_per_second": 0.09,
89
  "step": 252
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  }
91
  ],
92
  "logging_steps": 500,
@@ -94,7 +114,7 @@
94
  "num_input_tokens_seen": 0,
95
  "num_train_epochs": 20,
96
  "save_steps": 500,
97
- "total_flos": 7.060426793680896e+16,
98
  "train_batch_size": 4,
99
  "trial_name": null,
100
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.989690721649485,
5
  "eval_steps": 500,
6
+ "global_step": 315,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
87
  "eval_samples_per_second": 0.36,
88
  "eval_steps_per_second": 0.09,
89
  "step": 252
90
+ },
91
+ {
92
+ "epoch": 4.989690721649485,
93
+ "grad_norm": 0.8451509475708008,
94
+ "learning_rate": 7.500000000000001e-06,
95
+ "loss": 2.3836,
96
+ "step": 315
97
+ },
98
+ {
99
+ "epoch": 4.989690721649485,
100
+ "eval_gen_len": 254.285147,
101
+ "eval_loss": 2.3810665607452393,
102
+ "eval_rouge1": 0.382543,
103
+ "eval_rouge2": 0.079173,
104
+ "eval_rougeL": 0.183712,
105
+ "eval_rougeLsum": 0.355298,
106
+ "eval_runtime": 3613.6748,
107
+ "eval_samples_per_second": 0.348,
108
+ "eval_steps_per_second": 0.087,
109
+ "step": 315
110
  }
111
  ],
112
  "logging_steps": 500,
 
114
  "num_input_tokens_seen": 0,
115
  "num_train_epochs": 20,
116
  "save_steps": 500,
117
+ "total_flos": 8.82553349210112e+16,
118
  "train_batch_size": 4,
119
  "trial_name": null,
120
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:118bb6421b373e0e03ecd8aab7a5860a2b18c80d88abafa457126607b17fd56f
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f1906cfa0ad9e14e9f7f606dee91b794900b0ec7b1452c25901d0c904a02a7b
3
  size 5112