booksouls committed on
Commit
6669ae2
·
verified ·
1 Parent(s): bbfc4de

Training in progress, epoch 1, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c12d7f2593a757af810a868812a1d71436bdcae28efdf85ea7f38a4fc746ec5
3
  size 1625422896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6827d008d9d4aa1d33ebd5114f2e6aec21c34611adb57234406e55f04767d8d
3
  size 1625422896
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac6ec307772c725d237ce53ed00072c43daaa5b943c6ff8a9da9770286617faa
3
  size 3250751759
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32937b908f067c2992afcbd5006376f6501d018d1543873b1adbc0eb3af78b66
3
  size 3250751759
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a88b29d6e52643dde49d0cb58cc10992cdfe46f6b308a65f4ae40f4c3e286477
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9739f47ce3993debf7abf052444a7cacfe7a7344541e97f8d68b5bcccd87df17
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:688b62605b5df52f5fec25b0648081ab1c61e87d91d24d2c5606b1fd6ec87baf
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f703cd7922f54f41516d5ce900f74f70f626e6131121e3f10bc8556c6d3d8af4
3
  size 1064
last-checkpoint/tokenizer_config.json CHANGED
@@ -48,10 +48,17 @@
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
 
51
  "model_max_length": 1000000000000000019884624838656,
 
52
  "pad_token": "<pad>",
 
 
53
  "sep_token": "</s>",
 
54
  "tokenizer_class": "BartTokenizer",
55
  "trim_offsets": true,
 
 
56
  "unk_token": "<unk>"
57
  }
 
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
51
+ "max_length": 256,
52
  "model_max_length": 1000000000000000019884624838656,
53
+ "pad_to_multiple_of": null,
54
  "pad_token": "<pad>",
55
+ "pad_token_type_id": 0,
56
+ "padding_side": "right",
57
  "sep_token": "</s>",
58
+ "stride": 0,
59
  "tokenizer_class": "BartTokenizer",
60
  "trim_offsets": true,
61
+ "truncation_side": "right",
62
+ "truncation_strategy": "longest_first",
63
  "unk_token": "<unk>"
64
  }
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9896907216494846,
5
  "eval_steps": 500,
6
- "global_step": 63,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -27,6 +27,26 @@
27
  "eval_samples_per_second": 0.351,
28
  "eval_steps_per_second": 0.088,
29
  "step": 63
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  }
31
  ],
32
  "logging_steps": 500,
@@ -34,7 +54,7 @@
34
  "num_input_tokens_seen": 0,
35
  "num_train_epochs": 20,
36
  "save_steps": 500,
37
- "total_flos": 1.765106698420224e+16,
38
  "train_batch_size": 4,
39
  "trial_name": null,
40
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.9896907216494846,
5
  "eval_steps": 500,
6
+ "global_step": 126,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
27
  "eval_samples_per_second": 0.351,
28
  "eval_steps_per_second": 0.088,
29
  "step": 63
30
+ },
31
+ {
32
+ "epoch": 1.9896907216494846,
33
+ "grad_norm": 1.331000566482544,
34
+ "learning_rate": 9e-06,
35
+ "loss": 2.6117,
36
+ "step": 126
37
+ },
38
+ {
39
+ "epoch": 1.9896907216494846,
40
+ "eval_gen_len": 254.757744,
41
+ "eval_loss": 2.461825132369995,
42
+ "eval_rouge1": 0.378265,
43
+ "eval_rouge2": 0.077138,
44
+ "eval_rougeL": 0.182503,
45
+ "eval_rougeLsum": 0.351427,
46
+ "eval_runtime": 3653.2761,
47
+ "eval_samples_per_second": 0.345,
48
+ "eval_steps_per_second": 0.086,
49
+ "step": 126
50
  }
51
  ],
52
  "logging_steps": 500,
 
54
  "num_input_tokens_seen": 0,
55
  "num_train_epochs": 20,
56
  "save_steps": 500,
57
+ "total_flos": 3.530213396840448e+16,
58
  "train_batch_size": 4,
59
  "trial_name": null,
60
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:caad959ae301f6d09f2d4b89a83e21da46692e815b332784c72ea6ba5f60dc2b
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9345dd68c98da773799b72393992df8416b90fe1be028abc820aaf776d08511d
3
  size 5112