zera09 committed on
Commit
01fe497
·
verified ·
1 Parent(s): 2be060b

Training in progress, step 500

Browse files
README.md CHANGED
@@ -1,4 +1,5 @@
1
  ---
 
2
  license: apache-2.0
3
  base_model: google/flan-t5-base
4
  tags:
@@ -50,7 +51,7 @@ The following hyperparameters were used during training:
50
  - train_batch_size: 4
51
  - eval_batch_size: 4
52
  - seed: 42
53
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
54
  - lr_scheduler_type: linear
55
  - num_epochs: 2
56
 
@@ -58,13 +59,13 @@ The following hyperparameters were used during training:
58
 
59
  | Training Loss | Epoch | Step | Validation Loss | Rouge | Bleu1 | Bleu2 | Bleu3 | Bleu4 | Meteor | Bertscore Precision | Bertscore Recall | Bertscore F1 | Gen Len |
60
  |:-------------:|:-----:|:----:|:---------------:|:-------------------------------------------------------:|:-----:|:-----:|:-----:|:-----:|:------:|:-------------------:|:----------------:|:------------:|:-------:|
61
- | 1.9328 | 1.0 | 378 | nan | {'rouge1': 0, 'rouge2': 0, 'rougeL': 0, 'rougeLsum': 0} | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
62
  | 0.0 | 2.0 | 756 | nan | {'rouge1': 0, 'rouge2': 0, 'rougeL': 0, 'rougeLsum': 0} | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
63
 
64
 
65
  ### Framework versions
66
 
67
- - Transformers 4.40.0
68
- - Pytorch 2.2.0+cu118
69
- - Datasets 3.0.0
70
- - Tokenizers 0.19.1
 
1
  ---
2
+ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/flan-t5-base
5
  tags:
 
51
  - train_batch_size: 4
52
  - eval_batch_size: 4
53
  - seed: 42
54
+ - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
55
  - lr_scheduler_type: linear
56
  - num_epochs: 2
57
 
 
59
 
60
  | Training Loss | Epoch | Step | Validation Loss | Rouge | Bleu1 | Bleu2 | Bleu3 | Bleu4 | Meteor | Bertscore Precision | Bertscore Recall | Bertscore F1 | Gen Len |
61
  |:-------------:|:-----:|:----:|:---------------:|:-------------------------------------------------------:|:-----:|:-----:|:-----:|:-----:|:------:|:-------------------:|:----------------:|:------------:|:-------:|
62
+ | 1.83 | 1.0 | 378 | nan | {'rouge1': 0, 'rouge2': 0, 'rougeL': 0, 'rougeLsum': 0} | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
63
  | 0.0 | 2.0 | 756 | nan | {'rouge1': 0, 'rouge2': 0, 'rougeL': 0, 'rougeLsum': 0} | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
64
 
65
 
66
  ### Framework versions
67
 
68
+ - Transformers 4.46.3
69
+ - Pytorch 2.4.1+cu121
70
+ - Datasets 2.20.0
71
+ - Tokenizers 0.20.3
config.json CHANGED
@@ -55,8 +55,8 @@
55
  }
56
  },
57
  "tie_word_embeddings": false,
58
- "torch_dtype": "float16",
59
- "transformers_version": "4.40.0",
60
  "use_cache": true,
61
  "vocab_size": 32128
62
  }
 
55
  }
56
  },
57
  "tie_word_embeddings": false,
58
+ "torch_dtype": "float32",
59
+ "transformers_version": "4.46.3",
60
  "use_cache": true,
61
  "vocab_size": 32128
62
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "decoder_start_token_id": 0,
3
  "eos_token_id": 1,
4
  "pad_token_id": 0,
5
- "transformers_version": "4.40.0"
6
  }
 
2
  "decoder_start_token_id": 0,
3
  "eos_token_id": 1,
4
  "pad_token_id": 0,
5
+ "transformers_version": "4.46.3"
6
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd66f721d95e424eec3035589db15a9833aab2daa912e738569d42b3321d4461
3
- size 570686880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b19eda28178de2a24e5ef2b6b60446b6ee080dd17443144ca927fca8689e85e0
3
+ size 990345064
runs/Dec10_19-58-54_iit-p/events.out.tfevents.1733841294.iit-p.20039.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3708ec3d8a74acec4c939e16a98985974f536148ee386c47c8c2f22e2c1cb983
3
+ size 835
tokenizer_config.json CHANGED
@@ -927,7 +927,7 @@
927
  "<extra_id_98>",
928
  "<extra_id_99>"
929
  ],
930
- "clean_up_tokenization_spaces": true,
931
  "eos_token": "</s>",
932
  "extra_ids": 100,
933
  "model_max_length": 512,
 
927
  "<extra_id_98>",
928
  "<extra_id_99>"
929
  ],
930
+ "clean_up_tokenization_spaces": false,
931
  "eos_token": "</s>",
932
  "extra_ids": 100,
933
  "model_max_length": 512,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:323eca41da22235eaa9fb7fc694fc036b8e22f209c4485413fbba627f4ec6ff4
3
- size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d173a1eff11e3d6f77610033144a9d9a1fa70b4e0b608c85e629ec993c295640
3
+ size 5368