Training in progress, step 500
Browse files
- README.md +7 -6
- config.json +2 -2
- generation_config.json +1 -1
- model.safetensors +2 -2
- runs/Dec10_19-58-54_iit-p/events.out.tfevents.1733841294.iit-p.20039.1 +3 -0
- tokenizer_config.json +1 -1
- training_args.bin +2 -2
README.md
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
---
|
|
|
2 |
license: apache-2.0
|
3 |
base_model: google/flan-t5-base
|
4 |
tags:
|
@@ -50,7 +51,7 @@ The following hyperparameters were used during training:
|
|
50 |
- train_batch_size: 4
|
51 |
- eval_batch_size: 4
|
52 |
- seed: 42
|
53 |
-
- optimizer:
|
54 |
- lr_scheduler_type: linear
|
55 |
- num_epochs: 2
|
56 |
|
@@ -58,13 +59,13 @@ The following hyperparameters were used during training:
|
|
58 |
|
59 |
| Training Loss | Epoch | Step | Validation Loss | Rouge | Bleu1 | Bleu2 | Bleu3 | Bleu4 | Meteor | Bertscore Precision | Bertscore Recall | Bertscore F1 | Gen Len |
|
60 |
|:-------------:|:-----:|:----:|:---------------:|:-------------------------------------------------------:|:-----:|:-----:|:-----:|:-----:|:------:|:-------------------:|:----------------:|:------------:|:-------:|
|
61 |
-
| 1.
|
62 |
| 0.0 | 2.0 | 756 | nan | {'rouge1': 0, 'rouge2': 0, 'rougeL': 0, 'rougeLsum': 0} | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
|
63 |
|
64 |
|
65 |
### Framework versions
|
66 |
|
67 |
-
- Transformers 4.
|
68 |
-
- Pytorch 2.
|
69 |
-
- Datasets
|
70 |
-
- Tokenizers 0.
|
|
|
1 |
---
|
2 |
+
library_name: transformers
|
3 |
license: apache-2.0
|
4 |
base_model: google/flan-t5-base
|
5 |
tags:
|
|
|
51 |
- train_batch_size: 4
|
52 |
- eval_batch_size: 4
|
53 |
- seed: 42
|
54 |
+
- optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
55 |
- lr_scheduler_type: linear
|
56 |
- num_epochs: 2
|
57 |
|
|
|
59 |
|
60 |
| Training Loss | Epoch | Step | Validation Loss | Rouge | Bleu1 | Bleu2 | Bleu3 | Bleu4 | Meteor | Bertscore Precision | Bertscore Recall | Bertscore F1 | Gen Len |
|
61 |
|:-------------:|:-----:|:----:|:---------------:|:-------------------------------------------------------:|:-----:|:-----:|:-----:|:-----:|:------:|:-------------------:|:----------------:|:------------:|:-------:|
|
62 |
+
| 1.83 | 1.0 | 378 | nan | {'rouge1': 0, 'rouge2': 0, 'rougeL': 0, 'rougeLsum': 0} | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
|
63 |
| 0.0 | 2.0 | 756 | nan | {'rouge1': 0, 'rouge2': 0, 'rougeL': 0, 'rougeLsum': 0} | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
|
64 |
|
65 |
|
66 |
### Framework versions
|
67 |
|
68 |
+
- Transformers 4.46.3
|
69 |
+
- Pytorch 2.4.1+cu121
|
70 |
+
- Datasets 2.20.0
|
71 |
+
- Tokenizers 0.20.3
|
config.json
CHANGED
@@ -55,8 +55,8 @@
|
|
55 |
}
|
56 |
},
|
57 |
"tie_word_embeddings": false,
|
58 |
-
"torch_dtype": "
|
59 |
-
"transformers_version": "4.
|
60 |
"use_cache": true,
|
61 |
"vocab_size": 32128
|
62 |
}
|
|
|
55 |
}
|
56 |
},
|
57 |
"tie_word_embeddings": false,
|
58 |
+
"torch_dtype": "float32",
|
59 |
+
"transformers_version": "4.46.3",
|
60 |
"use_cache": true,
|
61 |
"vocab_size": 32128
|
62 |
}
|
generation_config.json
CHANGED
@@ -2,5 +2,5 @@
|
|
2 |
"decoder_start_token_id": 0,
|
3 |
"eos_token_id": 1,
|
4 |
"pad_token_id": 0,
|
5 |
-
"transformers_version": "4.
|
6 |
}
|
|
|
2 |
"decoder_start_token_id": 0,
|
3 |
"eos_token_id": 1,
|
4 |
"pad_token_id": 0,
|
5 |
+
"transformers_version": "4.46.3"
|
6 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b19eda28178de2a24e5ef2b6b60446b6ee080dd17443144ca927fca8689e85e0
|
3 |
+
size 990345064
|
runs/Dec10_19-58-54_iit-p/events.out.tfevents.1733841294.iit-p.20039.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3708ec3d8a74acec4c939e16a98985974f536148ee386c47c8c2f22e2c1cb983
|
3 |
+
size 835
|
tokenizer_config.json
CHANGED
@@ -927,7 +927,7 @@
|
|
927 |
"<extra_id_98>",
|
928 |
"<extra_id_99>"
|
929 |
],
|
930 |
-
"clean_up_tokenization_spaces":
|
931 |
"eos_token": "</s>",
|
932 |
"extra_ids": 100,
|
933 |
"model_max_length": 512,
|
|
|
927 |
"<extra_id_98>",
|
928 |
"<extra_id_99>"
|
929 |
],
|
930 |
+
"clean_up_tokenization_spaces": false,
|
931 |
"eos_token": "</s>",
|
932 |
"extra_ids": 100,
|
933 |
"model_max_length": 512,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d173a1eff11e3d6f77610033144a9d9a1fa70b4e0b608c85e629ec993c295640
|
3 |
+
size 5368
|