fcogidi committed on
Commit
c198480
·
verified ·
1 Parent(s): 25a7cab

Add files using upload-large-folder tool

Browse files
config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "JustinDu/BARTxiv",
3
+ "_num_labels": 3,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "gelu",
6
+ "add_final_layer_norm": false,
7
+ "architectures": [
8
+ "BartForConditionalGeneration"
9
+ ],
10
+ "attention_dropout": 0.0,
11
+ "bos_token_id": 0,
12
+ "classif_dropout": 0.0,
13
+ "classifier_dropout": 0.0,
14
+ "d_model": 1024,
15
+ "decoder_attention_heads": 16,
16
+ "decoder_ffn_dim": 4096,
17
+ "decoder_layerdrop": 0.0,
18
+ "decoder_layers": 12,
19
+ "decoder_start_token_id": 2,
20
+ "dropout": 0.1,
21
+ "early_stopping": null,
22
+ "encoder_attention_heads": 16,
23
+ "encoder_ffn_dim": 4096,
24
+ "encoder_layerdrop": 0.0,
25
+ "encoder_layers": 12,
26
+ "eos_token_id": 2,
27
+ "force_bos_token_to_be_generated": true,
28
+ "forced_eos_token_id": 2,
29
+ "gradient_checkpointing": false,
30
+ "id2label": {
31
+ "0": "LABEL_0",
32
+ "1": "LABEL_1",
33
+ "2": "LABEL_2"
34
+ },
35
+ "init_std": 0.02,
36
+ "is_encoder_decoder": true,
37
+ "label2id": {
38
+ "LABEL_0": 0,
39
+ "LABEL_1": 1,
40
+ "LABEL_2": 2
41
+ },
42
+ "length_penalty": null,
43
+ "max_length": null,
44
+ "max_position_embeddings": 1024,
45
+ "min_length": null,
46
+ "model_type": "bart",
47
+ "no_repeat_ngram_size": null,
48
+ "normalize_before": false,
49
+ "num_beams": null,
50
+ "num_hidden_layers": 12,
51
+ "output_past": true,
52
+ "pad_token_id": 1,
53
+ "prefix": " ",
54
+ "scale_embedding": false,
55
+ "task_specific_params": {
56
+ "summarization": {
57
+ "early_stopping": true,
58
+ "length_penalty": 2.0,
59
+ "max_length": 142,
60
+ "min_length": 56,
61
+ "no_repeat_ngram_size": 3,
62
+ "num_beams": 4
63
+ }
64
+ },
65
+ "transformers_version": "4.45.2",
66
+ "use_cache": true,
67
+ "vocab_size": 50264
68
+ }
generation_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "decoder_start_token_id": 2,
5
+ "early_stopping": true,
6
+ "eos_token_id": 2,
7
+ "forced_bos_token_id": 0,
8
+ "forced_eos_token_id": 2,
9
+ "length_penalty": 2.0,
10
+ "max_length": 142,
11
+ "min_length": 56,
12
+ "no_repeat_ngram_size": 3,
13
+ "num_beams": 4,
14
+ "pad_token_id": 1,
15
+ "transformers_version": "4.45.2"
16
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d636fdf0f14d7ce34a583e58dc2a42b5d94f0a2a8243959435afe7c82fe17eb6
3
+ size 1223014991
onnx/decoder_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eec152d1d1dcbca3899e3e94ade2e9f9e55bb3eeaf82aa35a3cd0a86764fb926
3
+ size 354044523
onnx/decoder_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab002e5d3e2bcbd58202509922ec7d572f66ba0bec6205dc75f2fe07cfd2b340
3
+ size 612053711
onnx/decoder_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26517a4a2ce702538d78e2a7e6f4d57d1959c2d4c1635a6ccb157ccf29b14488
3
+ size 307444525
onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66547d51aa5ec0e222d75e4fd4971e6dcb7e00bd4e9c2a42284d1f21796afb7a
3
+ size 1223529295
onnx/decoder_model_merged_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d653fd2b422ddc30235aeb864ac6fb397b091f960d3e30c225f5c0ab3ecad058
3
+ size 354573034
onnx/decoder_model_merged_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9cae81f695f33745f9774e8ed842dce6e908c690984de9ca966abf31d03eb96
3
+ size 1173627010
onnx/decoder_model_merged_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f156ffb515f3319c2a5402383bb6849a1f373c629889badc11756478b37cdd4e
3
+ size 308283106
onnx/decoder_model_merged_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d06e47e94810c8c51c2c6081182e124695c2c9e7d06e3e9c0e0d992681df0a6
3
+ size 370370989
onnx/decoder_model_merged_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0224d043852edd844bd88fdd710b017c78ae5b81ec0d3890e91fed64150489c
3
+ size 482992258
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f156ffb515f3319c2a5402383bb6849a1f373c629889badc11756478b37cdd4e
3
+ size 308283106
onnx/decoder_model_merged_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25d8daf08c701832d53f7e2098d9a4c32f8f1e4eb0065fee42e33b58c95a649d
3
+ size 308283170
onnx/decoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac0c7884dc32b089ffae9df6051af3bb4a3542780291b087a0a98048b65f432
3
+ size 369843351
onnx/decoder_model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:286edea1da1ebbe7c32427646f846dbb1dccb27b472af5ea8c683de0c1e88d82
3
+ size 248646674
onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26517a4a2ce702538d78e2a7e6f4d57d1959c2d4c1635a6ccb157ccf29b14488
3
+ size 307444525
onnx/decoder_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3451d171e538f5c312dce55e0edb4b6e48f05d4f0e13bde7fdbb0d27bf677c8e
3
+ size 307444589
onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f8369b5982ebf7ccbd229cb173253190a5650eeec901ed59e2c558d54bdb322
3
+ size 1122163060
onnx/decoder_with_past_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83bbcd71725f743d308aed3ee3bd69bb9519fb3ba5b3e5e658e6a1b6819675b2
3
+ size 339696368
onnx/decoder_with_past_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5954d070c41163d36eee4ed188af3d0fddac8d47d0526960794aa3c50a07d532
3
+ size 561551182
onnx/decoder_with_past_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4377fe16472435716866a68e84d083ed4fbe7ee830dadf8e877ea61b861b62a9
3
+ size 282031721
onnx/decoder_with_past_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61a9767fd790b28393362e4342f4e303762e1b83adbedcde98e43be2a7f69c99
3
+ size 353922524
onnx/decoder_with_past_model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a29432994d34c2faa0eea406f019bc5dd26b868cce097db3f1a835a7dbca7c
3
+ size 234320609
onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4377fe16472435716866a68e84d083ed4fbe7ee830dadf8e877ea61b861b62a9
3
+ size 282031721
onnx/decoder_with_past_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:060e401540d3291d58b71f92e304ce0aacc5788f6cbfc4982b300a0f69fa2e3a
3
+ size 282031772
onnx/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7c716283a9b176892a3efb9fe7121bd8f53aa355951042a7a7389de7c4f919b
3
+ size 814962649
onnx/encoder_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e73ee362d6c713ed7325d120bc6d5f1fd3a6a7c42ca5301a6ac269226e11e44c
3
+ size 295928874
onnx/encoder_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a580a5753b7da6e18004ebacd8f0e390021b40f67f4f75e6ed05da9fa6327d8f
3
+ size 407718530
onnx/encoder_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20afe59a40370911b495bbb48b8809d418cd50329bc7b8cb60fc7579090cb7e2
3
+ size 204598853
onnx/encoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:982c893726c343800a37096bb6550595c9dd17f76c28f94539dbb40bc842dc61
3
+ size 305365470
onnx/encoder_model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ca99bc9eaeedbd98b019fd385d4da39036463008059700d3c273c3bfd0ff9b5
3
+ size 190656929
onnx/encoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20afe59a40370911b495bbb48b8809d418cd50329bc7b8cb60fc7579090cb7e2
3
+ size 204598853
onnx/encoder_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9a451cf789fcdaa31b20705c7a292ad9f6f2498d798c5d0042e70426f47f06b
3
+ size 204598890
quantize_config.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "decoder_model": {
6
+ "op_types": [
7
+ "Softmax",
8
+ "Sqrt",
9
+ "Slice",
10
+ "Squeeze",
11
+ "Reshape",
12
+ "ReduceMean",
13
+ "Equal",
14
+ "Transpose",
15
+ "MatMul",
16
+ "Expand",
17
+ "Mul",
18
+ "ConstantOfShape",
19
+ "Pow",
20
+ "Less",
21
+ "Cast",
22
+ "Constant",
23
+ "Gather",
24
+ "Range",
25
+ "Where",
26
+ "Unsqueeze",
27
+ "Add",
28
+ "Concat",
29
+ "Shape",
30
+ "Div",
31
+ "Erf",
32
+ "Sub"
33
+ ],
34
+ "weight_type": "QInt8"
35
+ },
36
+ "encoder_model": {
37
+ "op_types": [
38
+ "Softmax",
39
+ "Sqrt",
40
+ "Reshape",
41
+ "ReduceMean",
42
+ "Equal",
43
+ "Transpose",
44
+ "MatMul",
45
+ "Expand",
46
+ "Mul",
47
+ "ConstantOfShape",
48
+ "Pow",
49
+ "Cast",
50
+ "Constant",
51
+ "Gather",
52
+ "Range",
53
+ "Where",
54
+ "Unsqueeze",
55
+ "Add",
56
+ "Concat",
57
+ "Shape",
58
+ "Div",
59
+ "Erf",
60
+ "Sub"
61
+ ],
62
+ "weight_type": "QInt8"
63
+ },
64
+ "decoder_model_merged": {
65
+ "op_types": [
66
+ "Softmax",
67
+ "Sqrt",
68
+ "Slice",
69
+ "Squeeze",
70
+ "Reshape",
71
+ "ReduceMean",
72
+ "Equal",
73
+ "Transpose",
74
+ "MatMul",
75
+ "Expand",
76
+ "Mul",
77
+ "ConstantOfShape",
78
+ "Pow",
79
+ "If",
80
+ "Less",
81
+ "Cast",
82
+ "Constant",
83
+ "Gather",
84
+ "Range",
85
+ "Where",
86
+ "Unsqueeze",
87
+ "Add",
88
+ "Concat",
89
+ "Shape",
90
+ "Div",
91
+ "Erf",
92
+ "Sub"
93
+ ],
94
+ "weight_type": "QInt8"
95
+ },
96
+ "decoder_with_past_model": {
97
+ "op_types": [
98
+ "Softmax",
99
+ "Sqrt",
100
+ "Reshape",
101
+ "ReduceMean",
102
+ "Equal",
103
+ "Transpose",
104
+ "MatMul",
105
+ "Expand",
106
+ "Mul",
107
+ "ConstantOfShape",
108
+ "Pow",
109
+ "Cast",
110
+ "Constant",
111
+ "Gather",
112
+ "Range",
113
+ "Where",
114
+ "Unsqueeze",
115
+ "Add",
116
+ "Concat",
117
+ "Shape",
118
+ "Div",
119
+ "Erf",
120
+ "Sub"
121
+ ],
122
+ "weight_type": "QInt8"
123
+ }
124
+ }
125
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<pad>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "</s>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "<unk>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "50264": {
37
+ "content": "<mask>",
38
+ "lstrip": true,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
+ },
45
+ "bos_token": "<s>",
46
+ "clean_up_tokenization_spaces": false,
47
+ "cls_token": "<s>",
48
+ "eos_token": "</s>",
49
+ "errors": "replace",
50
+ "mask_token": "<mask>",
51
+ "max_length": 1024,
52
+ "model_max_length": 1024,
53
+ "pad_to_multiple_of": null,
54
+ "pad_token": "<pad>",
55
+ "pad_token_type_id": 0,
56
+ "padding_side": "right",
57
+ "sep_token": "</s>",
58
+ "stride": 0,
59
+ "tokenizer_class": "BartTokenizer",
60
+ "trim_offsets": true,
61
+ "truncation_side": "right",
62
+ "truncation_strategy": "longest_first",
63
+ "unk_token": "<unk>"
64
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff