ljhskyso committed on
Commit
cedf954
·
unverified ·
1 Parent(s): 8fdc800

quantized v1.5 model

Browse files
.gitignore ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ # macOS
2
+ .DS_Store
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/root/.cache/torch/sentence_transformers/BAAI_bge-base-en/",
3
  "architectures": [
4
  "BertModel"
5
  ],
@@ -24,8 +24,7 @@
24
  "num_hidden_layers": 12,
25
  "pad_token_id": 0,
26
  "position_embedding_type": "absolute",
27
- "torch_dtype": "float32",
28
- "transformers_version": "4.30.0",
29
  "type_vocab_size": 2,
30
  "use_cache": true,
31
  "vocab_size": 30522
 
1
  {
2
+ "_name_or_path": "onnx-v1.5",
3
  "architectures": [
4
  "BertModel"
5
  ],
 
24
  "num_hidden_layers": 12,
25
  "pad_token_id": 0,
26
  "position_embedding_type": "absolute",
27
+ "transformers_version": "4.33.0",
 
28
  "type_vocab_size": 2,
29
  "use_cache": true,
30
  "vocab_size": 30522
onnx ADDED
@@ -0,0 +1 @@
 
 
1
+ onnx-v1.5
onnx-v1.5/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bc579acdba21c253c62a9bf866891355a63ffa3442b52c8a37d75b2ccb91848
3
+ size 435811539
onnx-v1.5/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22d996808c4539936ecc55be24dc3ecd8c36de1ebfcc461325f5cb4d947f7483
3
+ size 109706513
{onnx → onnx-v1.5}/ort_config.json RENAMED
File without changes
{onnx → onnx-v1}/model.onnx RENAMED
File without changes
{onnx → onnx-v1}/model_quantized.onnx RENAMED
File without changes
onnx-v1/ort_config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "one_external_file": true,
3
+ "opset": null,
4
+ "optimization": {},
5
+ "optimum_version": "1.12.0",
6
+ "quantization": {
7
+ "activations_dtype": "QUInt8",
8
+ "activations_symmetric": false,
9
+ "format": "QOperator",
10
+ "is_static": false,
11
+ "mode": "IntegerOps",
12
+ "nodes_to_exclude": [],
13
+ "nodes_to_quantize": [],
14
+ "operators_to_quantize": [
15
+ "Conv",
16
+ "MatMul",
17
+ "Attention",
18
+ "LSTM",
19
+ "Gather",
20
+ "Transpose",
21
+ "EmbedLayerNormalization"
22
+ ],
23
+ "per_channel": false,
24
+ "qdq_add_pair_to_weight": false,
25
+ "qdq_dedicated_pair": false,
26
+ "qdq_op_type_per_channel_support_to_axis": {
27
+ "MatMul": 1
28
+ },
29
+ "reduce_range": false,
30
+ "weights_dtype": "QInt8",
31
+ "weights_symmetric": true
32
+ },
33
+ "transformers_version": "4.33.0",
34
+ "use_external_data_format": false
35
+ }