Xenova HF staff committed on
Commit
8b785a6
·
verified ·
1 Parent(s): 1287824

Upload folder using huggingface_hub

Browse files
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8da7df5f74944dcc8cc657f70b863e28c371131e433be75e95f35933d20b7ab2
3
+ size 37970693
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a53f2a8c6a7355d14c4061466d542e08246e783930542367d875b9b83c5b132
3
+ size 37970712
onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffb20ec49baaf909ba369e9344cbd6e132ff31ee1c1801e3d328970fdb33d5d7
3
+ size 19069292
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d197a46be3a7844187b0c22a7b2575cf4d09061f7be7b8147c448a7129ada9b8
3
+ size 9919544
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a53f2a8c6a7355d14c4061466d542e08246e783930542367d875b9b83c5b132
3
+ size 37970712
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:816714d6b6cfcfca43562488089fa87096fe25d63bb0542bbb48af32d0eeace9
3
+ size 9919577
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:816714d6b6cfcfca43562488089fa87096fe25d63bb0542bbb48af32d0eeace9
3
+ size 9919577
quantize_config.json ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fp16": {},
3
+ "q8": {
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Add",
8
+ "BatchNormalization",
9
+ "Constant",
10
+ "Conv",
11
+ "Div",
12
+ "Erf",
13
+ "Flatten",
14
+ "Gemm",
15
+ "GlobalAveragePool",
16
+ "Identity",
17
+ "Mul",
18
+ "ReduceMean",
19
+ "Relu",
20
+ "Sigmoid",
21
+ "Sub"
22
+ ],
23
+ "weight_type": "QUInt8"
24
+ }
25
+ },
26
+ "per_channel": false,
27
+ "reduce_range": false
28
+ },
29
+ "int8": {
30
+ "per_model_config": {
31
+ "model": {
32
+ "op_types": [
33
+ "Add",
34
+ "BatchNormalization",
35
+ "Constant",
36
+ "Conv",
37
+ "Div",
38
+ "Erf",
39
+ "Flatten",
40
+ "Gemm",
41
+ "GlobalAveragePool",
42
+ "Identity",
43
+ "Mul",
44
+ "ReduceMean",
45
+ "Relu",
46
+ "Sigmoid",
47
+ "Sub"
48
+ ],
49
+ "weight_type": "QInt8"
50
+ }
51
+ },
52
+ "per_channel": false,
53
+ "reduce_range": false
54
+ },
55
+ "uint8": {
56
+ "per_model_config": {
57
+ "model": {
58
+ "op_types": [
59
+ "Add",
60
+ "BatchNormalization",
61
+ "Constant",
62
+ "Conv",
63
+ "Div",
64
+ "Erf",
65
+ "Flatten",
66
+ "Gemm",
67
+ "GlobalAveragePool",
68
+ "Identity",
69
+ "Mul",
70
+ "ReduceMean",
71
+ "Relu",
72
+ "Sigmoid",
73
+ "Sub"
74
+ ],
75
+ "weight_type": "QUInt8"
76
+ }
77
+ },
78
+ "per_channel": false,
79
+ "reduce_range": false
80
+ },
81
+ "q4": {
82
+ "block_size": 32,
83
+ "is_symmetric": true,
84
+ "accuracy_level": null
85
+ },
86
+ "bnb4": {
87
+ "block_size": 64,
88
+ "quant_type": 1
89
+ }
90
+ }