Upload folder using huggingface_hub

Files changed (6) hide show

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+_model_layers.0_self_attn_rotary_emb_Constant_5_attr__value filter=lfs diff=lfs merge=lfs -text
+_model_layers.0_self_attn_rotary_emb_Constant_attr__value filter=lfs diff=lfs merge=lfs -text

_model_layers.0_self_attn_rotary_emb_Constant_5_attr__value ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:38f44286ec0ca2a407877f4908d4f5607fb5f3a76a9099ee583cc7684dc7de0c
+size 8388608

_model_layers.0_self_attn_rotary_emb_Constant_attr__value ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e699ce948b3c9fc0b86dc4beb337c5fb1b1edbce5d094aa07c8ae37cd7199f3
+size 8388608

onnx/model.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3d63556db976ef2983174f01cc496aa8d90715a81e6c9f130c2965d473984979
+size 1873498357

onnx/model_quantized.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:068cad70fa3850652e6ebc0ad7a49847568f32e6eda5a8527e5893de9a7b8939
+size 482326147

quantize_config.json CHANGED Viewed

@@ -4,34 +4,34 @@
     "per_model_config": {
         "model": {
             "op_types": [
-                "Shape",
                 "Reshape",
-                "Expand",
-                "Add",
-                "Div",
-                "Equal",
-                "Where",
-                "Concat",
                 "Slice",
                 "Unsqueeze",
                 "Mul",
                 "Pow",
-                "Neg",
-                "Squeeze",
-                "Constant",
-                "MatMul",
-                "Less",
-                "Gather",
-                "Cast",
-                "ReduceMean",
-                "Sqrt",
                 "Range",
                 "Transpose",
-                "Sigmoid",
                 "ConstantOfShape",
-                "Softmax",
-                "Trilu",
-                "Sub"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "model": {
             "op_types": [
+                "Less",
+                "MatMul",
+                "Sqrt",
+                "Softmax",
                 "Reshape",
+                "Gather",
                 "Slice",
+                "Equal",
+                "Neg",
+                "Sigmoid",
                 "Unsqueeze",
+                "Constant",
+                "Expand",
+                "Squeeze",
+                "Concat",
                 "Mul",
+                "Shape",
                 "Pow",
+                "Add",
+                "Where",
+                "Trilu",
                 "Range",
+                "Div",
+                "Cast",
+                "Sub",
                 "Transpose",
                 "ConstantOfShape",
+                "ReduceMean"
             ],
             "weight_type": "QInt8"
         }