Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

onnx/model.onnx +3 -0
onnx/model_bnb4.onnx +3 -0
onnx/model_fp16.onnx +3 -0
onnx/model_int8.onnx +3 -0
onnx/model_q4.onnx +3 -0
onnx/model_quantized.onnx +3 -0
onnx/model_uint8.onnx +3 -0
quantize_config.json +120 -0

onnx/model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:afb6a5c28f3b6bf1618c6e43f02073ef9dfdc70e937502d51603e57b0a1df10c
+size 99060839

onnx/model_bnb4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0312c94ffd25c662880df1d55b336f028115166eb574ebc1622901d39e984185
+size 26077648

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2df6223f206b5164e21f664ace61dabeb9bb6a49b8b5a3e00510b4807d0f5b04
+size 49642442

onnx/model_int8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:01aa7a23de3f4a0ee1a2bb9997e6918104c85a9f95dea46d27b9b3fb0c6b9001
+size 27258801

onnx/model_q4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d55b02762e1907589158af3e366bd61ddf648155852a07bbf5e3a074639fcf8
+size 27404416

onnx/model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fcf51f1b230362b28690bb9d1809bf0431f29cad20534e3f589bd7285547f20d
+size 27258801

onnx/model_uint8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fcf51f1b230362b28690bb9d1809bf0431f29cad20534e3f589bd7285547f20d
+size 27258801

quantize_config.json ADDED Viewed

	@@ -0,0 +1,120 @@

+{
+    "fp16": {},
+    "q8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "Concat",
+                    "Conv",
+                    "ConvTranspose",
+                    "Div",
+                    "Equal",
+                    "Erf",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Pow",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Resize",
+                    "Shape",
+                    "Slice",
+                    "Softmax",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": true,
+        "reduce_range": true
+    },
+    "int8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "Concat",
+                    "Conv",
+                    "ConvTranspose",
+                    "Div",
+                    "Equal",
+                    "Erf",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Pow",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Resize",
+                    "Shape",
+                    "Slice",
+                    "Softmax",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": true,
+        "reduce_range": true
+    },
+    "uint8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "Concat",
+                    "Conv",
+                    "ConvTranspose",
+                    "Div",
+                    "Equal",
+                    "Erf",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Pow",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Resize",
+                    "Shape",
+                    "Slice",
+                    "Softmax",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": true,
+        "reduce_range": true
+    },
+    "q4": {
+        "block_size": 32,
+        "is_symmetric": true,
+        "accuracy_level": null
+    },
+    "bnb4": {
+        "block_size": 64,
+        "quant_type": 1
+    }
+}