Upload folder using huggingface_hub

Browse files

Files changed (9)

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +88 -0

config.json CHANGED Viewed

@@ -47,7 +47,7 @@
   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
-  "transformers_version": "4.29.2",
   "use_cache": false,
   "vocab_size": 50258,
   "window_size": 256

   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": false,
   "vocab_size": 50258,
   "window_size": 256

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
-  "transformers_version": "4.29.2"
 }

   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b0f586629a5c1dc00495a85d2f5c0a0bdfeca920efed9d81beff576e4cfe90db
-size 663875781

 version https://git-lfs.github.com/spec/v1
+oid sha256:495a71c1e0b3bab2635b246850881ef27a3101b01b5ae000ca0b3918098efbbe
+size 509481664

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a22d3658b34dce337faf404ae6676be07ea8b4067b6d62a3c822f11b01ae04bb
-size 664181010

 version https://git-lfs.github.com/spec/v1
+oid sha256:a9be8abd3ce0240b3b0dd9cdaa378f4f00ea1427abf12a10b1478ba68bc19684
+size 518173878

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73f9cda9618743ee5334a2fc840fac348e4fde2ef207f9df9ca82059ea3d3637
-size 174104756

 version https://git-lfs.github.com/spec/v1
+oid sha256:7c738a0bebd9cae8408ed1941192bd7cce35140997c8f42fca632dda543d1465
+size 143638305

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1de292dc884bcee7c288153692142da949633eef0dc0433a311af2cf8acaf6dd
-size 173615198

 version https://git-lfs.github.com/spec/v1
+oid sha256:e53834a268d833c5efdc3b890c074806055f093e0d69cc0fa3f469c36dec1cf7
+size 134762955

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a31ee7af77875693df54e37562d40795077f93bd4f60b597bfd2a22f8418f4c
-size 663883544

 version https://git-lfs.github.com/spec/v1
+oid sha256:423da608d177bea869d8a6683b55097b8de1616ee8a1cb0d1774f1267ebc94cb
+size 509489427

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cea7873f398d5a4f7af7d7315d65689781725b2fce5cea9118c184589fcb0cb6
-size 173624782

 version https://git-lfs.github.com/spec/v1
+oid sha256:f3771be8da093ba69bf84a3847f7bec486acd2f5bdb2ebb37b8f03499b3084ed
+size 134772539

quantize_config.json ADDED Viewed

@@ -0,0 +1,88 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Tanh",
+                "Slice",
+                "MatMul",
+                "Div",
+                "Shape",
+                "ReduceMean",
+                "Concat",
+                "Squeeze",
+                "Constant",
+                "Reshape",
+                "Mul",
+                "Where",
+                "Range",
+                "Gather",
+                "Sqrt",
+                "Pow",
+                "Transpose",
+                "Cast",
+                "Sub",
+                "Unsqueeze",
+                "Add",
+                "Softmax"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Tanh",
+                "Slice",
+                "MatMul",
+                "Div",
+                "Shape",
+                "ReduceMean",
+                "Concat",
+                "Squeeze",
+                "Constant",
+                "Reshape",
+                "Mul",
+                "Where",
+                "Range",
+                "Gather",
+                "Sqrt",
+                "Pow",
+                "Transpose",
+                "Cast",
+                "Sub",
+                "Unsqueeze",
+                "Add",
+                "If",
+                "Softmax"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Tanh",
+                "Slice",
+                "MatMul",
+                "Div",
+                "Shape",
+                "ReduceMean",
+                "Concat",
+                "Squeeze",
+                "Constant",
+                "Reshape",
+                "Mul",
+                "Where",
+                "Range",
+                "Gather",
+                "Sqrt",
+                "Pow",
+                "Transpose",
+                "Cast",
+                "Sub",
+                "Unsqueeze",
+                "Add",
+                "Softmax"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}