Upload 18 files

Browse files

Files changed (11) hide show

onnx/decoder_model.onnx +1 -1
onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +1 -1
onnx/decoder_model_quantized.onnx +1 -1
onnx/decoder_with_past_model.onnx +1 -1
onnx/decoder_with_past_model_quantized.onnx +1 -1
onnx/encoder_model.onnx +1 -1
onnx/encoder_model_quantized.onnx +1 -1
pytorch_model.bin +1 -1
quantize_config.json +76 -76
training_args.bin +1 -1

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b562d5631d23b71d9417071e8041f3eb80e84122a9bbb66dfdec8d46d91594d4
 size 385864797

 version https://git-lfs.github.com/spec/v1
+oid sha256:5aedbc7bb81581bdd4b90f65db39dc22b3dcdea3923d67542449aa24bd46eaf7
 size 385864797

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:129100f907e7295525d4529083bfb5bdcc206eedce9f9d4a6223131ea8cb8e87
 size 387342586

 version https://git-lfs.github.com/spec/v1
+oid sha256:c398f8e6fd8bf8b03105a7ada1541f488c07870229210a128205c6492b7c38ed
 size 387342586

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d636dce4f19d08059cf075c25b75f94f71e5b28081d3be8c3823c07f40c59604
 size 99759579

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c66eda97aa444b17357dfba1c9827abc7824d6fd905dd28f097f74ddef02943
 size 99759579

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:87de04f08ef3a7cec2f3cd71d4de440864ab0a7f4f32ad0764fdb8d26387fe94
 size 98065763

 version https://git-lfs.github.com/spec/v1
+oid sha256:8cda4a51db36003185beb5557cc379d0ad773d4efa9329e39793828b74d420f4
 size 98065763

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3e69a840d8b693b738d31f9bab09434311b1eb022f4c6a89f7c31ae4ac76428
 size 385864377

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ab017c9a31793692bb56c0b93be42cb0090d97f6efc9cbd25f092a93451f45e
 size 385864377

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5da506c3668083b54468a4be3d0581c2749abc28c68d4f6f816d7f03548ea977
 size 98063170

 version https://git-lfs.github.com/spec/v1
+oid sha256:7885df45251f50971c9a8fdf11c79011342988bcabdb0649470751076226b8ae
 size 98063170

onnx/encoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e06aee9b192045a32c40f0bac2e1304e153f7b7521286a65a478893a582b4087
 size 343440632

 version https://git-lfs.github.com/spec/v1
+oid sha256:e48effb1e61fcecf4d1587fb15894d15510f366971ff22224719048168a70707
 size 343440632

onnx/encoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:90563de4250ab0e12730242476b884529a1a825059c36212bd4ae1dac2e87c56
 size 87038173

 version https://git-lfs.github.com/spec/v1
+oid sha256:04622bdece4419687c8a07f4df0e8c1bea1db354fb6decde97bc0bf39f26bab2
 size 87038173

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c82a8f09d299196b2a3237374d874d008567e0d9d9044c48b24965138d8394e
 size 730052378

 version https://git-lfs.github.com/spec/v1
+oid sha256:ea90951d68491925423f56366196ab4d2a7cbafecc88d58623b8f74ae2118872
 size 730052378

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Add",
-                "Transpose",
-                "Squeeze",
-                "Range",
-                "Slice",
-                "ConstantOfShape",
                 "MatMul",
-                "Where",
-                "ReduceMean",
                 "Div",
-                "Unsqueeze",
                 "Split",
                 "Cast",
                 "Gemm",
                 "Tanh",
-                "Pow",
-                "Mul",
-                "Gather",
-                "Reshape",
-                "Softmax",
-                "Sqrt",
-                "Shape",
-                "Constant",
-                "Sub",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
-                "Add",
-                "Transpose",
-                "Squeeze",
-                "Range",
-                "Slice",
-                "ConstantOfShape",
                 "MatMul",
-                "Where",
-                "ReduceMean",
                 "Div",
-                "Unsqueeze",
                 "Split",
                 "Cast",
                 "Gemm",
                 "Tanh",
-                "Pow",
-                "Mul",
-                "Gather",
-                "Reshape",
-                "Softmax",
-                "Sqrt",
-                "Shape",
-                "Constant",
-                "Sub",
-                "If",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Add",
-                "Transpose",
-                "Squeeze",
-                "Range",
-                "Slice",
-                "ConstantOfShape",
                 "MatMul",
-                "Where",
-                "ReduceMean",
                 "Div",
-                "Unsqueeze",
                 "Split",
                 "Cast",
                 "Gemm",
                 "Tanh",
-                "Pow",
-                "Mul",
-                "Gather",
-                "Reshape",
-                "Softmax",
-                "Sqrt",
-                "Shape",
-                "Constant",
-                "Sub",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
         "encoder_model": {
             "op_types": [
-                "Add",
-                "Transpose",
-                "Equal",
-                "Slice",
-                "Expand",
-                "ConstantOfShape",
                 "MatMul",
-                "Where",
-                "ReduceMean",
-                "Div",
-                "Unsqueeze",
-                "Conv",
-                "Pow",
                 "Mul",
-                "Gather",
-                "Reshape",
-                "Softmax",
-                "Sqrt",
-                "Shape",
                 "Constant",
                 "Sub",
                 "Erf",
-                "Concat"
             ],
             "weight_type": "QUInt8"
         }

     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Sqrt",
                 "MatMul",
+                "Concat",
+                "Mul",
+                "Constant",
+                "Shape",
+                "Range",
+                "Pow",
                 "Div",
                 "Split",
+                "Sub",
+                "Where",
+                "Reshape",
+                "Gather",
+                "Unsqueeze",
                 "Cast",
+                "ReduceMean",
+                "Softmax",
+                "ConstantOfShape",
+                "Slice",
                 "Gemm",
                 "Tanh",
+                "Transpose",
+                "Add",
+                "Squeeze"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
+                "Sqrt",
                 "MatMul",
+                "Concat",
+                "Mul",
+                "If",
+                "Constant",
+                "Shape",
+                "Range",
+                "Pow",
                 "Div",
                 "Split",
+                "Sub",
+                "Where",
+                "Reshape",
+                "Gather",
+                "Unsqueeze",
                 "Cast",
+                "ReduceMean",
+                "Softmax",
+                "ConstantOfShape",
+                "Slice",
                 "Gemm",
                 "Tanh",
+                "Transpose",
+                "Add",
+                "Squeeze"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Sqrt",
                 "MatMul",
+                "Concat",
+                "Mul",
+                "Constant",
+                "Shape",
+                "Range",
+                "Pow",
                 "Div",
                 "Split",
+                "Sub",
+                "Where",
+                "Reshape",
+                "Gather",
+                "Unsqueeze",
                 "Cast",
+                "ReduceMean",
+                "Softmax",
+                "ConstantOfShape",
+                "Slice",
                 "Gemm",
                 "Tanh",
+                "Transpose",
+                "Squeeze",
+                "Add"
             ],
             "weight_type": "QInt8"
         },
         "encoder_model": {
             "op_types": [
+                "Sqrt",
                 "MatMul",
+                "Concat",
                 "Mul",
                 "Constant",
+                "Expand",
+                "Shape",
+                "Pow",
+                "Div",
+                "Conv",
                 "Sub",
+                "Where",
+                "Reshape",
+                "Gather",
                 "Erf",
+                "Unsqueeze",
+                "Equal",
+                "ReduceMean",
+                "Softmax",
+                "ConstantOfShape",
+                "Slice",
+                "Transpose",
+                "Add"
             ],
             "weight_type": "QUInt8"
         }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c6124d14554c856f07f64ebbca472baff63ce12555bd850dbac15bdf294e64c5
 size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:6df8b3132ea43f82797da62dc92bab7492b597315c59b9eeae0937e97904f9e0
 size 4728