Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -0
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +65 -66
special_tokens_map.json +3 -21
tokenizer_config.json +29 -23

config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "architectures": [
     "LlamaForCausalLM"
   ],

 {
+  "_name_or_path": "Xenova/llama2.c-stories42M",
   "architectures": [
     "LlamaForCausalLM"
   ],

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:57fecedae457d1811cd12abe22589f313aa15c1590e1e09bae3408052e6a74c7
-size 233102386

 version https://git-lfs.github.com/spec/v1
+oid sha256:2875c864cfa242d3ce797f1c8f47c8779bc4d4d22bedffc7c5220d3405a4b1de
+size 167565936

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:46464ab95c2c94ad1e493d0ca7746763f367343fce80cdcf7d0036911947564c
-size 233913496

 version https://git-lfs.github.com/spec/v1
+oid sha256:315d6c6d96edac7ab954841322d443a69102c059e8ac20ba89faf3f0236769aa
+size 168376680

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:afb16b73d5c4f6e825abedc3ce65298ecd567e29c75dc98cc7f7b8dbf9e00074
-size 60022789

 version https://git-lfs.github.com/spec/v1
+oid sha256:b5e81e0464c3028cd88b9f457a8770a16c268258c0fdc290ca04035bdbb575f3
+size 43636490

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea09156167b318bfb6149e325a18c79e95e0948175dd3fb496da53ca0589f070
-size 59060350

 version https://git-lfs.github.com/spec/v1
+oid sha256:44b2bc266767e042cb7277e7234c916ca678841ccaef3bc1f3e76bfe6c41f689
+size 42675110

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:47d1d207d61288f734b55448c70e5b344262c01087900f6c258b7805e0ed86a9
-size 233104923

 version https://git-lfs.github.com/spec/v1
+oid sha256:7c13e4732ed2e01643955726fa276efa3f3bf49279e42c837ef50893f292b71a
+size 167568570

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ca6889c5883f8686fd4ba12ee26e025b490d7ffcbe1408c8b92f766e3df6f199
-size 59062863

 version https://git-lfs.github.com/spec/v1
+oid sha256:886b10a41ecb479dffa829513765f4e445ddcef1c972d5b95aadd10eecd854df
+size 42677756

quantize_config.json CHANGED Viewed

@@ -2,104 +2,103 @@
     "per_channel": false,
     "reduce_range": false,
     "per_model_config": {
-        "decoder_model": {
             "op_types": [
-                "Sub",
-                "Softmax",
-                "Neg",
-                "Sqrt",
-                "Reshape",
-                "If",
-                "Shape",
-                "Transpose",
                 "Pow",
-                "Mul",
-                "MatMul",
                 "Gather",
                 "Slice",
-                "Less",
-                "ReduceMean",
-                "Concat",
-                "Range",
-                "Unsqueeze",
-                "Equal",
-                "Cast",
                 "ConstantOfShape",
-                "Add",
                 "Sigmoid",
-                "Where",
-                "Squeeze",
-                "Constant",
                 "Identity",
                 "Div",
-                "Expand"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Sub",
-                "Softmax",
-                "Neg",
-                "Sqrt",
-                "Reshape",
-                "If",
-                "Shape",
-                "Transpose",
                 "Pow",
-                "Mul",
-                "MatMul",
                 "Gather",
                 "Slice",
-                "ReduceMean",
-                "Concat",
-                "Range",
-                "Unsqueeze",
-                "Equal",
-                "Cast",
                 "ConstantOfShape",
-                "Add",
                 "Sigmoid",
-                "Where",
-                "Squeeze",
-                "Constant",
                 "Identity",
                 "Div",
-                "Expand"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
-                "Sub",
-                "Softmax",
-                "Neg",
-                "Sqrt",
-                "Reshape",
-                "If",
-                "Shape",
-                "Transpose",
                 "Pow",
-                "Mul",
-                "MatMul",
                 "Gather",
                 "Slice",
                 "Less",
-                "ReduceMean",
-                "Concat",
-                "Range",
-                "Unsqueeze",
-                "Equal",
-                "Cast",
                 "ConstantOfShape",
-                "Add",
                 "Sigmoid",
-                "Where",
-                "Squeeze",
-                "Constant",
                 "Identity",
                 "Div",
-                "Expand"
             ],
             "weight_type": "QInt8"
         }

     "per_channel": false,
     "reduce_range": false,
     "per_model_config": {
+        "decoder_with_past_model": {
             "op_types": [
+                "Unsqueeze",
                 "Pow",
+                "If",
                 "Gather",
+                "Constant",
+                "Squeeze",
+                "Reshape",
                 "Slice",
+                "Neg",
                 "ConstantOfShape",
                 "Sigmoid",
+                "Softmax",
                 "Identity",
+                "Sub",
+                "Cast",
+                "Expand",
                 "Div",
+                "Mul",
+                "Add",
+                "Shape",
+                "Sqrt",
+                "Where",
+                "Equal",
+                "MatMul",
+                "Concat",
+                "Transpose",
+                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model": {
             "op_types": [
+                "Unsqueeze",
                 "Pow",
+                "If",
                 "Gather",
+                "Constant",
+                "Squeeze",
+                "Reshape",
                 "Slice",
+                "Less",
+                "Neg",
                 "ConstantOfShape",
                 "Sigmoid",
+                "Softmax",
                 "Identity",
+                "Sub",
+                "Expand",
                 "Div",
+                "Mul",
+                "Add",
+                "Shape",
+                "Sqrt",
+                "Where",
+                "Equal",
+                "MatMul",
+                "Concat",
+                "Range",
+                "Transpose",
+                "Cast",
+                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
+                "Unsqueeze",
                 "Pow",
+                "If",
                 "Gather",
+                "Constant",
+                "Squeeze",
+                "Reshape",
                 "Slice",
                 "Less",
+                "Neg",
                 "ConstantOfShape",
                 "Sigmoid",
+                "Softmax",
                 "Identity",
+                "Sub",
+                "Expand",
                 "Div",
+                "Mul",
+                "Add",
+                "Shape",
+                "Sqrt",
+                "Where",
+                "Equal",
+                "MatMul",
+                "Concat",
+                "Range",
+                "Transpose",
+                "Cast",
+                "ReduceMean"
             ],
             "weight_type": "QInt8"
         }

special_tokens_map.json CHANGED Viewed

@@ -1,23 +1,5 @@
 {
-  "bos_token": {
-    "content": "<s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "eos_token": {
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "<unk>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  }
 }

 {
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "unk_token": "<unk>"
 }

tokenizer_config.json CHANGED Viewed

@@ -1,32 +1,38 @@
 {
-  "bos_token": {
-    "__type": "AddedToken",
-    "content": "<s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
   },
   "clean_up_tokenization_spaces": false,
-  "eos_token": {
-    "__type": "AddedToken",
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
   "model_max_length": 2048,
   "pad_token": null,
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizer",
-  "unk_token": {
-    "__type": "AddedToken",
-    "content": "<unk>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
   "use_default_system_prompt": true
 }

 {
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
   },
+  "additional_special_tokens": [],
+  "bos_token": "<s>",
   "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
   "model_max_length": 2048,
   "pad_token": null,
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
   "use_default_system_prompt": true
 }