openvino-ci committed on
Commit
65cc9da
1 Parent(s): bcce2cb

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -14,7 +14,7 @@ This is [RedPajama-INCITE-Chat-3B-v1](https://huggingface.co/togethercomputer/Re
14
  Weight compression was performed using `nncf.compress_weights` with the following parameters:
15
 
16
  * mode: **int4_asym**
17
- * ratio: **0.8**
18
  * group_size: **128**
19
 
20
  For more information on quantization, check the [OpenVINO model optimization guide](https://docs.openvino.ai/2024/openvino-workflow/model-optimization-guide/weight-compression.html).
@@ -24,11 +24,10 @@ For more information on quantization, check the [OpenVINO model optimization gui
24
 
25
  The provided OpenVINO™ IR model is compatible with:
26
 
27
- * OpenVINO version 2024.2.0 and higher
28
- * Optimum Intel 1.19.0 and higher
29
-
30
- ## Running Model Inference with [Optimum Intel](https://huggingface.co/docs/optimum/intel/index)
31
 
 
32
 
33
  1. Install packages required for using [Optimum Intel](https://huggingface.co/docs/optimum/intel/index) integration with the OpenVINO backend:
34
 
@@ -55,40 +54,9 @@ print(text)
55
 
56
  For more examples and possible optimizations, refer to the [OpenVINO Large Language Model Inference Guide](https://docs.openvino.ai/2024/learn-openvino/llm_inference_guide.html).
57
 
58
- ## Running Model Inference with [OpenVINO GenAI](https://github.com/openvinotoolkit/openvino.genai)
59
-
60
- 1. Install packages required for using OpenVINO GenAI.
61
- ```
62
- pip install openvino-genai huggingface_hub
63
- ```
64
-
65
- 2. Download model from HuggingFace Hub
66
-
67
- ```
68
- import huggingface_hub as hf_hub
69
-
70
- model_id = "OpenVINO/RedPajama-INCITE-Chat-3B-v1-int4-ov"
71
- model_path = "RedPajama-INCITE-Chat-3B-v1-int4-ov"
72
-
73
- hf_hub.snapshot_download(model_id, local_dir=model_path)
74
-
75
- ```
76
-
77
- 3. Run model inference:
78
-
79
- ```
80
- import openvino_genai as ov_genai
81
-
82
- device = "CPU"
83
- pipe = ov_genai.LLMPipeline(model_path, device)
84
- print(pipe.generate("What is OpenVINO?", max_length=200))
85
- ```
86
-
87
- More GenAI usage examples can be found in OpenVINO GenAI library [docs](https://github.com/openvinotoolkit/openvino.genai/blob/master/src/README.md) and [samples](https://github.com/openvinotoolkit/openvino.genai?tab=readme-ov-file#openvino-genai-samples)
88
-
89
  ## Limitations
90
 
91
- Check the original model card for [limitations]().
92
 
93
  ## Legal information
94
 
 
14
  Weight compression was performed using `nncf.compress_weights` with the following parameters:
15
 
16
  * mode: **int4_asym**
17
+ * ratio: **1**
18
  * group_size: **128**
19
 
20
  For more information on quantization, check the [OpenVINO model optimization guide](https://docs.openvino.ai/2024/openvino-workflow/model-optimization-guide/weight-compression.html).
 
24
 
25
  The provided OpenVINO™ IR model is compatible with:
26
 
27
+ * OpenVINO version 2024.4.0 and higher
28
+ * Optimum Intel 1.20.0 and higher
 
 
29
 
30
+ ## Running Model Inference
31
 
32
  1. Install packages required for using [Optimum Intel](https://huggingface.co/docs/optimum/intel/index) integration with the OpenVINO backend:
33
 
 
54
 
55
  For more examples and possible optimizations, refer to the [OpenVINO Large Language Model Inference Guide](https://docs.openvino.ai/2024/learn-openvino/llm_inference_guide.html).
56
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  ## Limitations
58
 
59
+ Check the [original model card](https://huggingface.co/togethercomputer/RedPajama-INCITE-Chat-3B-v1) for limitations.
60
 
61
  ## Legal information
62
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "OpenVINO/RedPajama-INCITE-Chat-3B-v1-int4-ov",
3
  "architectures": [
4
  "GPTNeoXForCausalLM"
5
  ],
@@ -18,11 +18,14 @@
18
  "model_type": "gpt_neox",
19
  "num_attention_heads": 32,
20
  "num_hidden_layers": 32,
 
21
  "rope_scaling": null,
 
22
  "rotary_emb_base": 10000,
23
  "rotary_pct": 1.0,
24
  "tie_word_embeddings": false,
25
- "transformers_version": "4.41.2",
 
26
  "use_cache": true,
27
  "use_parallel_residual": false,
28
  "vocab_size": 50432
 
1
  {
2
+ "_name_or_path": "togethercomputer/RedPajama-INCITE-Chat-3B-v1",
3
  "architectures": [
4
  "GPTNeoXForCausalLM"
5
  ],
 
18
  "model_type": "gpt_neox",
19
  "num_attention_heads": 32,
20
  "num_hidden_layers": 32,
21
+ "partial_rotary_factor": 1.0,
22
  "rope_scaling": null,
23
+ "rope_theta": 10000,
24
  "rotary_emb_base": 10000,
25
  "rotary_pct": 1.0,
26
  "tie_word_embeddings": false,
27
+ "torch_dtype": "float16",
28
+ "transformers_version": "4.45.2",
29
  "use_cache": true,
30
  "use_parallel_residual": false,
31
  "vocab_size": 50432
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
- "transformers_version": "4.41.2"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
+ "transformers_version": "4.45.2"
6
  }
openvino_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "compression": null,
3
+ "dtype": "int4",
4
+ "input_info": null,
5
+ "optimum_version": "1.23.1",
6
+ "quantization_config": {
7
+ "all_layers": null,
8
+ "bits": 4,
9
+ "dataset": "wikitext2",
10
+ "gptq": null,
11
+ "group_size": 128,
12
+ "ignored_scope": null,
13
+ "num_samples": null,
14
+ "quant_method": "default",
15
+ "ratio": 1.0,
16
+ "scale_estimation": true,
17
+ "sensitivity_metric": null,
18
+ "sym": false,
19
+ "tokenizer": null,
20
+ "trust_remote_code": true,
21
+ "weight_format": "int4"
22
+ },
23
+ "save_onnx_model": false,
24
+ "transformers_version": "4.45.2"
25
+ }
openvino_detokenizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07cc9ef2460d39577b5a80e2b379766a90187c17b436a2e530467180319bc312
3
- size 558446
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1da2b7ea623e526bc5d1b509164ae94e333c3c762fbc6d8f6e90384e6f0d6b66
3
+ size 514079
openvino_detokenizer.xml CHANGED
@@ -1,16 +1,16 @@
1
  <?xml version="1.0"?>
2
  <net name="detokenizer" version="11">
3
  <layers>
4
- <layer id="0" name="Parameter_458255" type="Parameter" version="opset1">
5
  <data shape="?,?" element_type="i64" />
6
  <output>
7
- <port id="0" precision="I64" names="Parameter_458255">
8
  <dim>-1</dim>
9
  <dim>-1</dim>
10
  </port>
11
  </output>
12
  </layer>
13
- <layer id="1" name="Convert_458271" type="Convert" version="opset1">
14
  <data destination_type="i32" />
15
  <input>
16
  <port id="0" precision="I64">
@@ -25,19 +25,19 @@
25
  </port>
26
  </output>
27
  </layer>
28
- <layer id="2" name="Constant_458153" type="Const" version="opset1">
29
- <data element_type="u8" shape="558397" offset="0" size="558397" />
30
  <output>
31
  <port id="0" precision="U8">
32
- <dim>558397</dim>
33
  </port>
34
  </output>
35
  </layer>
36
- <layer id="3" name="StringTensorUnpack_458154" type="StringTensorUnpack" version="extension">
37
  <data mode="begins_ends" />
38
  <input>
39
  <port id="0" precision="U8">
40
- <dim>558397</dim>
41
  </port>
42
  </input>
43
  <output>
@@ -52,7 +52,7 @@
52
  </port>
53
  </output>
54
  </layer>
55
- <layer id="4" name="VocabDecoder_458256" type="VocabDecoder" version="extension">
56
  <data skip_tokens="0, 1" />
57
  <input>
58
  <port id="0" precision="I32">
@@ -87,7 +87,7 @@
87
  </port>
88
  </output>
89
  </layer>
90
- <layer id="5" name="CharsToBytes_458257" type="CharsToBytes" version="extension">
91
  <input>
92
  <port id="0" precision="I32">
93
  <dim>-1</dim>
@@ -101,39 +101,33 @@
101
  <port id="3" precision="I32">
102
  <dim>-1</dim>
103
  </port>
104
- <port id="4" precision="U8">
105
- <dim>-1</dim>
106
- </port>
107
  </input>
108
  <output>
109
- <port id="5" precision="I32">
110
- <dim>-1</dim>
111
- </port>
112
- <port id="6" precision="I32">
113
  <dim>-1</dim>
114
  </port>
115
- <port id="7" precision="U8">
116
  <dim>-1</dim>
117
  </port>
118
  </output>
119
  </layer>
120
- <layer id="6" name="Constant_458259" type="Const" version="opset1">
121
- <data element_type="u8" shape="47" offset="558397" size="47" />
122
  <output>
123
  <port id="0" precision="U8">
124
  <dim>47</dim>
125
  </port>
126
  </output>
127
  </layer>
128
- <layer id="7" name="Constant_458261" type="Const" version="opset1">
129
- <data element_type="u8" shape="2" offset="558444" size="2" />
130
  <output>
131
  <port id="0" precision="U8">
132
  <dim>2</dim>
133
  </port>
134
  </output>
135
  </layer>
136
- <layer id="8" name="RegexNormalization_458262" type="RegexNormalization" version="extension">
137
  <data global_replace="true" />
138
  <input>
139
  <port id="0" precision="I32">
@@ -164,7 +158,7 @@
164
  </port>
165
  </output>
166
  </layer>
167
- <layer id="9" name="StringTensorPack_458263" type="StringTensorPack" version="extension">
168
  <data mode="begins_ends" />
169
  <input>
170
  <port id="0" precision="I32">
@@ -183,7 +177,7 @@
183
  </port>
184
  </output>
185
  </layer>
186
- <layer id="10" name="Result_458264" type="Result" version="opset1">
187
  <input>
188
  <port id="0" precision="STRING">
189
  <dim>-1</dim>
@@ -198,14 +192,13 @@
198
  <edge from-layer="3" from-port="1" to-layer="4" to-port="1" />
199
  <edge from-layer="3" from-port="2" to-layer="4" to-port="2" />
200
  <edge from-layer="3" from-port="3" to-layer="4" to-port="3" />
201
- <edge from-layer="4" from-port="8" to-layer="5" to-port="4" />
202
  <edge from-layer="4" from-port="7" to-layer="5" to-port="3" />
 
203
  <edge from-layer="4" from-port="6" to-layer="5" to-port="2" />
204
  <edge from-layer="4" from-port="5" to-layer="5" to-port="1" />
205
  <edge from-layer="4" from-port="4" to-layer="5" to-port="0" />
206
- <edge from-layer="5" from-port="5" to-layer="8" to-port="0" />
207
- <edge from-layer="5" from-port="6" to-layer="8" to-port="1" />
208
- <edge from-layer="5" from-port="7" to-layer="8" to-port="2" />
209
  <edge from-layer="6" from-port="0" to-layer="8" to-port="3" />
210
  <edge from-layer="7" from-port="0" to-layer="8" to-port="4" />
211
  <edge from-layer="8" from-port="5" to-layer="9" to-port="0" />
@@ -214,6 +207,8 @@
214
  <edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
215
  </edges>
216
  <rt_info>
 
217
  <eos_token_id value="0" />
 
218
  </rt_info>
219
  </net>
 
1
  <?xml version="1.0"?>
2
  <net name="detokenizer" version="11">
3
  <layers>
4
+ <layer id="0" name="Parameter_184670" type="Parameter" version="opset1">
5
  <data shape="?,?" element_type="i64" />
6
  <output>
7
+ <port id="0" precision="I64" names="Parameter_184670">
8
  <dim>-1</dim>
9
  <dim>-1</dim>
10
  </port>
11
  </output>
12
  </layer>
13
+ <layer id="1" name="Convert_184686" type="Convert" version="opset1">
14
  <data destination_type="i32" />
15
  <input>
16
  <port id="0" precision="I64">
 
25
  </port>
26
  </output>
27
  </layer>
28
+ <layer id="2" name="Constant_184640" type="Const" version="opset1">
29
+ <data element_type="u8" shape="514030" offset="0" size="514030" />
30
  <output>
31
  <port id="0" precision="U8">
32
+ <dim>514030</dim>
33
  </port>
34
  </output>
35
  </layer>
36
+ <layer id="3" name="StringTensorUnpack_184641" type="StringTensorUnpack" version="extension">
37
  <data mode="begins_ends" />
38
  <input>
39
  <port id="0" precision="U8">
40
+ <dim>514030</dim>
41
  </port>
42
  </input>
43
  <output>
 
52
  </port>
53
  </output>
54
  </layer>
55
+ <layer id="4" name="VocabDecoder_184671" type="VocabDecoder" version="extension">
56
  <data skip_tokens="0, 1" />
57
  <input>
58
  <port id="0" precision="I32">
 
87
  </port>
88
  </output>
89
  </layer>
90
+ <layer id="5" name="FuzeRagged_184672" type="FuzeRagged" version="extension">
91
  <input>
92
  <port id="0" precision="I32">
93
  <dim>-1</dim>
 
101
  <port id="3" precision="I32">
102
  <dim>-1</dim>
103
  </port>
 
 
 
104
  </input>
105
  <output>
106
+ <port id="4" precision="I32">
 
 
 
107
  <dim>-1</dim>
108
  </port>
109
+ <port id="5" precision="I32">
110
  <dim>-1</dim>
111
  </port>
112
  </output>
113
  </layer>
114
+ <layer id="6" name="Constant_184674" type="Const" version="opset1">
115
+ <data element_type="u8" shape="47" offset="514030" size="47" />
116
  <output>
117
  <port id="0" precision="U8">
118
  <dim>47</dim>
119
  </port>
120
  </output>
121
  </layer>
122
+ <layer id="7" name="Constant_184676" type="Const" version="opset1">
123
+ <data element_type="u8" shape="2" offset="514077" size="2" />
124
  <output>
125
  <port id="0" precision="U8">
126
  <dim>2</dim>
127
  </port>
128
  </output>
129
  </layer>
130
+ <layer id="8" name="RegexNormalization_184677" type="RegexNormalization" version="extension">
131
  <data global_replace="true" />
132
  <input>
133
  <port id="0" precision="I32">
 
158
  </port>
159
  </output>
160
  </layer>
161
+ <layer id="9" name="StringTensorPack_184678" type="StringTensorPack" version="extension">
162
  <data mode="begins_ends" />
163
  <input>
164
  <port id="0" precision="I32">
 
177
  </port>
178
  </output>
179
  </layer>
180
+ <layer id="10" name="Result_184679" type="Result" version="opset1">
181
  <input>
182
  <port id="0" precision="STRING">
183
  <dim>-1</dim>
 
192
  <edge from-layer="3" from-port="1" to-layer="4" to-port="1" />
193
  <edge from-layer="3" from-port="2" to-layer="4" to-port="2" />
194
  <edge from-layer="3" from-port="3" to-layer="4" to-port="3" />
 
195
  <edge from-layer="4" from-port="7" to-layer="5" to-port="3" />
196
+ <edge from-layer="4" from-port="8" to-layer="8" to-port="2" />
197
  <edge from-layer="4" from-port="6" to-layer="5" to-port="2" />
198
  <edge from-layer="4" from-port="5" to-layer="5" to-port="1" />
199
  <edge from-layer="4" from-port="4" to-layer="5" to-port="0" />
200
+ <edge from-layer="5" from-port="4" to-layer="8" to-port="0" />
201
+ <edge from-layer="5" from-port="5" to-layer="8" to-port="1" />
 
202
  <edge from-layer="6" from-port="0" to-layer="8" to-port="3" />
203
  <edge from-layer="7" from-port="0" to-layer="8" to-port="4" />
204
  <edge from-layer="8" from-port="5" to-layer="9" to-port="0" />
 
207
  <edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
208
  </edges>
209
  <rt_info>
210
+ <bos_token_id value="0" />
211
  <eos_token_id value="0" />
212
+ <original_tokenizer_class value="&lt;class 'transformers.models.gpt_neox.tokenization_gpt_neox_fast.GPTNeoXTokenizerFast'>" />
213
  </rt_info>
214
  </net>
openvino_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c5b22fd54f3e41ac3133a9234ee61e654baa23015c88ff27edb3310d0902dd0
3
- size 1828261828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:250bdb2ad15b87471f34f3d3ad7dae2d1a45b7aa1591337980ccda2303a33d8b
3
+ size 1569419208
openvino_model.xml CHANGED
The diff for this file is too large to render. See raw diff
 
openvino_tokenizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1c5d770015e1fce984bc6a141f757b4f614587eac66071423500855cce455c1
3
- size 1166215
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abf9aaae1d4e87049398cc549c6c7cc4d67f79ede0898ea8a5a0e28fd03ca521
3
+ size 1227768
openvino_tokenizer.xml CHANGED
@@ -1,21 +1,21 @@
1
  <?xml version="1.0"?>
2
  <net name="tokenizer" version="11">
3
  <layers>
4
- <layer id="0" name="Parameter_458065" type="Parameter" version="opset1">
5
  <data shape="?" element_type="string" />
6
  <output>
7
- <port id="0" precision="STRING" names="Parameter_458065">
8
  <dim>-1</dim>
9
  </port>
10
  </output>
11
  </layer>
12
- <layer id="1" name="Constant_458072" type="Const" version="opset1">
13
  <data element_type="i64" shape="" offset="0" size="8" />
14
  <output>
15
  <port id="0" precision="I64" />
16
  </output>
17
  </layer>
18
- <layer id="2" name="StringTensorUnpack_458066" type="StringTensorUnpack" version="extension">
19
  <data mode="begins_ends" />
20
  <input>
21
  <port id="0" precision="STRING">
@@ -34,32 +34,7 @@
34
  </port>
35
  </output>
36
  </layer>
37
- <layer id="3" name="NormalizeUnicode_458067" type="NormalizeUnicode" version="extension">
38
- <data normalization_form="NFC" />
39
- <input>
40
- <port id="0" precision="I32">
41
- <dim>-1</dim>
42
- </port>
43
- <port id="1" precision="I32">
44
- <dim>-1</dim>
45
- </port>
46
- <port id="2" precision="U8">
47
- <dim>-1</dim>
48
- </port>
49
- </input>
50
- <output>
51
- <port id="3" precision="I32">
52
- <dim>-1</dim>
53
- </port>
54
- <port id="4" precision="I32">
55
- <dim>-1</dim>
56
- </port>
57
- <port id="5" precision="U8">
58
- <dim>-1</dim>
59
- </port>
60
- </output>
61
- </layer>
62
- <layer id="4" name="ShapeOf_458068" type="ShapeOf" version="opset3">
63
  <data output_type="i64" />
64
  <input>
65
  <port id="0" precision="I32">
@@ -72,19 +47,19 @@
72
  </port>
73
  </output>
74
  </layer>
75
- <layer id="5" name="Constant_458069" type="Const" version="opset1">
76
  <data element_type="i64" shape="" offset="0" size="8" />
77
  <output>
78
  <port id="0" precision="I64" />
79
  </output>
80
  </layer>
81
- <layer id="6" name="Constant_458070" type="Const" version="opset1">
82
  <data element_type="i64" shape="" offset="0" size="8" />
83
  <output>
84
  <port id="0" precision="I64" />
85
  </output>
86
  </layer>
87
- <layer id="7" name="Gather_458071" type="Gather" version="opset8">
88
  <data batch_dims="0" />
89
  <input>
90
  <port id="0" precision="I64">
@@ -97,13 +72,13 @@
97
  <port id="3" precision="I64" />
98
  </output>
99
  </layer>
100
- <layer id="8" name="Constant_458073" type="Const" version="opset1">
101
  <data element_type="i64" shape="" offset="8" size="8" />
102
  <output>
103
  <port id="0" precision="I64" />
104
  </output>
105
  </layer>
106
- <layer id="9" name="Range_458074" type="Range" version="opset4">
107
  <data output_type="i32" />
108
  <input>
109
  <port id="0" precision="I64" />
@@ -116,19 +91,19 @@
116
  </port>
117
  </output>
118
  </layer>
119
- <layer id="10" name="Constant_458076" type="Const" version="opset1">
120
  <data element_type="i64" shape="" offset="8" size="8" />
121
  <output>
122
  <port id="0" precision="I64" />
123
  </output>
124
  </layer>
125
- <layer id="11" name="Constant_458077" type="Const" version="opset1">
126
  <data element_type="i64" shape="" offset="8" size="8" />
127
  <output>
128
  <port id="0" precision="I64" />
129
  </output>
130
  </layer>
131
- <layer id="12" name="Add_458078" type="Add" version="opset1">
132
  <data auto_broadcast="numpy" />
133
  <input>
134
  <port id="0" precision="I64" />
@@ -138,13 +113,13 @@
138
  <port id="2" precision="I64" />
139
  </output>
140
  </layer>
141
- <layer id="13" name="Constant_458079" type="Const" version="opset1">
142
  <data element_type="i64" shape="" offset="8" size="8" />
143
  <output>
144
  <port id="0" precision="I64" />
145
  </output>
146
  </layer>
147
- <layer id="14" name="Range_458080" type="Range" version="opset4">
148
  <data output_type="i32" />
149
  <input>
150
  <port id="0" precision="I64" />
@@ -157,16 +132,15 @@
157
  </port>
158
  </output>
159
  </layer>
160
- <layer id="15" name="Constant_458143" type="Const" version="opset1">
161
- <data element_type="u8" shape="620" offset="16" size="620" />
162
  <output>
163
  <port id="0" precision="U8">
164
- <dim>620</dim>
165
  </port>
166
  </output>
167
  </layer>
168
- <layer id="16" name="RegexSplit_458144" type="RegexSplit" version="extension">
169
- <data behaviour="isolate" invert="false" max_splits="-1" />
170
  <input>
171
  <port id="0" precision="I32">
172
  <dim>-1</dim>
@@ -184,7 +158,7 @@
184
  <dim>-1</dim>
185
  </port>
186
  <port id="5" precision="U8">
187
- <dim>620</dim>
188
  </port>
189
  </input>
190
  <output>
@@ -203,45 +177,13 @@
203
  <port id="10" precision="U8">
204
  <dim>-1</dim>
205
  </port>
206
- </output>
207
- </layer>
208
- <layer id="17" name="Constant_458149" type="Const" version="opset1">
209
- <data element_type="u8" shape="64" offset="636" size="64" />
210
- <output>
211
- <port id="0" precision="U8">
212
- <dim>64</dim>
213
- </port>
214
- </output>
215
- </layer>
216
- <layer id="18" name="Constant_458146" type="Const" version="opset1">
217
- <data element_type="u8" shape="399" offset="700" size="399" />
218
- <output>
219
- <port id="0" precision="U8">
220
- <dim>399</dim>
221
- </port>
222
- </output>
223
- </layer>
224
- <layer id="19" name="StringTensorUnpack_458147" type="StringTensorUnpack" version="extension">
225
- <data mode="begins_ends" />
226
- <input>
227
- <port id="0" precision="U8">
228
- <dim>399</dim>
229
- </port>
230
- </input>
231
- <output>
232
- <port id="1" precision="I32">
233
- <dim>-1</dim>
234
- </port>
235
- <port id="2" precision="I32">
236
- <dim>-1</dim>
237
- </port>
238
- <port id="3" precision="U8">
239
  <dim>-1</dim>
240
  </port>
241
  </output>
242
  </layer>
243
- <layer id="20" name="RegexSplit_458150" type="RegexSplit" version="extension">
244
- <data behaviour="isolate" invert="false" max_splits="-1" />
245
  <input>
246
  <port id="0" precision="I32">
247
  <dim>-1</dim>
@@ -249,47 +191,38 @@
249
  <port id="1" precision="I32">
250
  <dim>-1</dim>
251
  </port>
252
- <port id="2" precision="I32">
253
- <dim>-1</dim>
254
- </port>
255
- <port id="3" precision="I32">
256
- <dim>-1</dim>
257
- </port>
258
- <port id="4" precision="U8">
259
- <dim>-1</dim>
260
- </port>
261
- <port id="5" precision="U8">
262
- <dim>64</dim>
263
- </port>
264
- <port id="6" precision="I32">
265
- <dim>-1</dim>
266
- </port>
267
- <port id="7" precision="I32">
268
  <dim>-1</dim>
269
  </port>
270
- <port id="8" precision="U8">
271
  <dim>-1</dim>
272
  </port>
273
  </input>
274
  <output>
275
- <port id="9" precision="I32">
276
  <dim>-1</dim>
277
  </port>
278
- <port id="10" precision="I32">
279
  <dim>-1</dim>
280
  </port>
281
- <port id="11" precision="I32">
282
  <dim>-1</dim>
283
  </port>
284
- <port id="12" precision="I32">
285
  <dim>-1</dim>
286
  </port>
287
- <port id="13" precision="U8">
288
- <dim>-1</dim>
 
 
 
 
 
289
  </port>
290
  </output>
291
  </layer>
292
- <layer id="21" name="BytesToChars_458151" type="BytesToChars" version="extension">
 
293
  <input>
294
  <port id="0" precision="I32">
295
  <dim>-1</dim>
@@ -306,38 +239,47 @@
306
  <port id="4" precision="U8">
307
  <dim>-1</dim>
308
  </port>
 
 
 
 
 
 
309
  </input>
310
  <output>
311
- <port id="5" precision="I32">
312
  <dim>-1</dim>
313
  </port>
314
- <port id="6" precision="I32">
315
  <dim>-1</dim>
316
  </port>
317
- <port id="7" precision="I32">
318
  <dim>-1</dim>
319
  </port>
320
- <port id="8" precision="I32">
321
  <dim>-1</dim>
322
  </port>
323
- <port id="9" precision="U8">
 
 
 
324
  <dim>-1</dim>
325
  </port>
326
  </output>
327
  </layer>
328
- <layer id="22" name="Constant_458153" type="Const" version="opset1">
329
- <data element_type="u8" shape="558397" offset="1099" size="558397" />
330
  <output>
331
  <port id="0" precision="U8">
332
- <dim>558397</dim>
333
  </port>
334
  </output>
335
  </layer>
336
- <layer id="23" name="StringTensorUnpack_458154" type="StringTensorUnpack" version="extension">
337
  <data mode="begins_ends" />
338
  <input>
339
  <port id="0" precision="U8">
340
- <dim>558397</dim>
341
  </port>
342
  </input>
343
  <output>
@@ -352,19 +294,19 @@
352
  </port>
353
  </output>
354
  </layer>
355
- <layer id="24" name="Constant_458234" type="Const" version="opset1">
356
- <data element_type="u8" shape="606619" offset="559496" size="606619" />
357
  <output>
358
  <port id="0" precision="U8">
359
- <dim>606619</dim>
360
  </port>
361
  </output>
362
  </layer>
363
- <layer id="25" name="StringTensorUnpack_458235" type="StringTensorUnpack" version="extension">
364
  <data mode="begins_ends" />
365
  <input>
366
  <port id="0" precision="U8">
367
- <dim>606619</dim>
368
  </port>
369
  </input>
370
  <output>
@@ -379,25 +321,19 @@
379
  </port>
380
  </output>
381
  </layer>
382
- <layer id="26" name="Constant_458162" type="Const" version="opset1">
383
- <data element_type="i64" shape="" offset="0" size="8" />
384
- <output>
385
- <port id="0" precision="I64" />
386
- </output>
387
- </layer>
388
- <layer id="27" name="Constant_458156" type="Const" version="opset1">
389
- <data element_type="u8" shape="399" offset="700" size="399" />
390
  <output>
391
  <port id="0" precision="U8">
392
- <dim>399</dim>
393
  </port>
394
  </output>
395
  </layer>
396
- <layer id="28" name="StringTensorUnpack_458157" type="StringTensorUnpack" version="extension">
397
  <data mode="begins_ends" />
398
  <input>
399
  <port id="0" precision="U8">
400
- <dim>399</dim>
401
  </port>
402
  </input>
403
  <output>
@@ -412,150 +348,43 @@
412
  </port>
413
  </output>
414
  </layer>
415
- <layer id="29" name="ShapeOf_458158" type="ShapeOf" version="opset3">
416
- <data output_type="i64" />
417
- <input>
418
- <port id="0" precision="I32">
419
- <dim>-1</dim>
420
- </port>
421
- </input>
422
- <output>
423
- <port id="1" precision="I64">
424
- <dim>1</dim>
425
- </port>
426
- </output>
427
- </layer>
428
- <layer id="30" name="Constant_458159" type="Const" version="opset1">
429
- <data element_type="i64" shape="" offset="0" size="8" />
430
- <output>
431
- <port id="0" precision="I64" />
432
- </output>
433
- </layer>
434
- <layer id="31" name="Constant_458160" type="Const" version="opset1">
435
- <data element_type="i64" shape="" offset="0" size="8" />
436
  <output>
437
- <port id="0" precision="I64" />
438
- </output>
439
- </layer>
440
- <layer id="32" name="Gather_458161" type="Gather" version="opset8">
441
- <data batch_dims="0" />
442
- <input>
443
- <port id="0" precision="I64">
444
- <dim>1</dim>
445
  </port>
446
- <port id="1" precision="I64" />
447
- <port id="2" precision="I64" />
448
- </input>
449
- <output>
450
- <port id="3" precision="I64" />
451
  </output>
452
  </layer>
453
- <layer id="33" name="Constant_458163" type="Const" version="opset1">
454
- <data element_type="i64" shape="" offset="8" size="8" />
455
- <output>
456
- <port id="0" precision="I64" />
457
- </output>
458
- </layer>
459
- <layer id="34" name="Range_458164" type="Range" version="opset4">
460
- <data output_type="i32" />
461
  <input>
462
- <port id="0" precision="I64" />
463
- <port id="1" precision="I64" />
464
- <port id="2" precision="I64" />
465
- </input>
466
- <output>
467
- <port id="3" precision="I32">
468
- <dim>-1</dim>
469
  </port>
470
- </output>
471
- </layer>
472
- <layer id="35" name="Constant_458166" type="Const" version="opset1">
473
- <data element_type="i64" shape="" offset="8" size="8" />
474
- <output>
475
- <port id="0" precision="I64" />
476
- </output>
477
- </layer>
478
- <layer id="36" name="Constant_458167" type="Const" version="opset1">
479
- <data element_type="i64" shape="" offset="8" size="8" />
480
- <output>
481
- <port id="0" precision="I64" />
482
- </output>
483
- </layer>
484
- <layer id="37" name="Add_458168" type="Add" version="opset1">
485
- <data auto_broadcast="numpy" />
486
- <input>
487
- <port id="0" precision="I64" />
488
- <port id="1" precision="I64" />
489
  </input>
490
  <output>
491
- <port id="2" precision="I64" />
492
- </output>
493
- </layer>
494
- <layer id="38" name="Constant_458169" type="Const" version="opset1">
495
- <data element_type="i64" shape="" offset="8" size="8" />
496
- <output>
497
- <port id="0" precision="I64" />
498
- </output>
499
- </layer>
500
- <layer id="39" name="Range_458170" type="Range" version="opset4">
501
- <data output_type="i32" />
502
- <input>
503
- <port id="0" precision="I64" />
504
- <port id="1" precision="I64" />
505
- <port id="2" precision="I64" />
506
- </input>
507
- <output>
508
- <port id="3" precision="I32">
509
- <dim>-1</dim>
510
- </port>
511
- </output>
512
- </layer>
513
- <layer id="40" name="BytesToChars_458232" type="BytesToChars" version="extension">
514
- <input>
515
- <port id="0" precision="I32">
516
- <dim>-1</dim>
517
- </port>
518
  <port id="1" precision="I32">
519
  <dim>-1</dim>
520
  </port>
521
  <port id="2" precision="I32">
522
  <dim>-1</dim>
523
  </port>
524
- <port id="3" precision="I32">
525
- <dim>-1</dim>
526
- </port>
527
- <port id="4" precision="U8">
528
- <dim>-1</dim>
529
- </port>
530
- </input>
531
- <output>
532
- <port id="5" precision="I32">
533
- <dim>-1</dim>
534
- </port>
535
- <port id="6" precision="I32">
536
- <dim>-1</dim>
537
- </port>
538
- <port id="7" precision="I32">
539
- <dim>-1</dim>
540
- </port>
541
- <port id="8" precision="I32">
542
- <dim>-1</dim>
543
- </port>
544
- <port id="9" precision="U8">
545
  <dim>-1</dim>
546
  </port>
547
  </output>
548
  </layer>
549
- <layer id="41" name="Constant_458236" type="Const" version="opset1">
550
- <data element_type="i32" shape="23" offset="1166115" size="92" />
551
  <output>
552
  <port id="0" precision="I32">
553
- <dim>23</dim>
554
  </port>
555
  </output>
556
  </layer>
557
- <layer id="42" name="BPETokenizer_458237" type="BPETokenizer" version="extension">
558
- <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" />
559
  <input>
560
  <port id="0" precision="I32">
561
  <dim>-1</dim>
@@ -600,22 +429,31 @@
600
  <dim>-1</dim>
601
  </port>
602
  <port id="14" precision="I32">
603
- <dim>23</dim>
604
  </port>
605
- </input>
606
- <output>
607
  <port id="15" precision="I32">
608
  <dim>-1</dim>
609
  </port>
610
- <port id="16" precision="I32">
611
  <dim>-1</dim>
612
  </port>
613
  <port id="17" precision="I32">
 
 
 
 
 
 
 
 
 
 
 
614
  <dim>-1</dim>
615
  </port>
616
  </output>
617
  </layer>
618
- <layer id="43" name="Subtract_458238" type="Subtract" version="opset1">
619
  <data auto_broadcast="numpy" />
620
  <input>
621
  <port id="0" precision="I32">
@@ -631,13 +469,13 @@
631
  </port>
632
  </output>
633
  </layer>
634
- <layer id="44" name="Constant_458239" type="Const" version="opset1">
635
- <data element_type="i32" shape="" offset="1166207" size="4" />
636
  <output>
637
  <port id="0" precision="I32" />
638
  </output>
639
  </layer>
640
- <layer id="45" name="Minimum_458240" type="Minimum" version="opset1">
641
  <data auto_broadcast="numpy" />
642
  <input>
643
  <port id="0" precision="I32">
@@ -651,7 +489,7 @@
651
  </port>
652
  </output>
653
  </layer>
654
- <layer id="46" name="Add_458241" type="Add" version="opset1">
655
  <data auto_broadcast="numpy" />
656
  <input>
657
  <port id="0" precision="I32">
@@ -667,15 +505,15 @@
667
  </port>
668
  </output>
669
  </layer>
670
- <layer id="47" name="Constant_458242" type="Const" version="opset1">
671
- <data element_type="i32" shape="1" offset="1166211" size="4" />
672
  <output>
673
  <port id="0" precision="I32">
674
  <dim>1</dim>
675
  </port>
676
  </output>
677
  </layer>
678
- <layer id="48" name="CombineSegments_458243" type="CombineSegments" version="extension">
679
  <input>
680
  <port id="0" precision="I32">
681
  <dim>-1</dim>
@@ -711,7 +549,7 @@
711
  </port>
712
  </output>
713
  </layer>
714
- <layer id="49" name="Subtract_458244" type="Subtract" version="opset1">
715
  <data auto_broadcast="numpy" />
716
  <input>
717
  <port id="0" precision="I32">
@@ -727,13 +565,13 @@
727
  </port>
728
  </output>
729
  </layer>
730
- <layer id="50" name="Constant_458245" type="Const" version="opset1">
731
- <data element_type="i32" shape="" offset="1166211" size="4" />
732
  <output>
733
  <port id="0" precision="I32" />
734
  </output>
735
  </layer>
736
- <layer id="51" name="ReduceMax_458246" type="ReduceMax" version="opset1">
737
  <data keep_dims="false" />
738
  <input>
739
  <port id="0" precision="I32">
@@ -745,14 +583,14 @@
745
  <port id="2" precision="I32" />
746
  </output>
747
  </layer>
748
- <layer id="52" name="Constant_458247" type="Const" version="opset1">
749
- <data element_type="i32" shape="" offset="1166211" size="4" />
750
  <output>
751
  <port id="0" precision="I32" />
752
  </output>
753
  </layer>
754
- <layer id="53" name="RaggedToDense_458248" type="RaggedToDense" version="extension">
755
- <data pad_right="true" />
756
  <input>
757
  <port id="0" precision="I32">
758
  <dim>-1</dim>
@@ -777,7 +615,7 @@
777
  </port>
778
  </output>
779
  </layer>
780
- <layer id="54" name="Convert_458249" type="Convert" version="opset1">
781
  <data destination_type="i32" />
782
  <input>
783
  <port id="0" precision="BOOL">
@@ -792,7 +630,7 @@
792
  </port>
793
  </output>
794
  </layer>
795
- <layer id="55" name="Convert_458249" type="Convert" version="opset1">
796
  <data destination_type="i64" />
797
  <input>
798
  <port id="0" precision="I32">
@@ -807,7 +645,7 @@
807
  </port>
808
  </output>
809
  </layer>
810
- <layer id="57" name="RaggedToDense_458248.0" type="Convert" version="opset1">
811
  <data destination_type="i64" />
812
  <input>
813
  <port id="0" precision="I32">
@@ -822,7 +660,7 @@
822
  </port>
823
  </output>
824
  </layer>
825
- <layer id="58" name="Result_458252" type="Result" version="opset1">
826
  <input>
827
  <port id="0" precision="I64">
828
  <dim>-1</dim>
@@ -830,7 +668,7 @@
830
  </port>
831
  </input>
832
  </layer>
833
- <layer id="56" name="Result_458254" type="Result" version="opset1">
834
  <input>
835
  <port id="0" precision="I64">
836
  <dim>-1</dim>
@@ -841,103 +679,85 @@
841
  </layers>
842
  <edges>
843
  <edge from-layer="0" from-port="0" to-layer="2" to-port="0" />
844
- <edge from-layer="1" from-port="0" to-layer="9" to-port="0" />
845
  <edge from-layer="2" from-port="1" to-layer="3" to-port="0" />
846
- <edge from-layer="2" from-port="2" to-layer="3" to-port="1" />
847
- <edge from-layer="2" from-port="3" to-layer="3" to-port="2" />
848
- <edge from-layer="3" from-port="5" to-layer="16" to-port="4" />
849
- <edge from-layer="3" from-port="4" to-layer="16" to-port="3" />
850
- <edge from-layer="3" from-port="3" to-layer="16" to-port="2" />
851
- <edge from-layer="3" from-port="3" to-layer="4" to-port="0" />
852
- <edge from-layer="4" from-port="1" to-layer="7" to-port="0" />
853
- <edge from-layer="5" from-port="0" to-layer="7" to-port="1" />
854
- <edge from-layer="6" from-port="0" to-layer="7" to-port="2" />
855
- <edge from-layer="7" from-port="3" to-layer="9" to-port="1" />
856
- <edge from-layer="7" from-port="3" to-layer="12" to-port="0" />
857
- <edge from-layer="8" from-port="0" to-layer="9" to-port="2" />
858
- <edge from-layer="9" from-port="3" to-layer="16" to-port="0" />
859
- <edge from-layer="10" from-port="0" to-layer="14" to-port="0" />
860
- <edge from-layer="11" from-port="0" to-layer="12" to-port="1" />
861
- <edge from-layer="12" from-port="2" to-layer="14" to-port="1" />
862
- <edge from-layer="13" from-port="0" to-layer="14" to-port="2" />
863
- <edge from-layer="14" from-port="3" to-layer="16" to-port="1" />
864
- <edge from-layer="15" from-port="0" to-layer="16" to-port="5" />
865
- <edge from-layer="16" from-port="6" to-layer="20" to-port="0" />
866
- <edge from-layer="16" from-port="7" to-layer="20" to-port="1" />
867
- <edge from-layer="16" from-port="8" to-layer="20" to-port="2" />
868
- <edge from-layer="16" from-port="9" to-layer="20" to-port="3" />
869
- <edge from-layer="16" from-port="10" to-layer="20" to-port="4" />
870
- <edge from-layer="17" from-port="0" to-layer="20" to-port="5" />
871
- <edge from-layer="18" from-port="0" to-layer="19" to-port="0" />
872
- <edge from-layer="19" from-port="1" to-layer="20" to-port="6" />
873
- <edge from-layer="19" from-port="2" to-layer="20" to-port="7" />
874
- <edge from-layer="19" from-port="3" to-layer="20" to-port="8" />
875
- <edge from-layer="20" from-port="9" to-layer="21" to-port="0" />
876
- <edge from-layer="20" from-port="13" to-layer="21" to-port="4" />
877
- <edge from-layer="20" from-port="12" to-layer="21" to-port="3" />
878
- <edge from-layer="20" from-port="10" to-layer="21" to-port="1" />
879
- <edge from-layer="20" from-port="11" to-layer="21" to-port="2" />
880
- <edge from-layer="21" from-port="9" to-layer="42" to-port="4" />
881
- <edge from-layer="21" from-port="8" to-layer="42" to-port="3" />
882
- <edge from-layer="21" from-port="7" to-layer="42" to-port="2" />
883
- <edge from-layer="21" from-port="6" to-layer="42" to-port="1" />
884
- <edge from-layer="21" from-port="5" to-layer="42" to-port="0" />
885
- <edge from-layer="22" from-port="0" to-layer="23" to-port="0" />
886
- <edge from-layer="23" from-port="3" to-layer="42" to-port="7" />
887
- <edge from-layer="23" from-port="2" to-layer="42" to-port="6" />
888
- <edge from-layer="23" from-port="1" to-layer="42" to-port="5" />
889
- <edge from-layer="24" from-port="0" to-layer="25" to-port="0" />
890
- <edge from-layer="25" from-port="3" to-layer="42" to-port="10" />
891
- <edge from-layer="25" from-port="2" to-layer="42" to-port="9" />
892
- <edge from-layer="25" from-port="1" to-layer="42" to-port="8" />
893
- <edge from-layer="26" from-port="0" to-layer="34" to-port="0" />
894
- <edge from-layer="27" from-port="0" to-layer="28" to-port="0" />
895
- <edge from-layer="28" from-port="2" to-layer="40" to-port="3" />
896
- <edge from-layer="28" from-port="1" to-layer="29" to-port="0" />
897
- <edge from-layer="28" from-port="3" to-layer="40" to-port="4" />
898
- <edge from-layer="28" from-port="1" to-layer="40" to-port="2" />
899
- <edge from-layer="29" from-port="1" to-layer="32" to-port="0" />
900
- <edge from-layer="30" from-port="0" to-layer="32" to-port="1" />
901
- <edge from-layer="31" from-port="0" to-layer="32" to-port="2" />
902
- <edge from-layer="32" from-port="3" to-layer="34" to-port="1" />
903
- <edge from-layer="32" from-port="3" to-layer="37" to-port="0" />
904
- <edge from-layer="33" from-port="0" to-layer="34" to-port="2" />
905
- <edge from-layer="34" from-port="3" to-layer="40" to-port="0" />
906
- <edge from-layer="35" from-port="0" to-layer="39" to-port="0" />
 
 
 
 
907
  <edge from-layer="36" from-port="0" to-layer="37" to-port="1" />
908
- <edge from-layer="37" from-port="2" to-layer="39" to-port="1" />
909
- <edge from-layer="38" from-port="0" to-layer="39" to-port="2" />
910
- <edge from-layer="39" from-port="3" to-layer="40" to-port="1" />
911
- <edge from-layer="40" from-port="7" to-layer="42" to-port="11" />
912
- <edge from-layer="40" from-port="8" to-layer="42" to-port="12" />
913
- <edge from-layer="40" from-port="9" to-layer="42" to-port="13" />
914
- <edge from-layer="41" from-port="0" to-layer="42" to-port="14" />
915
- <edge from-layer="42" from-port="17" to-layer="48" to-port="2" />
916
- <edge from-layer="42" from-port="15" to-layer="48" to-port="0" />
917
- <edge from-layer="42" from-port="15" to-layer="46" to-port="0" />
918
- <edge from-layer="42" from-port="15" to-layer="43" to-port="1" />
919
- <edge from-layer="42" from-port="16" to-layer="43" to-port="0" />
920
- <edge from-layer="43" from-port="2" to-layer="45" to-port="0" />
921
- <edge from-layer="44" from-port="0" to-layer="45" to-port="1" />
922
- <edge from-layer="45" from-port="2" to-layer="46" to-port="1" />
923
- <edge from-layer="46" from-port="2" to-layer="48" to-port="1" />
924
- <edge from-layer="47" from-port="0" to-layer="48" to-port="3" />
925
- <edge from-layer="48" from-port="5" to-layer="49" to-port="0" />
926
- <edge from-layer="48" from-port="4" to-layer="49" to-port="1" />
927
- <edge from-layer="48" from-port="4" to-layer="53" to-port="0" />
928
- <edge from-layer="48" from-port="5" to-layer="53" to-port="1" />
929
- <edge from-layer="48" from-port="6" to-layer="53" to-port="2" />
930
- <edge from-layer="49" from-port="2" to-layer="51" to-port="0" />
931
- <edge from-layer="50" from-port="0" to-layer="51" to-port="1" />
932
- <edge from-layer="51" from-port="2" to-layer="53" to-port="3" />
933
- <edge from-layer="52" from-port="0" to-layer="53" to-port="4" />
934
- <edge from-layer="53" from-port="6" to-layer="54" to-port="0" />
935
- <edge from-layer="53" from-port="5" to-layer="57" to-port="0" />
936
- <edge from-layer="54" from-port="1" to-layer="55" to-port="0" />
937
- <edge from-layer="55" from-port="1" to-layer="56" to-port="0" />
938
- <edge from-layer="57" from-port="1" to-layer="58" to-port="0" />
939
  </edges>
940
  <rt_info>
 
941
  <eos_token_id value="0" />
 
942
  </rt_info>
943
  </net>
 
1
  <?xml version="1.0"?>
2
  <net name="tokenizer" version="11">
3
  <layers>
4
+ <layer id="0" name="Parameter_184558" type="Parameter" version="opset1">
5
  <data shape="?" element_type="string" />
6
  <output>
7
+ <port id="0" precision="STRING" names="Parameter_184558">
8
  <dim>-1</dim>
9
  </port>
10
  </output>
11
  </layer>
12
+ <layer id="1" name="Constant_184564" type="Const" version="opset1">
13
  <data element_type="i64" shape="" offset="0" size="8" />
14
  <output>
15
  <port id="0" precision="I64" />
16
  </output>
17
  </layer>
18
+ <layer id="2" name="StringTensorUnpack_184559" type="StringTensorUnpack" version="extension">
19
  <data mode="begins_ends" />
20
  <input>
21
  <port id="0" precision="STRING">
 
34
  </port>
35
  </output>
36
  </layer>
37
+ <layer id="3" name="ShapeOf_184560" type="ShapeOf" version="opset3">
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  <data output_type="i64" />
39
  <input>
40
  <port id="0" precision="I32">
 
47
  </port>
48
  </output>
49
  </layer>
50
+ <layer id="4" name="Constant_184561" type="Const" version="opset1">
51
  <data element_type="i64" shape="" offset="0" size="8" />
52
  <output>
53
  <port id="0" precision="I64" />
54
  </output>
55
  </layer>
56
+ <layer id="5" name="Constant_184562" type="Const" version="opset1">
57
  <data element_type="i64" shape="" offset="0" size="8" />
58
  <output>
59
  <port id="0" precision="I64" />
60
  </output>
61
  </layer>
62
+ <layer id="6" name="Gather_184563" type="Gather" version="opset8">
63
  <data batch_dims="0" />
64
  <input>
65
  <port id="0" precision="I64">
 
72
  <port id="3" precision="I64" />
73
  </output>
74
  </layer>
75
+ <layer id="7" name="Constant_184565" type="Const" version="opset1">
76
  <data element_type="i64" shape="" offset="8" size="8" />
77
  <output>
78
  <port id="0" precision="I64" />
79
  </output>
80
  </layer>
81
+ <layer id="8" name="Range_184566" type="Range" version="opset4">
82
  <data output_type="i32" />
83
  <input>
84
  <port id="0" precision="I64" />
 
91
  </port>
92
  </output>
93
  </layer>
94
+ <layer id="9" name="Constant_184567" type="Const" version="opset1">
95
  <data element_type="i64" shape="" offset="8" size="8" />
96
  <output>
97
  <port id="0" precision="I64" />
98
  </output>
99
  </layer>
100
+ <layer id="10" name="Constant_184568" type="Const" version="opset1">
101
  <data element_type="i64" shape="" offset="8" size="8" />
102
  <output>
103
  <port id="0" precision="I64" />
104
  </output>
105
  </layer>
106
+ <layer id="11" name="Add_184569" type="Add" version="opset1">
107
  <data auto_broadcast="numpy" />
108
  <input>
109
  <port id="0" precision="I64" />
 
113
  <port id="2" precision="I64" />
114
  </output>
115
  </layer>
116
+ <layer id="12" name="Constant_184570" type="Const" version="opset1">
117
  <data element_type="i64" shape="" offset="8" size="8" />
118
  <output>
119
  <port id="0" precision="I64" />
120
  </output>
121
  </layer>
122
+ <layer id="13" name="Range_184571" type="Range" version="opset4">
123
  <data output_type="i32" />
124
  <input>
125
  <port id="0" precision="I64" />
 
132
  </port>
133
  </output>
134
  </layer>
135
+ <layer id="14" name="Constant_184633" type="Const" version="opset1">
136
+ <data element_type="u8" shape="704" offset="16" size="704" />
137
  <output>
138
  <port id="0" precision="U8">
139
+ <dim>704</dim>
140
  </port>
141
  </output>
142
  </layer>
143
+ <layer id="15" name="SpecialTokensSplit_184634" type="SpecialTokensSplit" version="extension">
 
144
  <input>
145
  <port id="0" precision="I32">
146
  <dim>-1</dim>
 
158
  <dim>-1</dim>
159
  </port>
160
  <port id="5" precision="U8">
161
+ <dim>704</dim>
162
  </port>
163
  </input>
164
  <output>
 
177
  <port id="10" precision="U8">
178
  <dim>-1</dim>
179
  </port>
180
+ <port id="11" precision="BOOL">
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
181
  <dim>-1</dim>
182
  </port>
183
  </output>
184
  </layer>
185
+ <layer id="16" name="NormalizeUnicode_184635" type="NormalizeUnicode" version="extension">
186
+ <data normalization_form="NFC" />
187
  <input>
188
  <port id="0" precision="I32">
189
  <dim>-1</dim>
 
191
  <port id="1" precision="I32">
192
  <dim>-1</dim>
193
  </port>
194
+ <port id="2" precision="U8">
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
195
  <dim>-1</dim>
196
  </port>
197
+ <port id="3" precision="BOOL">
198
  <dim>-1</dim>
199
  </port>
200
  </input>
201
  <output>
202
+ <port id="4" precision="I32">
203
  <dim>-1</dim>
204
  </port>
205
+ <port id="5" precision="I32">
206
  <dim>-1</dim>
207
  </port>
208
+ <port id="6" precision="U8">
209
  <dim>-1</dim>
210
  </port>
211
+ <port id="7" precision="BOOL">
212
  <dim>-1</dim>
213
  </port>
214
+ </output>
215
+ </layer>
216
+ <layer id="17" name="Constant_184637" type="Const" version="opset1">
217
+ <data element_type="u8" shape="64" offset="720" size="64" />
218
+ <output>
219
+ <port id="0" precision="U8">
220
+ <dim>64</dim>
221
  </port>
222
  </output>
223
  </layer>
224
+ <layer id="18" name="RegexSplit_184638" type="RegexSplit" version="extension">
225
+ <data behaviour="isolate" invert="false" max_splits="-1" />
226
  <input>
227
  <port id="0" precision="I32">
228
  <dim>-1</dim>
 
239
  <port id="4" precision="U8">
240
  <dim>-1</dim>
241
  </port>
242
+ <port id="5" precision="BOOL">
243
+ <dim>-1</dim>
244
+ </port>
245
+ <port id="6" precision="U8">
246
+ <dim>64</dim>
247
+ </port>
248
  </input>
249
  <output>
250
+ <port id="7" precision="I32">
251
  <dim>-1</dim>
252
  </port>
253
+ <port id="8" precision="I32">
254
  <dim>-1</dim>
255
  </port>
256
+ <port id="9" precision="I32">
257
  <dim>-1</dim>
258
  </port>
259
+ <port id="10" precision="I32">
260
  <dim>-1</dim>
261
  </port>
262
+ <port id="11" precision="U8">
263
+ <dim>-1</dim>
264
+ </port>
265
+ <port id="12" precision="BOOL">
266
  <dim>-1</dim>
267
  </port>
268
  </output>
269
  </layer>
270
+ <layer id="19" name="Constant_184640" type="Const" version="opset1">
271
+ <data element_type="u8" shape="514030" offset="784" size="514030" />
272
  <output>
273
  <port id="0" precision="U8">
274
+ <dim>514030</dim>
275
  </port>
276
  </output>
277
  </layer>
278
+ <layer id="20" name="StringTensorUnpack_184641" type="StringTensorUnpack" version="extension">
279
  <data mode="begins_ends" />
280
  <input>
281
  <port id="0" precision="U8">
282
+ <dim>514030</dim>
283
  </port>
284
  </input>
285
  <output>
 
294
  </port>
295
  </output>
296
  </layer>
297
+ <layer id="21" name="Constant_184646" type="Const" version="opset1">
298
+ <data element_type="u8" shape="362936" offset="514814" size="362936" />
299
  <output>
300
  <port id="0" precision="U8">
301
+ <dim>362936</dim>
302
  </port>
303
  </output>
304
  </layer>
305
+ <layer id="22" name="StringTensorUnpack_184647" type="StringTensorUnpack" version="extension">
306
  <data mode="begins_ends" />
307
  <input>
308
  <port id="0" precision="U8">
309
+ <dim>362936</dim>
310
  </port>
311
  </input>
312
  <output>
 
321
  </port>
322
  </output>
323
  </layer>
324
+ <layer id="23" name="Constant_184649" type="Const" version="opset1">
325
+ <data element_type="u8" shape="349500" offset="877750" size="349500" />
 
 
 
 
 
 
326
  <output>
327
  <port id="0" precision="U8">
328
+ <dim>349500</dim>
329
  </port>
330
  </output>
331
  </layer>
332
+ <layer id="24" name="StringTensorUnpack_184650" type="StringTensorUnpack" version="extension">
333
  <data mode="begins_ends" />
334
  <input>
335
  <port id="0" precision="U8">
336
+ <dim>349500</dim>
337
  </port>
338
  </input>
339
  <output>
 
348
  </port>
349
  </output>
350
  </layer>
351
+ <layer id="25" name="Constant_184643" type="Const" version="opset1">
352
+ <data element_type="u8" shape="414" offset="1227250" size="414" />
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
353
  <output>
354
+ <port id="0" precision="U8">
355
+ <dim>414</dim>
 
 
 
 
 
 
356
  </port>
 
 
 
 
 
357
  </output>
358
  </layer>
359
+ <layer id="26" name="StringTensorUnpack_184644" type="StringTensorUnpack" version="extension">
360
+ <data mode="begins_ends" />
 
 
 
 
 
 
361
  <input>
362
+ <port id="0" precision="U8">
363
+ <dim>414</dim>
 
 
 
 
 
364
  </port>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
365
  </input>
366
  <output>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
367
  <port id="1" precision="I32">
368
  <dim>-1</dim>
369
  </port>
370
  <port id="2" precision="I32">
371
  <dim>-1</dim>
372
  </port>
373
+ <port id="3" precision="U8">
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
374
  <dim>-1</dim>
375
  </port>
376
  </output>
377
  </layer>
378
+ <layer id="27" name="Constant_184651" type="Const" version="opset1">
379
+ <data element_type="i32" shape="24" offset="1227664" size="96" />
380
  <output>
381
  <port id="0" precision="I32">
382
+ <dim>24</dim>
383
  </port>
384
  </output>
385
  </layer>
386
+ <layer id="28" name="BPETokenizer_184652" type="BPETokenizer" version="extension">
387
+ <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
388
  <input>
389
  <port id="0" precision="I32">
390
  <dim>-1</dim>
 
429
  <dim>-1</dim>
430
  </port>
431
  <port id="14" precision="I32">
432
+ <dim>-1</dim>
433
  </port>
 
 
434
  <port id="15" precision="I32">
435
  <dim>-1</dim>
436
  </port>
437
+ <port id="16" precision="U8">
438
  <dim>-1</dim>
439
  </port>
440
  <port id="17" precision="I32">
441
+ <dim>24</dim>
442
+ </port>
443
+ </input>
444
+ <output>
445
+ <port id="18" precision="I32">
446
+ <dim>-1</dim>
447
+ </port>
448
+ <port id="19" precision="I32">
449
+ <dim>-1</dim>
450
+ </port>
451
+ <port id="20" precision="I32">
452
  <dim>-1</dim>
453
  </port>
454
  </output>
455
  </layer>
456
+ <layer id="29" name="Subtract_184653" type="Subtract" version="opset1">
457
  <data auto_broadcast="numpy" />
458
  <input>
459
  <port id="0" precision="I32">
 
469
  </port>
470
  </output>
471
  </layer>
472
+ <layer id="30" name="Constant_184654" type="Const" version="opset1">
473
+ <data element_type="i32" shape="" offset="1227760" size="4" />
474
  <output>
475
  <port id="0" precision="I32" />
476
  </output>
477
  </layer>
478
+ <layer id="31" name="Minimum_184655" type="Minimum" version="opset1">
479
  <data auto_broadcast="numpy" />
480
  <input>
481
  <port id="0" precision="I32">
 
489
  </port>
490
  </output>
491
  </layer>
492
+ <layer id="32" name="Subtract_184656" type="Subtract" version="opset1">
493
  <data auto_broadcast="numpy" />
494
  <input>
495
  <port id="0" precision="I32">
 
505
  </port>
506
  </output>
507
  </layer>
508
+ <layer id="33" name="Constant_184657" type="Const" version="opset1">
509
+ <data element_type="i32" shape="1" offset="1227764" size="4" />
510
  <output>
511
  <port id="0" precision="I32">
512
  <dim>1</dim>
513
  </port>
514
  </output>
515
  </layer>
516
+ <layer id="34" name="CombineSegments_184658" type="CombineSegments" version="extension">
517
  <input>
518
  <port id="0" precision="I32">
519
  <dim>-1</dim>
 
549
  </port>
550
  </output>
551
  </layer>
552
+ <layer id="35" name="Subtract_184659" type="Subtract" version="opset1">
553
  <data auto_broadcast="numpy" />
554
  <input>
555
  <port id="0" precision="I32">
 
565
  </port>
566
  </output>
567
  </layer>
568
+ <layer id="36" name="Constant_184660" type="Const" version="opset1">
569
+ <data element_type="i32" shape="" offset="1227764" size="4" />
570
  <output>
571
  <port id="0" precision="I32" />
572
  </output>
573
  </layer>
574
+ <layer id="37" name="ReduceMax_184661" type="ReduceMax" version="opset1">
575
  <data keep_dims="false" />
576
  <input>
577
  <port id="0" precision="I32">
 
583
  <port id="2" precision="I32" />
584
  </output>
585
  </layer>
586
+ <layer id="38" name="Constant_184662" type="Const" version="opset1">
587
+ <data element_type="i32" shape="" offset="1227764" size="4" />
588
  <output>
589
  <port id="0" precision="I32" />
590
  </output>
591
  </layer>
592
+ <layer id="39" name="RaggedToDense_184663" type="RaggedToDense" version="extension">
593
+ <data pad_right="false" />
594
  <input>
595
  <port id="0" precision="I32">
596
  <dim>-1</dim>
 
615
  </port>
616
  </output>
617
  </layer>
618
+ <layer id="40" name="Convert_184664" type="Convert" version="opset1">
619
  <data destination_type="i32" />
620
  <input>
621
  <port id="0" precision="BOOL">
 
630
  </port>
631
  </output>
632
  </layer>
633
+ <layer id="41" name="Convert_184664" type="Convert" version="opset1">
634
  <data destination_type="i64" />
635
  <input>
636
  <port id="0" precision="I32">
 
645
  </port>
646
  </output>
647
  </layer>
648
+ <layer id="43" name="RaggedToDense_184663.0" type="Convert" version="opset1">
649
  <data destination_type="i64" />
650
  <input>
651
  <port id="0" precision="I32">
 
660
  </port>
661
  </output>
662
  </layer>
663
+ <layer id="44" name="Result_184667" type="Result" version="opset1">
664
  <input>
665
  <port id="0" precision="I64">
666
  <dim>-1</dim>
 
668
  </port>
669
  </input>
670
  </layer>
671
+ <layer id="42" name="Result_184669" type="Result" version="opset1">
672
  <input>
673
  <port id="0" precision="I64">
674
  <dim>-1</dim>
 
679
  </layers>
680
  <edges>
681
  <edge from-layer="0" from-port="0" to-layer="2" to-port="0" />
682
+ <edge from-layer="1" from-port="0" to-layer="8" to-port="0" />
683
  <edge from-layer="2" from-port="1" to-layer="3" to-port="0" />
684
+ <edge from-layer="2" from-port="3" to-layer="15" to-port="4" />
685
+ <edge from-layer="2" from-port="2" to-layer="15" to-port="3" />
686
+ <edge from-layer="2" from-port="1" to-layer="15" to-port="2" />
687
+ <edge from-layer="3" from-port="1" to-layer="6" to-port="0" />
688
+ <edge from-layer="4" from-port="0" to-layer="6" to-port="1" />
689
+ <edge from-layer="5" from-port="0" to-layer="6" to-port="2" />
690
+ <edge from-layer="6" from-port="3" to-layer="11" to-port="0" />
691
+ <edge from-layer="6" from-port="3" to-layer="8" to-port="1" />
692
+ <edge from-layer="7" from-port="0" to-layer="8" to-port="2" />
693
+ <edge from-layer="8" from-port="3" to-layer="15" to-port="0" />
694
+ <edge from-layer="9" from-port="0" to-layer="13" to-port="0" />
695
+ <edge from-layer="10" from-port="0" to-layer="11" to-port="1" />
696
+ <edge from-layer="11" from-port="2" to-layer="13" to-port="1" />
697
+ <edge from-layer="12" from-port="0" to-layer="13" to-port="2" />
698
+ <edge from-layer="13" from-port="3" to-layer="15" to-port="1" />
699
+ <edge from-layer="14" from-port="0" to-layer="15" to-port="5" />
700
+ <edge from-layer="15" from-port="9" to-layer="16" to-port="1" />
701
+ <edge from-layer="15" from-port="7" to-layer="18" to-port="1" />
702
+ <edge from-layer="15" from-port="6" to-layer="18" to-port="0" />
703
+ <edge from-layer="15" from-port="11" to-layer="16" to-port="3" />
704
+ <edge from-layer="15" from-port="10" to-layer="16" to-port="2" />
705
+ <edge from-layer="15" from-port="8" to-layer="16" to-port="0" />
706
+ <edge from-layer="16" from-port="4" to-layer="18" to-port="2" />
707
+ <edge from-layer="16" from-port="5" to-layer="18" to-port="3" />
708
+ <edge from-layer="16" from-port="6" to-layer="18" to-port="4" />
709
+ <edge from-layer="16" from-port="7" to-layer="18" to-port="5" />
710
+ <edge from-layer="17" from-port="0" to-layer="18" to-port="6" />
711
+ <edge from-layer="18" from-port="11" to-layer="28" to-port="4" />
712
+ <edge from-layer="18" from-port="10" to-layer="28" to-port="3" />
713
+ <edge from-layer="18" from-port="9" to-layer="28" to-port="2" />
714
+ <edge from-layer="18" from-port="8" to-layer="28" to-port="1" />
715
+ <edge from-layer="18" from-port="7" to-layer="28" to-port="0" />
716
+ <edge from-layer="19" from-port="0" to-layer="20" to-port="0" />
717
+ <edge from-layer="20" from-port="1" to-layer="28" to-port="5" />
718
+ <edge from-layer="20" from-port="2" to-layer="28" to-port="6" />
719
+ <edge from-layer="20" from-port="3" to-layer="28" to-port="7" />
720
+ <edge from-layer="21" from-port="0" to-layer="22" to-port="0" />
721
+ <edge from-layer="22" from-port="1" to-layer="28" to-port="8" />
722
+ <edge from-layer="22" from-port="2" to-layer="28" to-port="9" />
723
+ <edge from-layer="22" from-port="3" to-layer="28" to-port="10" />
724
+ <edge from-layer="23" from-port="0" to-layer="24" to-port="0" />
725
+ <edge from-layer="24" from-port="1" to-layer="28" to-port="11" />
726
+ <edge from-layer="24" from-port="2" to-layer="28" to-port="12" />
727
+ <edge from-layer="24" from-port="3" to-layer="28" to-port="13" />
728
+ <edge from-layer="25" from-port="0" to-layer="26" to-port="0" />
729
+ <edge from-layer="26" from-port="1" to-layer="28" to-port="14" />
730
+ <edge from-layer="26" from-port="2" to-layer="28" to-port="15" />
731
+ <edge from-layer="26" from-port="3" to-layer="28" to-port="16" />
732
+ <edge from-layer="27" from-port="0" to-layer="28" to-port="17" />
733
+ <edge from-layer="28" from-port="19" to-layer="29" to-port="0" />
734
+ <edge from-layer="28" from-port="18" to-layer="29" to-port="1" />
735
+ <edge from-layer="28" from-port="19" to-layer="32" to-port="0" />
736
+ <edge from-layer="28" from-port="20" to-layer="34" to-port="2" />
737
+ <edge from-layer="28" from-port="19" to-layer="34" to-port="1" />
738
+ <edge from-layer="29" from-port="2" to-layer="31" to-port="0" />
739
+ <edge from-layer="30" from-port="0" to-layer="31" to-port="1" />
740
+ <edge from-layer="31" from-port="2" to-layer="32" to-port="1" />
741
+ <edge from-layer="32" from-port="2" to-layer="34" to-port="0" />
742
+ <edge from-layer="33" from-port="0" to-layer="34" to-port="3" />
743
+ <edge from-layer="34" from-port="5" to-layer="39" to-port="1" />
744
+ <edge from-layer="34" from-port="6" to-layer="39" to-port="2" />
745
+ <edge from-layer="34" from-port="4" to-layer="39" to-port="0" />
746
+ <edge from-layer="34" from-port="4" to-layer="35" to-port="1" />
747
+ <edge from-layer="34" from-port="5" to-layer="35" to-port="0" />
748
+ <edge from-layer="35" from-port="2" to-layer="37" to-port="0" />
749
  <edge from-layer="36" from-port="0" to-layer="37" to-port="1" />
750
+ <edge from-layer="37" from-port="2" to-layer="39" to-port="3" />
751
+ <edge from-layer="38" from-port="0" to-layer="39" to-port="4" />
752
+ <edge from-layer="39" from-port="6" to-layer="40" to-port="0" />
753
+ <edge from-layer="39" from-port="5" to-layer="43" to-port="0" />
754
+ <edge from-layer="40" from-port="1" to-layer="41" to-port="0" />
755
+ <edge from-layer="41" from-port="1" to-layer="42" to-port="0" />
756
+ <edge from-layer="43" from-port="1" to-layer="44" to-port="0" />
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
757
  </edges>
758
  <rt_info>
759
+ <bos_token_id value="0" />
760
  <eos_token_id value="0" />
761
+ <original_tokenizer_class value="&lt;class 'transformers.models.gpt_neox.tokenization_gpt_neox_fast.GPTNeoXTokenizerFast'>" />
762
  </rt_info>
763
  </net>
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff