|
<?xml version="1.0"?> |
|
<net name="Model0" version="11"> |
|
<layers> |
|
<layer id="3" name="attention_mask" type="Parameter" version="opset1"> |
|
<data shape="?,?" element_type="i64" /> |
|
<output> |
|
<port id="0" precision="I64" names="attention_mask"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="2" name="position_ids" type="Parameter" version="opset1"> |
|
<data shape="?,?" element_type="i64" /> |
|
<output> |
|
<port id="0" precision="I64" names="position_ids"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="1" name="inputs_embeds" type="Parameter" version="opset1"> |
|
<data shape="?,?,16" element_type="f32" /> |
|
<output> |
|
<port id="0" precision="FP32" names="inputs_embeds"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="0" name="beam_idx" type="Parameter" version="opset1"> |
|
<data shape="?" element_type="i32" /> |
|
<output> |
|
<port id="0" precision="I32" names="beam_idx"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="4" name="Constant_9487" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="5" name="ShapeOf_9473" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="6" name="Constant_9475" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="7" name="Constant_9477" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="8" name="Gather_9478" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="9" name="Constant_9480" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="10" name="Constant_9482" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="11" name="Constant_9484" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="12" name="Concat_9485" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="13" name="Broadcast_9488" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="14" name="ReadValue_9185" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.1.valuepresent.1.value" variable_type="f32" variable_shape="?,4,?,4" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.1.value"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="15" name="Constant_8891" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="16" name="Gather_8892" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="17" name="Constant_7373" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 16" offset="20" size="64" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="18" name="Constant_7372" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="84" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="19" name="Constant_7370" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="88" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="20" name="__module.model.model.layers.0.input_layernorm/aten::pow/Power" type="Power" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="133"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="21" name="Constant_571" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="134"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="22" name="__module.model.model.layers.0.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> |
|
<data keep_dims="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="135,variance.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="23" name="Constant_7371" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="100" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="24" name="__module.model.model.layers.0.input_layernorm/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="136"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="25" name="__module.model.model.layers.0.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="26" name="__module.model.model.layers.0.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> |
|
<data auto_broadcast="numpy" m_pythondiv="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="137"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="27" name="__module.model.model.layers.0.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="138,139,hidden_states.3,hidden_states.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="28" name="__module.model.model.layers.0.input_layernorm/aten::mul/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="140,142,hidden_states.7"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="29" name="self.model.model.layers.0.self_attn.q_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="104" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.0.self_attn.q_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="30" name="__module.model.model.layers.0.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="151,query_states.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="31" name="Constant_7898" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="1128" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="32" name="__module.model.model.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="157"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="33" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="34" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="158,q.1"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="35" name="__module.model.model.rotary_emb/aten::unsqueeze/Unsqueeze_1" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 2, 1" offset="1176" size="8" /> |
|
<output> |
|
<port id="0" precision="FP32" names="103,104"> |
|
<dim>1</dim> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="36" name="ShapeOf_7694" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="37" name="Constant_7695" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="38" name="Constant_7696" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="39" name="Gather_7697" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="105,75"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="40" name="Constant_6593" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="41" name="Constant_6595" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="42" name="__module.model.model.rotary_emb/prim::ListConstruct" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="43" name="__module.model.model.rotary_emb/aten::expand/Broadcast" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="107,112,inv_freq_expanded,inv_freq_expanded.1"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="44" name="24" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="24" /> |
|
</output> |
|
</layer> |
|
<layer id="45" name="__module.model.model.rotary_emb/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="109,110"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="46" name="__module.model.model.rotary_emb/aten::to/Convert_2" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="111,113,position_ids_expanded,position_ids_expanded.1"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="47" name="__module.model.model.rotary_emb/aten::matmul/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="114"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="48" name="__module.model.model.rotary_emb/aten::transpose/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="3" offset="1192" size="12" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="49" name="__module.model.model.rotary_emb/aten::transpose/Transpose" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="115"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="50" name="__module.model.model.rotary_emb/aten::cat/Concat" type="Concat" version="opset1"> |
|
<data axis="-1" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="117,emb"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="51" name="__module.model.model.rotary_emb/aten::cos/Cos" type="Cos" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="118,120,122,125,cos.1,cos.3,cos.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="52" name="__module.model.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="165,290,cos,cos.7"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="53" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="167"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="54" name="Constant_965" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="55" name="Constant_967" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1212" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="56" name="Constant_969" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="57" name="__module.model.model.layers.0.self_attn/aten::slice/Reshape" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1220" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="58" name="__module.model.model.layers.0.self_attn/aten::slice/Slice" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="177,x2.1"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="59" name="Constant_7374" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1, 1" offset="1228" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="60" name="__module.model.model.layers.0.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="178"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="61" name="Constant_862" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="62" name="Constant_906" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="63" name="Constant_908" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="64" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="172"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="65" name="__module.model.model.layers.0.self_attn/aten::cat/Concat" type="Concat" version="opset1"> |
|
<data axis="-1" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="180"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="66" name="__module.model.model.rotary_emb/aten::sin/Sin" type="Sin" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="119,121,123,126,sin.1,sin.3,sin.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="67" name="__module.model.model.layers.0.self_attn/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="166,291,sin,sin.7"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="68" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="181"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="69" name="__module.model.model.layers.0.self_attn/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="182"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="70" name="Constant_9499" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="71" name="Constant_9492" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="72" name="Constant_9494" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="73" name="Constant_9496" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="74" name="Concat_9497" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="75" name="Broadcast_9500" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="76" name="ReadValue_9179" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.0.keypresent.0.key" variable_type="f32" variable_shape="?,4,?,4" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.0.key"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="77" name="Constant_8882" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="78" name="Gather_8883" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="79" name="self.model.model.layers.0.self_attn.k_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="1232" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.0.self_attn.k_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="80" name="__module.model.model.layers.0.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="153,key_states.3"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="81" name="Constant_7899" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="1128" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="82" name="__module.model.model.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="160"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="83" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="84" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="161,k.1"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="85" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="183"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="86" name="Constant_1108" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="87" name="Constant_1110" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1212" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="88" name="Constant_1112" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="89" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="193,x2.3"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="90" name="Constant_7375" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1, 1" offset="1228" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="91" name="__module.model.model.layers.0.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="194"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="92" name="Constant_1005" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="93" name="Constant_1049" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="94" name="Constant_1051" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="95" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="188"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="96" name="__module.model.model.layers.0.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> |
|
<data axis="-1" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="196"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="97" name="__module.model.model.layers.0.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="197"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="98" name="__module.model.model.layers.0.self_attn/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="198,key_states.5"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="99" name="__module.model.model.layers.0.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.0.key"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="100" name="Constant_9511" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="101" name="Constant_9504" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="102" name="Constant_9506" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="103" name="Constant_9508" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="104" name="Concat_9509" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="105" name="Broadcast_9512" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="106" name="ReadValue_9181" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.0.valuepresent.0.value" variable_type="f32" variable_shape="?,4,?,4" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.0.value"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="107" name="Constant_8885" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="108" name="Gather_8886" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="109" name="self.model.model.layers.0.self_attn.v_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="2256" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.0.self_attn.v_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="110" name="__module.model.model.layers.0.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="155,value_states.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="111" name="Constant_7900" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="1128" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="112" name="__module.model.model.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="163"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="113" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="114" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="164"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="115" name="__module.model.model.layers.0.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.0.value"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="116" name="__module.model.model/aten::triu/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="117" name="Multiply_7055" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="3280" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="118" name="Constant_7060" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="3284" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="119" name="Constant_7703" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="120" name="Constant_7704" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="121" name="Gather_7705" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="55,60" /> |
|
</output> |
|
</layer> |
|
<layer id="122" name="Constant_7706" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="123" name="Reshape_7707" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="124" name="ShapeOf_7710" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="125" name="Constant_7711" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="126" name="Constant_7712" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="127" name="Gather_7713" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="61,79" /> |
|
</output> |
|
</layer> |
|
<layer id="128" name="Constant_7714" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="129" name="Reshape_7715" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="130" name="__module.model.model/prim::ListConstruct" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="131" name="Maximum_7061" type="Maximum" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="132" name="__module.model.model/aten::mul/Multiply" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="133" name="ShapeOf_7720" type="ShapeOf" version="opset3"> |
|
<data output_type="i32" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I32"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="134" name="Constant_7721" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="135" name="Constant_7722" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="136" name="Gather_7723" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I32"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="137" name="__module.model.model/aten::triu/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="3300" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="138" name="__module.model.model/aten::triu/Range" type="Range" version="opset4"> |
|
<data output_type="i32" /> |
|
<input> |
|
<port id="0" precision="I32" /> |
|
<port id="1" precision="I32" /> |
|
<port id="2" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="139" name="__module.model.model/aten::triu/Unsqueeze" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I32"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="140" name="__module.model.model/aten::triu/Convert" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="3300" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="141" name="Constant_7727" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="142" name="Constant_7728" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="143" name="Gather_7729" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I32"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="144" name="__module.model.model/aten::triu/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I32" /> |
|
<port id="1" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="145" name="__module.model.model/aten::triu/Range_1" type="Range" version="opset4"> |
|
<data output_type="i32" /> |
|
<input> |
|
<port id="0" precision="I32" /> |
|
<port id="1" precision="I32" /> |
|
<port id="2" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="146" name="__module.model.model/aten::triu/Unsqueeze_1" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="147" name="__module.model.model/aten::triu/GreaterEqual" type="GreaterEqual" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="148" name="__module.model.model/aten::triu/ConvertLike" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="149" name="__module.model.model/aten::triu/Select" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="FP32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="65_1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="150" name="__module.model.model/aten::arange/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="151" name="__module.model.model/aten::arange/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="3300" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="152" name="__module.model.model/aten::arange/Range" type="Range" version="opset4"> |
|
<data output_type="f32" /> |
|
<input> |
|
<port id="0" precision="I32" /> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="153" name="__module.model.model/aten::arange/ConvertLike" type="Convert" version="opset1"> |
|
<data destination_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="66"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="154" name="__module.model.model/aten::gt/Convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="155" name="ShapeOf_7734" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="156" name="Constant_7735" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="157" name="Constant_7736" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="158" name="Gather_7737" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="53" /> |
|
</output> |
|
</layer> |
|
<layer id="159" name="__module.model.model/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="57" /> |
|
</output> |
|
</layer> |
|
<layer id="160" name="__module.model.model/aten::arange/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="3300" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="161" name="__module.model.model/aten::arange/Range_1" type="Range" version="opset4"> |
|
<data output_type="f32" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="59,cache_position"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="162" name="Constant_179" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="3304" size="16" /> |
|
<output> |
|
<port id="0" precision="I64" names="67"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="163" name="__module.model.model/aten::reshape/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="68"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="164" name="__module.model.model/aten::gt/Greater" type="Greater" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="69"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="165" name="__module.model.model/aten::mul_/ConvertLike" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="166" name="__module.model.model/aten::mul_/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="65,causal_mask.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="167" name="31" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="31" /> |
|
</output> |
|
</layer> |
|
<layer id="168" name="__module.model.model/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="71"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="169" name="__module.model.model/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="72,73,74"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="170" name="Constant_6601" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="171" name="Constant_6603" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="172" name="Constant_6605" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="173" name="__module.model.model/prim::ListConstruct_1" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="174" name="__module.model.model/aten::expand/Broadcast" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="77,80,81,82,90,91,92,95_1,96_1,97_1,causal_mask.5"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="175" name="Constant_3919" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="176" name="SliceAssign_396/Reshape_3" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="177" name="Constant_2274" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="178" name="SliceAssign_396/ShapeOf" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="179" name="SliceAssign_396/ReduceProd" type="ReduceProd" version="opset1"> |
|
<data keep_dims="false" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="180" name="Constant_2275" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="181" name="SliceAssign_396/Range" type="Range" version="opset4"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="182" name="SliceAssign_396/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="183" name="Constant_385" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="184" name="Constant_388" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="185" name="SliceAssign_396/Slice_2" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="186" name="Constant_2277" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="3304" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="187" name="SliceAssign_396/Reshape_4" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="188" name="Constant_268" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="189" name="Constant_271" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="190" name="__module.model.model/aten::slice/Slice_5" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="83,93,98_1"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="191" name="__module.model.model/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="85"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="192" name="22" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="22" /> |
|
</output> |
|
</layer> |
|
<layer id="193" name="__module.model.model/aten::unsqueeze/Unsqueeze_3" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="86,87"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="194" name="__module.model.model/aten::add/Convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="195" name="__module.model.model/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="88,padding_mask.1"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="196" name="Constant_7376" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1, 1" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="197" name="__module.model.model/aten::eq/Equal" type="Equal" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="89,padding_mask"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="198" name="34" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="3280" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" names="34" /> |
|
</output> |
|
</layer> |
|
<layer id="199" name="__module.model.model/aten::masked_fill/Select" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32" /> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="94"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="200" name="__module.model.model/aten::copy_/ShapeOf" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="201" name="__module.model.model/aten::copy_/Broadcast" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="98"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="202" name="Constant_3921" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="203" name="SliceAssign_396/Reshape_5" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="204" name="SliceAssign_396/ScatterNDUpdate" type="ScatterNDUpdate" version="opset4"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="205" name="SliceAssign_396/Reshape_6" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="207,208,209,329,330,331,78"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="206" name="Constant_1182" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="207" name="Constant_7748" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="208" name="Reshape_7749" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="209" name="Add_7752" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="206,328"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="210" name="Constant_1185" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="211" name="__module.model.model.layers.0.self_attn/aten::slice/Slice_7" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="210,332"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="212" name="__module.model.model.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> |
|
<data causal="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="211,attn_output.1"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="213" name="__module.model.model.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="214" name="__module.model.model.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="212"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="215" name="Constant_6856" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="3320" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="216" name="Constant_6857" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="217" name="Gather_6858" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="218" name="Constant_1259" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="219" name="__module.model.model.layers.0.self_attn/prim::ListConstruct_3" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="220" name="__module.model.model.layers.0.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="215"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="221" name="self.model.model.layers.0.self_attn.o_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="3336" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.0.self_attn.o_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="222" name="__module.model.model.layers.0.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="217,219,hidden_states.13"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="223" name="__module.model.model.layers.0/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="222,224,235,hidden_states.15,hidden_states.17"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="224" name="Constant_7379" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="84" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="225" name="Constant_7377" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="88" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="226" name="__module.model.model.layers.0.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="225"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="227" name="Constant_1286" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="226"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="228" name="__module.model.model.layers.0.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> |
|
<data keep_dims="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="227,variance.3"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="229" name="Constant_7378" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="100" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="230" name="__module.model.model.layers.0.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="228"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="231" name="__module.model.model.layers.0.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="232" name="__module.model.model.layers.0.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> |
|
<data auto_broadcast="numpy" m_pythondiv="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="229"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="233" name="__module.model.model.layers.0.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="230,231,232,234,hidden_states.19,hidden_states.21"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="234" name="self.model.model.layers.0.mlp.gate_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="64, 16" offset="4360" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.0.mlp.gate_proj.weight"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="235" name="__module.model.model.layers.0.mlp.gate_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="240,input.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="236" name="__module.model.model.layers.0.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="241"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="237" name="self.model.model.layers.0.mlp.up_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="64, 16" offset="8456" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.0.mlp.up_proj.weight"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="238" name="__module.model.model.layers.0.mlp.up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="243"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="239" name="__module.model.model.layers.0.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="244"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="240" name="self.model.model.layers.0.mlp.down_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 64" offset="12552" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.0.mlp.down_proj.weight"> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="241" name="__module.model.model.layers.0.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="246,hidden_states.23"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="242" name="__module.model.model.layers.0/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="247,249,257,268,hidden_states.25,hidden_states.27"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="243" name="Constant_7382" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="84" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="244" name="Constant_7380" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="88" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="245" name="__module.model.model.layers.1.input_layernorm/aten::pow/Power" type="Power" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="258"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="246" name="Constant_1357" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="259"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="247" name="__module.model.model.layers.1.input_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> |
|
<data keep_dims="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="260,variance.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="248" name="Constant_7381" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="100" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="249" name="__module.model.model.layers.1.input_layernorm/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="261"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="250" name="__module.model.model.layers.1.input_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="251" name="__module.model.model.layers.1.input_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> |
|
<data auto_broadcast="numpy" m_pythondiv="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="262"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="252" name="__module.model.model.layers.1.input_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="263,264,265,267,hidden_states.29,hidden_states.31,hidden_states.33"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="253" name="self.model.model.layers.1.self_attn.v_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="16648" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.1.self_attn.v_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="254" name="__module.model.model.layers.1.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="280,value_states"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="255" name="Constant_7901" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="1128" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="256" name="__module.model.model.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="288"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="257" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="258" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="289"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="259" name="__module.model.model.layers.1.self_attn/aten::cat/Concat" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.1.value"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="261" name="Constant_9523" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="0" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="262" name="Constant_9516" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="263" name="Constant_9518" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="264" name="Constant_9520" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="12" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="265" name="Concat_9521" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="266" name="Broadcast_9524" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="267" name="ReadValue_9183" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.1.keypresent.1.key" variable_type="f32" variable_shape="?,4,?,4" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>0</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.1.key"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="268" name="Constant_8888" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="269" name="Gather_8889" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="270" name="self.model.model.layers.1.self_attn.k_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="17672" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.1.self_attn.k_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="271" name="__module.model.model.layers.1.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="278,key_states"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="272" name="Constant_7902" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="1128" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="273" name="__module.model.model.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="285"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="274" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="275" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="286,k"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="276" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="308"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="277" name="Constant_1894" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="278" name="Constant_1896" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1212" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="279" name="Constant_1898" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="280" name="__module.model.model.layers.1.self_attn/aten::slice/Slice" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="318,x2"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="281" name="Constant_7383" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1, 1" offset="1228" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="282" name="__module.model.model.layers.1.self_attn/aten::neg/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="319"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="283" name="Constant_1791" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="284" name="Constant_1835" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="285" name="Constant_1837" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="286" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_1" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="313"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="287" name="__module.model.model.layers.1.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> |
|
<data axis="-1" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="321"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="288" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="322"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="289" name="__module.model.model.layers.1.self_attn/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="323"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="290" name="__module.model.model.layers.1.self_attn/aten::cat/Concat_2" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.1.key"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="294" name="self.model.model.layers.1.self_attn.q_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="18696" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.1.self_attn.q_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="295" name="__module.model.model.layers.1.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="276,query_states"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="296" name="Constant_7903" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="1128" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="297" name="__module.model.model.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="282"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="298" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="299" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="283,q"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="300" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply_2" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="292"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="301" name="Constant_1751" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="302" name="Constant_1753" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1212" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="303" name="Constant_1755" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="304" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_2" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="302,x2.5"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="305" name="Constant_7384" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1, 1" offset="1228" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="306" name="__module.model.model.layers.1.self_attn/aten::neg/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="303"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="307" name="Constant_1648" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="4" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="308" name="Constant_1692" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1204" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="309" name="Constant_1694" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="1184" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="310" name="__module.model.model.layers.1.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="297"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="311" name="__module.model.model.layers.1.self_attn/aten::cat/Concat_3" type="Concat" version="opset1"> |
|
<data axis="-1" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="305"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="312" name="__module.model.model.layers.1.self_attn/aten::mul/Multiply_3" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="306"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="313" name="__module.model.model.layers.1.self_attn/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="307"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="314" name="__module.model.model.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> |
|
<data causal="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="333,attn_output.5"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="315" name="__module.model.model.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="1160" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="316" name="__module.model.model.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="334"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="317" name="__module.model.model.layers.1.self_attn/aten::view/Reshape_3" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="337"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="318" name="self.model.model.layers.1.self_attn.o_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 16" offset="19720" size="1024" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.1.self_attn.o_proj.weight"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="319" name="__module.model.model.layers.1.self_attn.o_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="339,341,hidden_states.39"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="320" name="__module.model.model.layers.1/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="344,346,357,hidden_states.41,hidden_states.43"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="321" name="Constant_7387" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="84" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="322" name="Constant_7385" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="88" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="323" name="__module.model.model.layers.1.post_attention_layernorm/aten::pow/Power" type="Power" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="347"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="324" name="Constant_2066" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="348"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="325" name="__module.model.model.layers.1.post_attention_layernorm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> |
|
<data keep_dims="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="349,variance.7"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="326" name="Constant_7386" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="100" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="327" name="__module.model.model.layers.1.post_attention_layernorm/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="350"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="328" name="__module.model.model.layers.1.post_attention_layernorm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="329" name="__module.model.model.layers.1.post_attention_layernorm/aten::rsqrt/Divide" type="Divide" version="opset1"> |
|
<data auto_broadcast="numpy" m_pythondiv="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="351"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="330" name="__module.model.model.layers.1.post_attention_layernorm/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="352,353,354,356,hidden_states.45,hidden_states.47"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="331" name="self.model.model.layers.1.mlp.gate_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="64, 16" offset="20744" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.1.mlp.gate_proj.weight"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="332" name="__module.model.model.layers.1.mlp.gate_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="362,input"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="333" name="__module.model.model.layers.1.mlp.act_fn/aten::silu/Swish" type="Swish" version="opset4"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="363"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="334" name="self.model.model.layers.1.mlp.up_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="64, 16" offset="24840" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.1.mlp.up_proj.weight"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="335" name="__module.model.model.layers.1.mlp.up_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>64</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="365"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="336" name="__module.model.model.layers.1.mlp/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="366"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="337" name="self.model.model.layers.1.mlp.down_proj.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="16, 64" offset="28936" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.model.layers.1.mlp.down_proj.weight"> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="338" name="__module.model.model.layers.1.mlp.down_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="368,hidden_states.49"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="339" name="__module.model.model.layers.1/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="369,371,375,hidden_states.51,hidden_states.53"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="340" name="Constant_7390" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="84" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="341" name="Constant_7388" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="88" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="342" name="__module.model.model.norm/aten::pow/Power" type="Power" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="376"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="343" name="Constant_2133" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="92" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="377"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="344" name="__module.model.model.norm/aten::mean/ReduceMean" type="ReduceMean" version="opset1"> |
|
<data keep_dims="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="378,variance"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="345" name="Constant_7389" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1" offset="100" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="346" name="__module.model.model.norm/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="379"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="347" name="__module.model.model.norm/aten::rsqrt/Sqrt" type="Sqrt" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="348" name="__module.model.model.norm/aten::rsqrt/Divide" type="Divide" version="opset1"> |
|
<data auto_broadcast="numpy" m_pythondiv="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="380"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="349" name="__module.model.model.norm/aten::mul/Multiply" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="381,382,383,385,390,391,392,hidden_states,hidden_states.55,hidden_states.57"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="350" name="self.model.lm_head.weight" type="Const" version="opset1"> |
|
<data element_type="f32" shape="32002, 16" offset="33032" size="2048128" /> |
|
<output> |
|
<port id="0" precision="FP32" names="self.model.lm_head.weight"> |
|
<dim>32002</dim> |
|
<dim>16</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="351" name="__module.model/aten::to/Convert" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>32002</dim> |
|
<dim>16</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="logits"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32002</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="293" name="Assign_9180" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.0.keypresent.0.key" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="292" name="Assign_9182" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.0.valuepresent.0.value" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="291" name="Assign_9184" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.1.keypresent.1.key" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="260" name="Assign_9186" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.1.valuepresent.1.value" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="352" name="Result_2261" type="Result" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32002</dim> |
|
</port> |
|
</input> |
|
</layer> |
|
</layers> |
|
<edges> |
|
<edge from-layer="0" from-port="0" to-layer="269" to-port="1" /> |
|
<edge from-layer="0" from-port="0" to-layer="108" to-port="1" /> |
|
<edge from-layer="0" from-port="0" to-layer="78" to-port="1" /> |
|
<edge from-layer="0" from-port="0" to-layer="16" to-port="1" /> |
|
<edge from-layer="1" from-port="0" to-layer="223" to-port="0" /> |
|
<edge from-layer="1" from-port="0" to-layer="5" to-port="0" /> |
|
<edge from-layer="1" from-port="0" to-layer="27" to-port="0" /> |
|
<edge from-layer="1" from-port="0" to-layer="20" to-port="0" /> |
|
<edge from-layer="2" from-port="0" to-layer="45" to-port="0" /> |
|
<edge from-layer="3" from-port="0" to-layer="191" to-port="0" /> |
|
<edge from-layer="3" from-port="0" to-layer="124" to-port="0" /> |
|
<edge from-layer="4" from-port="0" to-layer="13" to-port="0" /> |
|
<edge from-layer="5" from-port="1" to-layer="8" to-port="0" /> |
|
<edge from-layer="6" from-port="0" to-layer="8" to-port="1" /> |
|
<edge from-layer="7" from-port="0" to-layer="8" to-port="2" /> |
|
<edge from-layer="8" from-port="3" to-layer="12" to-port="0" /> |
|
<edge from-layer="8" from-port="3" to-layer="265" to-port="0" /> |
|
<edge from-layer="8" from-port="3" to-layer="104" to-port="0" /> |
|
<edge from-layer="8" from-port="3" to-layer="74" to-port="0" /> |
|
<edge from-layer="9" from-port="0" to-layer="12" to-port="1" /> |
|
<edge from-layer="10" from-port="0" to-layer="12" to-port="2" /> |
|
<edge from-layer="11" from-port="0" to-layer="12" to-port="3" /> |
|
<edge from-layer="12" from-port="4" to-layer="13" to-port="1" /> |
|
<edge from-layer="13" from-port="2" to-layer="14" to-port="0" /> |
|
<edge from-layer="14" from-port="1" to-layer="16" to-port="0" /> |
|
<edge from-layer="15" from-port="0" to-layer="16" to-port="2" /> |
|
<edge from-layer="16" from-port="3" to-layer="259" to-port="0" /> |
|
<edge from-layer="17" from-port="0" to-layer="28" to-port="0" /> |
|
<edge from-layer="18" from-port="0" to-layer="26" to-port="0" /> |
|
<edge from-layer="19" from-port="0" to-layer="20" to-port="1" /> |
|
<edge from-layer="20" from-port="2" to-layer="22" to-port="0" /> |
|
<edge from-layer="21" from-port="0" to-layer="22" to-port="1" /> |
|
<edge from-layer="22" from-port="2" to-layer="24" to-port="0" /> |
|
<edge from-layer="23" from-port="0" to-layer="24" to-port="1" /> |
|
<edge from-layer="24" from-port="2" to-layer="25" to-port="0" /> |
|
<edge from-layer="25" from-port="1" to-layer="26" to-port="1" /> |
|
<edge from-layer="26" from-port="2" to-layer="27" to-port="1" /> |
|
<edge from-layer="27" from-port="2" to-layer="28" to-port="1" /> |
|
<edge from-layer="28" from-port="2" to-layer="110" to-port="0" /> |
|
<edge from-layer="28" from-port="2" to-layer="36" to-port="0" /> |
|
<edge from-layer="28" from-port="2" to-layer="30" to-port="0" /> |
|
<edge from-layer="28" from-port="2" to-layer="80" to-port="0" /> |
|
<edge from-layer="29" from-port="0" to-layer="30" to-port="1" /> |
|
<edge from-layer="30" from-port="2" to-layer="32" to-port="0" /> |
|
<edge from-layer="31" from-port="0" to-layer="32" to-port="1" /> |
|
<edge from-layer="32" from-port="2" to-layer="34" to-port="0" /> |
|
<edge from-layer="33" from-port="0" to-layer="34" to-port="1" /> |
|
<edge from-layer="34" from-port="2" to-layer="64" to-port="0" /> |
|
<edge from-layer="34" from-port="2" to-layer="58" to-port="0" /> |
|
<edge from-layer="34" from-port="2" to-layer="53" to-port="0" /> |
|
<edge from-layer="35" from-port="0" to-layer="43" to-port="0" /> |
|
<edge from-layer="36" from-port="1" to-layer="121" to-port="0" /> |
|
<edge from-layer="36" from-port="1" to-layer="39" to-port="0" /> |
|
<edge from-layer="36" from-port="1" to-layer="217" to-port="0" /> |
|
<edge from-layer="37" from-port="0" to-layer="39" to-port="1" /> |
|
<edge from-layer="38" from-port="0" to-layer="39" to-port="2" /> |
|
<edge from-layer="39" from-port="3" to-layer="173" to-port="0" /> |
|
<edge from-layer="39" from-port="3" to-layer="42" to-port="0" /> |
|
<edge from-layer="40" from-port="0" to-layer="42" to-port="1" /> |
|
<edge from-layer="41" from-port="0" to-layer="42" to-port="2" /> |
|
<edge from-layer="42" from-port="3" to-layer="43" to-port="1" /> |
|
<edge from-layer="43" from-port="2" to-layer="47" to-port="0" /> |
|
<edge from-layer="44" from-port="0" to-layer="45" to-port="1" /> |
|
<edge from-layer="44" from-port="0" to-layer="191" to-port="1" /> |
|
<edge from-layer="44" from-port="0" to-layer="169" to-port="1" /> |
|
<edge from-layer="44" from-port="0" to-layer="52" to-port="1" /> |
|
<edge from-layer="44" from-port="0" to-layer="67" to-port="1" /> |
|
<edge from-layer="45" from-port="2" to-layer="46" to-port="0" /> |
|
<edge from-layer="46" from-port="1" to-layer="47" to-port="1" /> |
|
<edge from-layer="47" from-port="2" to-layer="49" to-port="0" /> |
|
<edge from-layer="48" from-port="0" to-layer="49" to-port="1" /> |
|
<edge from-layer="49" from-port="2" to-layer="50" to-port="1" /> |
|
<edge from-layer="49" from-port="2" to-layer="50" to-port="0" /> |
|
<edge from-layer="50" from-port="2" to-layer="66" to-port="0" /> |
|
<edge from-layer="50" from-port="2" to-layer="51" to-port="0" /> |
|
<edge from-layer="51" from-port="1" to-layer="52" to-port="0" /> |
|
<edge from-layer="52" from-port="2" to-layer="276" to-port="1" /> |
|
<edge from-layer="52" from-port="2" to-layer="85" to-port="1" /> |
|
<edge from-layer="52" from-port="2" to-layer="300" to-port="1" /> |
|
<edge from-layer="52" from-port="2" to-layer="53" to-port="1" /> |
|
<edge from-layer="53" from-port="2" to-layer="69" to-port="0" /> |
|
<edge from-layer="54" from-port="0" to-layer="58" to-port="1" /> |
|
<edge from-layer="55" from-port="0" to-layer="58" to-port="2" /> |
|
<edge from-layer="56" from-port="0" to-layer="58" to-port="3" /> |
|
<edge from-layer="57" from-port="0" to-layer="280" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="304" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="310" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="185" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="64" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="190" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="89" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="58" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="95" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="211" to-port="4" /> |
|
<edge from-layer="57" from-port="0" to-layer="286" to-port="4" /> |
|
<edge from-layer="58" from-port="5" to-layer="60" to-port="0" /> |
|
<edge from-layer="59" from-port="0" to-layer="60" to-port="1" /> |
|
<edge from-layer="60" from-port="2" to-layer="65" to-port="0" /> |
|
<edge from-layer="61" from-port="0" to-layer="64" to-port="1" /> |
|
<edge from-layer="62" from-port="0" to-layer="64" to-port="2" /> |
|
<edge from-layer="63" from-port="0" to-layer="64" to-port="3" /> |
|
<edge from-layer="64" from-port="5" to-layer="65" to-port="1" /> |
|
<edge from-layer="65" from-port="2" to-layer="68" to-port="0" /> |
|
<edge from-layer="66" from-port="1" to-layer="67" to-port="0" /> |
|
<edge from-layer="67" from-port="2" to-layer="312" to-port="1" /> |
|
<edge from-layer="67" from-port="2" to-layer="288" to-port="1" /> |
|
<edge from-layer="67" from-port="2" to-layer="97" to-port="1" /> |
|
<edge from-layer="67" from-port="2" to-layer="68" to-port="1" /> |
|
<edge from-layer="68" from-port="2" to-layer="69" to-port="1" /> |
|
<edge from-layer="69" from-port="2" to-layer="212" to-port="0" /> |
|
<edge from-layer="70" from-port="0" to-layer="75" to-port="0" /> |
|
<edge from-layer="71" from-port="0" to-layer="74" to-port="1" /> |
|
<edge from-layer="72" from-port="0" to-layer="74" to-port="2" /> |
|
<edge from-layer="73" from-port="0" to-layer="74" to-port="3" /> |
|
<edge from-layer="74" from-port="4" to-layer="75" to-port="1" /> |
|
<edge from-layer="75" from-port="2" to-layer="76" to-port="0" /> |
|
<edge from-layer="76" from-port="1" to-layer="78" to-port="0" /> |
|
<edge from-layer="77" from-port="0" to-layer="78" to-port="2" /> |
|
<edge from-layer="78" from-port="3" to-layer="155" to-port="0" /> |
|
<edge from-layer="78" from-port="3" to-layer="99" to-port="0" /> |
|
<edge from-layer="79" from-port="0" to-layer="80" to-port="1" /> |
|
<edge from-layer="80" from-port="2" to-layer="82" to-port="0" /> |
|
<edge from-layer="81" from-port="0" to-layer="82" to-port="1" /> |
|
<edge from-layer="82" from-port="2" to-layer="84" to-port="0" /> |
|
<edge from-layer="83" from-port="0" to-layer="84" to-port="1" /> |
|
<edge from-layer="84" from-port="2" to-layer="85" to-port="0" /> |
|
<edge from-layer="84" from-port="2" to-layer="89" to-port="0" /> |
|
<edge from-layer="84" from-port="2" to-layer="95" to-port="0" /> |
|
<edge from-layer="85" from-port="2" to-layer="98" to-port="0" /> |
|
<edge from-layer="86" from-port="0" to-layer="89" to-port="1" /> |
|
<edge from-layer="87" from-port="0" to-layer="89" to-port="2" /> |
|
<edge from-layer="88" from-port="0" to-layer="89" to-port="3" /> |
|
<edge from-layer="89" from-port="5" to-layer="91" to-port="0" /> |
|
<edge from-layer="90" from-port="0" to-layer="91" to-port="1" /> |
|
<edge from-layer="91" from-port="2" to-layer="96" to-port="0" /> |
|
<edge from-layer="92" from-port="0" to-layer="95" to-port="1" /> |
|
<edge from-layer="93" from-port="0" to-layer="95" to-port="2" /> |
|
<edge from-layer="94" from-port="0" to-layer="95" to-port="3" /> |
|
<edge from-layer="95" from-port="5" to-layer="96" to-port="1" /> |
|
<edge from-layer="96" from-port="2" to-layer="97" to-port="0" /> |
|
<edge from-layer="97" from-port="2" to-layer="98" to-port="1" /> |
|
<edge from-layer="98" from-port="2" to-layer="99" to-port="1" /> |
|
<edge from-layer="99" from-port="2" to-layer="293" to-port="0" /> |
|
<edge from-layer="99" from-port="2" to-layer="212" to-port="1" /> |
|
<edge from-layer="100" from-port="0" to-layer="105" to-port="0" /> |
|
<edge from-layer="101" from-port="0" to-layer="104" to-port="1" /> |
|
<edge from-layer="102" from-port="0" to-layer="104" to-port="2" /> |
|
<edge from-layer="103" from-port="0" to-layer="104" to-port="3" /> |
|
<edge from-layer="104" from-port="4" to-layer="105" to-port="1" /> |
|
<edge from-layer="105" from-port="2" to-layer="106" to-port="0" /> |
|
<edge from-layer="106" from-port="1" to-layer="108" to-port="0" /> |
|
<edge from-layer="107" from-port="0" to-layer="108" to-port="2" /> |
|
<edge from-layer="108" from-port="3" to-layer="115" to-port="0" /> |
|
<edge from-layer="109" from-port="0" to-layer="110" to-port="1" /> |
|
<edge from-layer="110" from-port="2" to-layer="112" to-port="0" /> |
|
<edge from-layer="111" from-port="0" to-layer="112" to-port="1" /> |
|
<edge from-layer="112" from-port="2" to-layer="114" to-port="0" /> |
|
<edge from-layer="113" from-port="0" to-layer="114" to-port="1" /> |
|
<edge from-layer="114" from-port="2" to-layer="115" to-port="1" /> |
|
<edge from-layer="115" from-port="2" to-layer="292" to-port="0" /> |
|
<edge from-layer="115" from-port="2" to-layer="212" to-port="2" /> |
|
<edge from-layer="116" from-port="0" to-layer="139" to-port="1" /> |
|
<edge from-layer="116" from-port="0" to-layer="138" to-port="0" /> |
|
<edge from-layer="117" from-port="0" to-layer="132" to-port="0" /> |
|
<edge from-layer="118" from-port="0" to-layer="131" to-port="0" /> |
|
<edge from-layer="119" from-port="0" to-layer="121" to-port="1" /> |
|
<edge from-layer="120" from-port="0" to-layer="121" to-port="2" /> |
|
<edge from-layer="121" from-port="3" to-layer="159" to-port="1" /> |
|
<edge from-layer="121" from-port="3" to-layer="123" to-port="0" /> |
|
<edge from-layer="122" from-port="0" to-layer="123" to-port="1" /> |
|
<edge from-layer="123" from-port="2" to-layer="130" to-port="0" /> |
|
<edge from-layer="123" from-port="2" to-layer="209" to-port="1" /> |
|
<edge from-layer="124" from-port="1" to-layer="127" to-port="0" /> |
|
<edge from-layer="125" from-port="0" to-layer="127" to-port="1" /> |
|
<edge from-layer="126" from-port="0" to-layer="127" to-port="2" /> |
|
<edge from-layer="127" from-port="3" to-layer="129" to-port="0" /> |
|
<edge from-layer="127" from-port="3" to-layer="152" to-port="1" /> |
|
<edge from-layer="128" from-port="0" to-layer="129" to-port="1" /> |
|
<edge from-layer="129" from-port="2" to-layer="185" to-port="2" /> |
|
<edge from-layer="129" from-port="2" to-layer="190" to-port="2" /> |
|
<edge from-layer="129" from-port="2" to-layer="130" to-port="1" /> |
|
<edge from-layer="130" from-port="2" to-layer="131" to-port="1" /> |
|
<edge from-layer="131" from-port="2" to-layer="132" to-port="1" /> |
|
<edge from-layer="132" from-port="2" to-layer="149" to-port="1" /> |
|
<edge from-layer="132" from-port="2" to-layer="133" to-port="0" /> |
|
<edge from-layer="133" from-port="1" to-layer="136" to-port="0" /> |
|
<edge from-layer="133" from-port="1" to-layer="143" to-port="0" /> |
|
<edge from-layer="134" from-port="0" to-layer="136" to-port="1" /> |
|
<edge from-layer="135" from-port="0" to-layer="136" to-port="2" /> |
|
<edge from-layer="136" from-port="3" to-layer="138" to-port="1" /> |
|
<edge from-layer="137" from-port="0" to-layer="146" to-port="1" /> |
|
<edge from-layer="137" from-port="0" to-layer="138" to-port="2" /> |
|
<edge from-layer="137" from-port="0" to-layer="145" to-port="2" /> |
|
<edge from-layer="138" from-port="3" to-layer="139" to-port="0" /> |
|
<edge from-layer="139" from-port="2" to-layer="147" to-port="0" /> |
|
<edge from-layer="140" from-port="0" to-layer="144" to-port="1" /> |
|
<edge from-layer="140" from-port="0" to-layer="145" to-port="0" /> |
|
<edge from-layer="141" from-port="0" to-layer="143" to-port="1" /> |
|
<edge from-layer="142" from-port="0" to-layer="143" to-port="2" /> |
|
<edge from-layer="143" from-port="3" to-layer="144" to-port="0" /> |
|
<edge from-layer="144" from-port="2" to-layer="145" to-port="1" /> |
|
<edge from-layer="145" from-port="3" to-layer="146" to-port="0" /> |
|
<edge from-layer="146" from-port="2" to-layer="147" to-port="1" /> |
|
<edge from-layer="147" from-port="2" to-layer="149" to-port="0" /> |
|
<edge from-layer="148" from-port="0" to-layer="149" to-port="2" /> |
|
<edge from-layer="149" from-port="3" to-layer="166" to-port="0" /> |
|
<edge from-layer="150" from-port="0" to-layer="152" to-port="0" /> |
|
<edge from-layer="151" from-port="0" to-layer="152" to-port="2" /> |
|
<edge from-layer="152" from-port="3" to-layer="153" to-port="0" /> |
|
<edge from-layer="153" from-port="1" to-layer="154" to-port="0" /> |
|
<edge from-layer="154" from-port="1" to-layer="164" to-port="0" /> |
|
<edge from-layer="155" from-port="1" to-layer="158" to-port="0" /> |
|
<edge from-layer="156" from-port="0" to-layer="158" to-port="1" /> |
|
<edge from-layer="157" from-port="0" to-layer="158" to-port="2" /> |
|
<edge from-layer="158" from-port="3" to-layer="159" to-port="0" /> |
|
<edge from-layer="158" from-port="3" to-layer="161" to-port="0" /> |
|
<edge from-layer="158" from-port="3" to-layer="208" to-port="0" /> |
|
<edge from-layer="159" from-port="2" to-layer="161" to-port="1" /> |
|
<edge from-layer="160" from-port="0" to-layer="161" to-port="2" /> |
|
<edge from-layer="161" from-port="3" to-layer="163" to-port="0" /> |
|
<edge from-layer="162" from-port="0" to-layer="163" to-port="1" /> |
|
<edge from-layer="163" from-port="2" to-layer="164" to-port="1" /> |
|
<edge from-layer="164" from-port="2" to-layer="165" to-port="0" /> |
|
<edge from-layer="165" from-port="1" to-layer="166" to-port="1" /> |
|
<edge from-layer="166" from-port="2" to-layer="168" to-port="0" /> |
|
<edge from-layer="167" from-port="0" to-layer="168" to-port="1" /> |
|
<edge from-layer="168" from-port="2" to-layer="169" to-port="0" /> |
|
<edge from-layer="169" from-port="2" to-layer="174" to-port="0" /> |
|
<edge from-layer="170" from-port="0" to-layer="173" to-port="1" /> |
|
<edge from-layer="171" from-port="0" to-layer="173" to-port="2" /> |
|
<edge from-layer="172" from-port="0" to-layer="173" to-port="3" /> |
|
<edge from-layer="173" from-port="4" to-layer="174" to-port="1" /> |
|
<edge from-layer="174" from-port="2" to-layer="190" to-port="0" /> |
|
<edge from-layer="174" from-port="2" to-layer="178" to-port="0" /> |
|
<edge from-layer="174" from-port="2" to-layer="176" to-port="0" /> |
|
<edge from-layer="175" from-port="0" to-layer="176" to-port="1" /> |
|
<edge from-layer="176" from-port="2" to-layer="204" to-port="0" /> |
|
<edge from-layer="177" from-port="0" to-layer="181" to-port="0" /> |
|
<edge from-layer="177" from-port="0" to-layer="179" to-port="1" /> |
|
<edge from-layer="178" from-port="1" to-layer="182" to-port="1" /> |
|
<edge from-layer="178" from-port="1" to-layer="179" to-port="0" /> |
|
<edge from-layer="178" from-port="1" to-layer="205" to-port="1" /> |
|
<edge from-layer="179" from-port="2" to-layer="181" to-port="1" /> |
|
<edge from-layer="180" from-port="0" to-layer="181" to-port="2" /> |
|
<edge from-layer="181" from-port="3" to-layer="182" to-port="0" /> |
|
<edge from-layer="182" from-port="2" to-layer="185" to-port="0" /> |
|
<edge from-layer="183" from-port="0" to-layer="185" to-port="1" /> |
|
<edge from-layer="184" from-port="0" to-layer="185" to-port="3" /> |
|
<edge from-layer="185" from-port="5" to-layer="187" to-port="0" /> |
|
<edge from-layer="186" from-port="0" to-layer="187" to-port="1" /> |
|
<edge from-layer="187" from-port="2" to-layer="204" to-port="1" /> |
|
<edge from-layer="188" from-port="0" to-layer="190" to-port="1" /> |
|
<edge from-layer="189" from-port="0" to-layer="190" to-port="3" /> |
|
<edge from-layer="190" from-port="5" to-layer="195" to-port="0" /> |
|
<edge from-layer="190" from-port="5" to-layer="200" to-port="0" /> |
|
<edge from-layer="190" from-port="5" to-layer="199" to-port="2" /> |
|
<edge from-layer="191" from-port="2" to-layer="193" to-port="0" /> |
|
<edge from-layer="192" from-port="0" to-layer="193" to-port="1" /> |
|
<edge from-layer="193" from-port="2" to-layer="194" to-port="0" /> |
|
<edge from-layer="194" from-port="1" to-layer="195" to-port="1" /> |
|
<edge from-layer="195" from-port="2" to-layer="197" to-port="0" /> |
|
<edge from-layer="196" from-port="0" to-layer="197" to-port="1" /> |
|
<edge from-layer="197" from-port="2" to-layer="199" to-port="0" /> |
|
<edge from-layer="198" from-port="0" to-layer="199" to-port="1" /> |
|
<edge from-layer="199" from-port="3" to-layer="201" to-port="0" /> |
|
<edge from-layer="200" from-port="1" to-layer="201" to-port="1" /> |
|
<edge from-layer="201" from-port="2" to-layer="203" to-port="0" /> |
|
<edge from-layer="202" from-port="0" to-layer="203" to-port="1" /> |
|
<edge from-layer="203" from-port="2" to-layer="204" to-port="2" /> |
|
<edge from-layer="204" from-port="3" to-layer="205" to-port="0" /> |
|
<edge from-layer="205" from-port="2" to-layer="211" to-port="0" /> |
|
<edge from-layer="206" from-port="0" to-layer="211" to-port="1" /> |
|
<edge from-layer="207" from-port="0" to-layer="208" to-port="1" /> |
|
<edge from-layer="208" from-port="2" to-layer="209" to-port="0" /> |
|
<edge from-layer="209" from-port="2" to-layer="211" to-port="2" /> |
|
<edge from-layer="210" from-port="0" to-layer="211" to-port="3" /> |
|
<edge from-layer="211" from-port="5" to-layer="314" to-port="3" /> |
|
<edge from-layer="211" from-port="5" to-layer="212" to-port="3" /> |
|
<edge from-layer="212" from-port="4" to-layer="214" to-port="0" /> |
|
<edge from-layer="213" from-port="0" to-layer="214" to-port="1" /> |
|
<edge from-layer="214" from-port="2" to-layer="220" to-port="0" /> |
|
<edge from-layer="215" from-port="0" to-layer="217" to-port="1" /> |
|
<edge from-layer="216" from-port="0" to-layer="217" to-port="2" /> |
|
<edge from-layer="217" from-port="3" to-layer="219" to-port="0" /> |
|
<edge from-layer="218" from-port="0" to-layer="219" to-port="1" /> |
|
<edge from-layer="219" from-port="2" to-layer="317" to-port="1" /> |
|
<edge from-layer="219" from-port="2" to-layer="220" to-port="1" /> |
|
<edge from-layer="220" from-port="2" to-layer="222" to-port="0" /> |
|
<edge from-layer="221" from-port="0" to-layer="222" to-port="1" /> |
|
<edge from-layer="222" from-port="2" to-layer="223" to-port="1" /> |
|
<edge from-layer="223" from-port="2" to-layer="226" to-port="0" /> |
|
<edge from-layer="223" from-port="2" to-layer="242" to-port="0" /> |
|
<edge from-layer="223" from-port="2" to-layer="233" to-port="0" /> |
|
<edge from-layer="224" from-port="0" to-layer="232" to-port="0" /> |
|
<edge from-layer="225" from-port="0" to-layer="226" to-port="1" /> |
|
<edge from-layer="226" from-port="2" to-layer="228" to-port="0" /> |
|
<edge from-layer="227" from-port="0" to-layer="228" to-port="1" /> |
|
<edge from-layer="228" from-port="2" to-layer="230" to-port="0" /> |
|
<edge from-layer="229" from-port="0" to-layer="230" to-port="1" /> |
|
<edge from-layer="230" from-port="2" to-layer="231" to-port="0" /> |
|
<edge from-layer="231" from-port="1" to-layer="232" to-port="1" /> |
|
<edge from-layer="232" from-port="2" to-layer="233" to-port="1" /> |
|
<edge from-layer="233" from-port="2" to-layer="235" to-port="0" /> |
|
<edge from-layer="233" from-port="2" to-layer="238" to-port="0" /> |
|
<edge from-layer="234" from-port="0" to-layer="235" to-port="1" /> |
|
<edge from-layer="235" from-port="2" to-layer="236" to-port="0" /> |
|
<edge from-layer="236" from-port="1" to-layer="239" to-port="0" /> |
|
<edge from-layer="237" from-port="0" to-layer="238" to-port="1" /> |
|
<edge from-layer="238" from-port="2" to-layer="239" to-port="1" /> |
|
<edge from-layer="239" from-port="2" to-layer="241" to-port="0" /> |
|
<edge from-layer="240" from-port="0" to-layer="241" to-port="1" /> |
|
<edge from-layer="241" from-port="2" to-layer="242" to-port="1" /> |
|
<edge from-layer="242" from-port="2" to-layer="252" to-port="0" /> |
|
<edge from-layer="242" from-port="2" to-layer="245" to-port="0" /> |
|
<edge from-layer="242" from-port="2" to-layer="320" to-port="0" /> |
|
<edge from-layer="243" from-port="0" to-layer="251" to-port="0" /> |
|
<edge from-layer="244" from-port="0" to-layer="245" to-port="1" /> |
|
<edge from-layer="245" from-port="2" to-layer="247" to-port="0" /> |
|
<edge from-layer="246" from-port="0" to-layer="247" to-port="1" /> |
|
<edge from-layer="247" from-port="2" to-layer="249" to-port="0" /> |
|
<edge from-layer="248" from-port="0" to-layer="249" to-port="1" /> |
|
<edge from-layer="249" from-port="2" to-layer="250" to-port="0" /> |
|
<edge from-layer="250" from-port="1" to-layer="251" to-port="1" /> |
|
<edge from-layer="251" from-port="2" to-layer="252" to-port="1" /> |
|
<edge from-layer="252" from-port="2" to-layer="254" to-port="0" /> |
|
<edge from-layer="252" from-port="2" to-layer="271" to-port="0" /> |
|
<edge from-layer="252" from-port="2" to-layer="295" to-port="0" /> |
|
<edge from-layer="253" from-port="0" to-layer="254" to-port="1" /> |
|
<edge from-layer="254" from-port="2" to-layer="256" to-port="0" /> |
|
<edge from-layer="255" from-port="0" to-layer="256" to-port="1" /> |
|
<edge from-layer="256" from-port="2" to-layer="258" to-port="0" /> |
|
<edge from-layer="257" from-port="0" to-layer="258" to-port="1" /> |
|
<edge from-layer="258" from-port="2" to-layer="259" to-port="1" /> |
|
<edge from-layer="259" from-port="2" to-layer="314" to-port="2" /> |
|
<edge from-layer="259" from-port="2" to-layer="260" to-port="0" /> |
|
<edge from-layer="261" from-port="0" to-layer="266" to-port="0" /> |
|
<edge from-layer="262" from-port="0" to-layer="265" to-port="1" /> |
|
<edge from-layer="263" from-port="0" to-layer="265" to-port="2" /> |
|
<edge from-layer="264" from-port="0" to-layer="265" to-port="3" /> |
|
<edge from-layer="265" from-port="4" to-layer="266" to-port="1" /> |
|
<edge from-layer="266" from-port="2" to-layer="267" to-port="0" /> |
|
<edge from-layer="267" from-port="1" to-layer="269" to-port="0" /> |
|
<edge from-layer="268" from-port="0" to-layer="269" to-port="2" /> |
|
<edge from-layer="269" from-port="3" to-layer="290" to-port="0" /> |
|
<edge from-layer="270" from-port="0" to-layer="271" to-port="1" /> |
|
<edge from-layer="271" from-port="2" to-layer="273" to-port="0" /> |
|
<edge from-layer="272" from-port="0" to-layer="273" to-port="1" /> |
|
<edge from-layer="273" from-port="2" to-layer="275" to-port="0" /> |
|
<edge from-layer="274" from-port="0" to-layer="275" to-port="1" /> |
|
<edge from-layer="275" from-port="2" to-layer="286" to-port="0" /> |
|
<edge from-layer="275" from-port="2" to-layer="280" to-port="0" /> |
|
<edge from-layer="275" from-port="2" to-layer="276" to-port="0" /> |
|
<edge from-layer="276" from-port="2" to-layer="289" to-port="0" /> |
|
<edge from-layer="277" from-port="0" to-layer="280" to-port="1" /> |
|
<edge from-layer="278" from-port="0" to-layer="280" to-port="2" /> |
|
<edge from-layer="279" from-port="0" to-layer="280" to-port="3" /> |
|
<edge from-layer="280" from-port="5" to-layer="282" to-port="0" /> |
|
<edge from-layer="281" from-port="0" to-layer="282" to-port="1" /> |
|
<edge from-layer="282" from-port="2" to-layer="287" to-port="0" /> |
|
<edge from-layer="283" from-port="0" to-layer="286" to-port="1" /> |
|
<edge from-layer="284" from-port="0" to-layer="286" to-port="2" /> |
|
<edge from-layer="285" from-port="0" to-layer="286" to-port="3" /> |
|
<edge from-layer="286" from-port="5" to-layer="287" to-port="1" /> |
|
<edge from-layer="287" from-port="2" to-layer="288" to-port="0" /> |
|
<edge from-layer="288" from-port="2" to-layer="289" to-port="1" /> |
|
<edge from-layer="289" from-port="2" to-layer="290" to-port="1" /> |
|
<edge from-layer="290" from-port="2" to-layer="291" to-port="0" /> |
|
<edge from-layer="290" from-port="2" to-layer="314" to-port="1" /> |
|
<edge from-layer="294" from-port="0" to-layer="295" to-port="1" /> |
|
<edge from-layer="295" from-port="2" to-layer="297" to-port="0" /> |
|
<edge from-layer="296" from-port="0" to-layer="297" to-port="1" /> |
|
<edge from-layer="297" from-port="2" to-layer="299" to-port="0" /> |
|
<edge from-layer="298" from-port="0" to-layer="299" to-port="1" /> |
|
<edge from-layer="299" from-port="2" to-layer="310" to-port="0" /> |
|
<edge from-layer="299" from-port="2" to-layer="300" to-port="0" /> |
|
<edge from-layer="299" from-port="2" to-layer="304" to-port="0" /> |
|
<edge from-layer="300" from-port="2" to-layer="313" to-port="0" /> |
|
<edge from-layer="301" from-port="0" to-layer="304" to-port="1" /> |
|
<edge from-layer="302" from-port="0" to-layer="304" to-port="2" /> |
|
<edge from-layer="303" from-port="0" to-layer="304" to-port="3" /> |
|
<edge from-layer="304" from-port="5" to-layer="306" to-port="0" /> |
|
<edge from-layer="305" from-port="0" to-layer="306" to-port="1" /> |
|
<edge from-layer="306" from-port="2" to-layer="311" to-port="0" /> |
|
<edge from-layer="307" from-port="0" to-layer="310" to-port="1" /> |
|
<edge from-layer="308" from-port="0" to-layer="310" to-port="2" /> |
|
<edge from-layer="309" from-port="0" to-layer="310" to-port="3" /> |
|
<edge from-layer="310" from-port="5" to-layer="311" to-port="1" /> |
|
<edge from-layer="311" from-port="2" to-layer="312" to-port="0" /> |
|
<edge from-layer="312" from-port="2" to-layer="313" to-port="1" /> |
|
<edge from-layer="313" from-port="2" to-layer="314" to-port="0" /> |
|
<edge from-layer="314" from-port="4" to-layer="316" to-port="0" /> |
|
<edge from-layer="315" from-port="0" to-layer="316" to-port="1" /> |
|
<edge from-layer="316" from-port="2" to-layer="317" to-port="0" /> |
|
<edge from-layer="317" from-port="2" to-layer="319" to-port="0" /> |
|
<edge from-layer="318" from-port="0" to-layer="319" to-port="1" /> |
|
<edge from-layer="319" from-port="2" to-layer="320" to-port="1" /> |
|
<edge from-layer="320" from-port="2" to-layer="323" to-port="0" /> |
|
<edge from-layer="320" from-port="2" to-layer="339" to-port="0" /> |
|
<edge from-layer="320" from-port="2" to-layer="330" to-port="0" /> |
|
<edge from-layer="321" from-port="0" to-layer="329" to-port="0" /> |
|
<edge from-layer="322" from-port="0" to-layer="323" to-port="1" /> |
|
<edge from-layer="323" from-port="2" to-layer="325" to-port="0" /> |
|
<edge from-layer="324" from-port="0" to-layer="325" to-port="1" /> |
|
<edge from-layer="325" from-port="2" to-layer="327" to-port="0" /> |
|
<edge from-layer="326" from-port="0" to-layer="327" to-port="1" /> |
|
<edge from-layer="327" from-port="2" to-layer="328" to-port="0" /> |
|
<edge from-layer="328" from-port="1" to-layer="329" to-port="1" /> |
|
<edge from-layer="329" from-port="2" to-layer="330" to-port="1" /> |
|
<edge from-layer="330" from-port="2" to-layer="332" to-port="0" /> |
|
<edge from-layer="330" from-port="2" to-layer="335" to-port="0" /> |
|
<edge from-layer="331" from-port="0" to-layer="332" to-port="1" /> |
|
<edge from-layer="332" from-port="2" to-layer="333" to-port="0" /> |
|
<edge from-layer="333" from-port="1" to-layer="336" to-port="0" /> |
|
<edge from-layer="334" from-port="0" to-layer="335" to-port="1" /> |
|
<edge from-layer="335" from-port="2" to-layer="336" to-port="1" /> |
|
<edge from-layer="336" from-port="2" to-layer="338" to-port="0" /> |
|
<edge from-layer="337" from-port="0" to-layer="338" to-port="1" /> |
|
<edge from-layer="338" from-port="2" to-layer="339" to-port="1" /> |
|
<edge from-layer="339" from-port="2" to-layer="342" to-port="0" /> |
|
<edge from-layer="339" from-port="2" to-layer="349" to-port="0" /> |
|
<edge from-layer="340" from-port="0" to-layer="348" to-port="0" /> |
|
<edge from-layer="341" from-port="0" to-layer="342" to-port="1" /> |
|
<edge from-layer="342" from-port="2" to-layer="344" to-port="0" /> |
|
<edge from-layer="343" from-port="0" to-layer="344" to-port="1" /> |
|
<edge from-layer="344" from-port="2" to-layer="346" to-port="0" /> |
|
<edge from-layer="345" from-port="0" to-layer="346" to-port="1" /> |
|
<edge from-layer="346" from-port="2" to-layer="347" to-port="0" /> |
|
<edge from-layer="347" from-port="1" to-layer="348" to-port="1" /> |
|
<edge from-layer="348" from-port="2" to-layer="349" to-port="1" /> |
|
<edge from-layer="349" from-port="2" to-layer="351" to-port="0" /> |
|
<edge from-layer="350" from-port="0" to-layer="351" to-port="1" /> |
|
<edge from-layer="351" from-port="2" to-layer="352" to-port="0" /> |
|
</edges> |
|
<rt_info> |
|
<Runtime_version value="2024.5.0-17202-a7ccc5e0efc" /> |
|
<conversion_parameters> |
|
<framework value="pytorch" /> |
|
<is_python_object value="True" /> |
|
</conversion_parameters> |
|
<optimum> |
|
<optimum_intel_version value="1.20.0.dev0+7cc52a7" /> |
|
<optimum_version value="1.23.2" /> |
|
<pytorch_version value="2.5.1" /> |
|
<transformers_version value="4.45.2" /> |
|
</optimum> |
|
</rt_info> |
|
</net> |
|
|