|
<?xml version="1.0"?> |
|
<net name="main_graph" version="11"> |
|
<layers> |
|
<layer id="5" name="input_ids" type="Parameter" version="opset1"> |
|
<data shape="?,?" element_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="input_ids" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="input_ids"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="4" name="past_key_values.0.key" type="Parameter" version="opset1"> |
|
<data shape="?,2,?,4" element_type="f32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="past_key_values.0.key" /> |
|
<attribute name="old_api_map_element_type" version="0" value="f16" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP32" names="past_key_values.0.key"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="3" name="past_key_values.0.value" type="Parameter" version="opset1"> |
|
<data shape="?,2,?,4" element_type="f32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="past_key_values.0.value" /> |
|
<attribute name="old_api_map_element_type" version="0" value="f16" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP32" names="past_key_values.0.value"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="2" name="past_key_values.1.key" type="Parameter" version="opset1"> |
|
<data shape="?,2,?,4" element_type="f32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="past_key_values.1.key" /> |
|
<attribute name="old_api_map_element_type" version="0" value="f16" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP32" names="past_key_values.1.key"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="1" name="past_key_values.1.value" type="Parameter" version="opset1"> |
|
<data shape="?,2,?,4" element_type="f32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="past_key_values.1.value" /> |
|
<attribute name="old_api_map_element_type" version="0" value="f16" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP32" names="past_key_values.1.value"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="0" name="attention_mask" type="Parameter" version="opset1"> |
|
<data shape="?,?" element_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Cast, attention_mask" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Cast_output_0,attention_mask"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="6" name="/transformer/Constant_39" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_39" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_39_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="7" name="/transformer/Unsqueeze_13" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_13" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_13_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="8" name="/transformer/Constant_40" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_40" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_40_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="9" name="/transformer/Unsqueeze_14" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_14" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_14_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="10" name="/transformer/Cast_4" type="Convert" version="opset1"> |
|
<data destination_type="boolean" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Cast_4" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="BOOL" names="/transformer/Cast_4_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="11" name="/transformer/Not" type="LogicalNot" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Not" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="BOOL" names="/transformer/Not_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="12" name="/transformer/Shape_11" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Shape_11, /transformer/Shape_12" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/Shape_11_output_0,/transformer/Shape_12_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="13" name="Constant_914323" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_37, /transformer/Constant_41, /transformer/Gather_5, /transformer/Unsqueeze_15, Constant_898507" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="14" name="Constant_898507" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898507" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="15" name="/transformer/Gather_5" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_37, /transformer/Constant_41, /transformer/Gather_5, /transformer/Unsqueeze_15, Constant_898507" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Gather_5_output_0,/transformer/Unsqueeze_15_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="16" name="/transformer/Constant_42" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_42" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_42_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="17" name="/transformer/Shape" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Shape, /transformer/Shape_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/Shape_1_output_0,/transformer/Shape_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="18" name="/transformer/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_1_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="19" name="Constant_898056" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898056" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="20" name="/transformer/Gather_1" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Cast_1, /transformer/Constant_1, /transformer/Gather_1, Constant_898056" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Cast_1_output_0,/transformer/Gather_1_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="21" name="/transformer/Constant_43" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_43" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_43_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="22" name="/transformer/Unsqueeze_16" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_33, /transformer/Constant_43, /transformer/Unsqueeze, /transformer/Unsqueeze_11, /transformer/Unsqueeze_16, Constant_12" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_11_output_0,/transformer/Unsqueeze_16_output_0,/transformer/Unsqueeze_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="23" name="Constant_914328" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_38, /transformer/Constant_44, /transformer/Gather_6, /transformer/Unsqueeze_17, Constant_898511" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="24" name="Constant_898511" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898511" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="25" name="/transformer/Gather_6" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_38, /transformer/Constant_44, /transformer/Gather_6, /transformer/Unsqueeze_17, Constant_898511" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Gather_6_output_0,/transformer/Unsqueeze_17_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="26" name="/transformer/Concat_4" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Concat_4, /transformer/Constant_42" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64" names="/transformer/Concat_4_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="27" name="Constant_901734" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Reshape_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="28" name="/transformer/Reshape_3" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Reshape_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Reshape_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="29" name="/transformer/Mul_3" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="32" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_4, /transformer/Constant_46, /transformer/Mul_3, /transformer/Shape_13, Constant_898533" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Mul_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="30" name="/transformer/Equal_3" type="Equal" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_4, /transformer/Constant_46, /transformer/Equal_3, /transformer/Mul_3, /transformer/Shape_13, Constant_898533" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Equal_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="31" name="/transformer/ConstantOfShape_4" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="64" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_4, /transformer/Shape_13, Constant_898533" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/ConstantOfShape_4_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="32" name="/transformer/Where_3" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_4, /transformer/Shape_13, /transformer/Where_3, Constant_898533" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Where_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="33" name="/transformer/Expand_4" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Expand_4" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Expand_4_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="34" name="Constant_898072" type="Const" version="opset1"> |
|
<data element_type="boolean" shape="" offset="96" size="1" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898072" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="BOOL" /> |
|
</output> |
|
</layer> |
|
<layer id="35" name="/transformer/Shape_2" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Shape_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/Shape_2_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="36" name="/transformer/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_2_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="37" name="Constant_898062" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898062" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="38" name="/transformer/Gather_2" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_2, /transformer/Gather_2, Constant_898062" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Gather_2_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="39" name="/transformer/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Add" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Add_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="40" name="/transformer/Constant_34" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_34" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_34_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="41" name="/transformer/Unsqueeze_12" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_34, /transformer/Unsqueeze_1, /transformer/Unsqueeze_12, Constant_14" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_12_output_0,/transformer/Unsqueeze_1_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="42" name="/transformer/Concat" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Concat" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Concat_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="43" name="/transformer/ConstantOfShape" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL" /> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/ConstantOfShape_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="44" name="/transformer/Constant_12" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_12" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_12_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="45" name="/transformer/Shape_4" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Shape_4, /transformer/Shape_5" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/Shape_4_output_0,/transformer/Shape_5_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="46" name="/transformer/Constant_11" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_11" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_11_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="47" name="Constant_898182" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898182" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="48" name="/transformer/Gather_3" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Cast_2, /transformer/Constant_11, /transformer/Gather_3, Constant_898182" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Cast_2_output_0,/transformer/Gather_3_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="49" name="/transformer/Constant_13" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_13" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_13_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="50" name="/transformer/Range_1" type="Range" version="opset4"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Range_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Range_1_output_0"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="51" name="/transformer/Constant_21" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="97" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_21" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_21_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="52" name="/transformer/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Reshape" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Reshape_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="53" name="/transformer/Constant_15" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_15" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_15_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="54" name="/transformer/Constant_14" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_14" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_14_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="55" name="Constant_898203" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898203" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="56" name="/transformer/Gather_4" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Cast_3, /transformer/Constant_14, /transformer/Gather_4, Constant_898203" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Cast_3_output_0,/transformer/Gather_4_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="57" name="/transformer/Constant_16" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_16" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_16_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="58" name="/transformer/Range_2" type="Range" version="opset4"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Range_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Range_2_output_0"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="59" name="/transformer/Constant_8" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_8" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_8_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="60" name="/transformer/Unsqueeze_4" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_8, /transformer/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_4_output_0,/transformer/Unsqueeze_5_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="61" name="/transformer/Constant_19" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="113" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_19_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="62" name="/transformer/Constant_20" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_20_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="63" name="/transformer/Slice_1" type="StridedSlice" version="opset1"> |
|
<data begin_mask="0" end_mask="0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64" names="/transformer/Slice_1_output_0"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="64" name="/transformer/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Add_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Add_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="65" name="/transformer/Shape_6" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Concat_2, /transformer/Shape_6" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/Concat_2_output_0,/transformer/Shape_6_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="66" name="/transformer/Mul" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="121" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_1, /transformer/Constant_22, /transformer/Mul, /transformer/Shape_7, Constant_898239" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Mul_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="67" name="/transformer/Equal" type="Equal" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_1, /transformer/Constant_22, /transformer/Equal, /transformer/Mul, /transformer/Shape_7, Constant_898239" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Equal_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="68" name="/transformer/ConstantOfShape_1" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="137" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_1, /transformer/Shape_7, Constant_898239" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/ConstantOfShape_1_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="69" name="/transformer/Where" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_1, /transformer/Shape_7, /transformer/Where, Constant_898239" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Where_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="70" name="/transformer/Expand_1" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Expand_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Expand_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="71" name="/transformer/Constant_23" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_23" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_23_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="72" name="/transformer/Unsqueeze_6" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_6" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_6_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="73" name="/transformer/Mul_1" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="121" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_2, /transformer/Constant_24, /transformer/Mul_1, /transformer/Shape_8, Constant_898294" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Mul_1_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="74" name="/transformer/Equal_1" type="Equal" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_2, /transformer/Constant_24, /transformer/Equal_1, /transformer/Mul_1, /transformer/Shape_8, Constant_898294" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Equal_1_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="75" name="/transformer/ConstantOfShape_2" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="137" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_2, /transformer/Shape_8, Constant_898294" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/ConstantOfShape_2_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="76" name="/transformer/Where_1" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_2, /transformer/Shape_8, /transformer/Where_1, Constant_898294" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Where_1_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="77" name="/transformer/Expand_2" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Expand_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Expand_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="78" name="/transformer/Constant_25" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_25" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_25_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="79" name="/transformer/Unsqueeze_7" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_7" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_7_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="80" name="/transformer/Concat_1" type="Concat" version="opset1"> |
|
<data axis="-1" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Concat_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Concat_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="81" name="/transformer/Constant_3" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_3_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="82" name="/transformer/Constant_4" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_4" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_4_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="83" name="/transformer/Range" type="Range" version="opset4"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Range" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Range_output_0"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="84" name="/transformer/Constant_5" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_5" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_5_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="85" name="/transformer/Unsqueeze_2" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="86" name="/transformer/Constant_6" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_6" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_6_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="87" name="/transformer/Unsqueeze_3" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Unsqueeze_3_output_0"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="88" name="/transformer/Less" type="Less" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Less" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Less_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="89" name="Constant_915162" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="153" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="90" name="Constant_915161" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="91" name="Constant_915160" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="92" name="ScatterUpdate_915163" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="93" name="Constant_915166" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="173" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="94" name="Constant_915169" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="137" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="95" name="/transformer/Slice" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 0" end_mask="1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Slice" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="BOOL" names="/transformer/Slice_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="96" name="/transformer/Shape_3" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Shape_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/Shape_3_output_0"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="97" name="/transformer/Expand" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Expand" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Expand_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="98" name="/transformer/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Reshape_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Reshape_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="99" name="/transformer/ScatterND" type="ScatterNDUpdate" version="opset4"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ScatterND" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
</port> |
|
<port id="2" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="BOOL" names="/transformer/ScatterND_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="100" name="/transformer/Constant_29" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_29" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_29_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="101" name="/transformer/Unsqueeze_8" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_8" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Unsqueeze_8_output_0"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="102" name="/transformer/Constant_30" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_30" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_30_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="103" name="/transformer/Unsqueeze_9" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Unsqueeze_9" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Unsqueeze_9_output_0"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="104" name="Constant_914333" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant, /transformer/Constant_31, /transformer/Gather, /transformer/Unsqueeze_10, Constant_898052" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="105" name="Constant_898052" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898052" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="106" name="/transformer/Gather" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant, /transformer/Constant_31, /transformer/Gather, /transformer/Unsqueeze_10, Constant_898052" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Gather_output_0,/transformer/Unsqueeze_10_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="107" name="/transformer/Constant_32" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="0" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Constant_32" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Constant_32_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="108" name="/transformer/Concat_3" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Concat_3, /transformer/Constant_32" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64" names="/transformer/Concat_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="109" name="Constant_901735" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Reshape_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="110" name="/transformer/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Reshape_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/Reshape_2_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="111" name="/transformer/Mul_2" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="32" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_3, /transformer/Constant_36, /transformer/Mul_2, /transformer/Shape_10, Constant_898390" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/Mul_2_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="112" name="/transformer/Equal_2" type="Equal" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_3, /transformer/Constant_36, /transformer/Equal_2, /transformer/Mul_2, /transformer/Shape_10, Constant_898390" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Equal_2_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="113" name="/transformer/ConstantOfShape_3" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="64" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_3, /transformer/Shape_10, Constant_898390" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/ConstantOfShape_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="114" name="/transformer/Where_2" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/ConstantOfShape_3, /transformer/Shape_10, /transformer/Where_2, Constant_898390" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/Where_2_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="115" name="/transformer/Expand_3" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Expand_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Expand_3_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="116" name="/transformer/Or" type="LogicalOr" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/Or, /transformer/blocks.0/attn/Cast, /transformer/blocks.1/attn/Cast" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="/transformer/Or_output_0,/transformer/blocks.0/attn/Cast_output_0,/transformer/blocks.1/attn/Cast_output_0"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="117" name="/transformer/blocks.0/attn/Constant_22" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="189" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_22" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP32" names="/transformer/blocks.0/attn/Constant_22_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="118" name="transformer.wte.weight_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="50432, 8" offset="193" size="806912" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="transformer.wte.weight" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="119" name="transformer.wte.weight" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="transformer.wte.weight" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="transformer.wte.weight"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="120" name="Constant_898058" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898058" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="121" name="/transformer/wte/Gather" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/wte/Gather" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="/transformer/wte/Gather_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="122" name="Constant_898593" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898593" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="123" name="/transformer/blocks.0/norm_1/Div" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/norm_1/Add, /transformer/blocks.0/norm_1/Div, /transformer/blocks.0/norm_1/Pow, /transformer/blocks.0/norm_1/ReduceMean, /transformer/blocks.0/norm_1/ReduceMean_1, /transformer/blocks.0/norm_1/Sqrt, /transformer/blocks.0/norm_1/Sub" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/norm_1/Div_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="124" name="Constant_917172_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1, 1, 8" offset="807105" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.0.norm_1.weight" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="125" name="Constant_917172" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.0.norm_1.weight" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="126" name="/transformer/blocks.0/norm_1/Mul" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/norm_1/Mul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/norm_1/Mul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="127" name="Transpose_916930_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="24, 8" offset="807121" size="384" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Wqkv/MatMul, onnx::MatMul_454" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="128" name="Transpose_916930" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Wqkv/MatMul, onnx::MatMul_454" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="129" name="/transformer/blocks.0/attn/Wqkv/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Wqkv/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Wqkv/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="130" name="Constant_915179" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="131" name="Constant_915180" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="132" name="Constant_915176" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="133" name="/transformer/blocks.0/attn/Shape_2" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Shape_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/blocks.0/attn/Shape_2_output_0"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="134" name="/transformer/blocks.0/attn/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_2_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="135" name="Constant_898616" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898616" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="136" name="/transformer/blocks.0/attn/Gather_2" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Gather_2, Constant_898616" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/blocks.0/attn/Gather_2_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="137" name="/transformer/blocks.0/attn/Constant_4" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_4" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_4_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="138" name="/transformer/blocks.0/attn/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Add, /transformer/blocks.0/attn/Constant_4" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.0/attn/Add_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="139" name="/transformer/blocks.0/attn/Constant_5" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="807529" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_5" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_5_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="140" name="/transformer/blocks.0/attn/Div" type="Divide" version="opset1"> |
|
<data auto_broadcast="numpy" m_pythondiv="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_5, /transformer/blocks.0/attn/Constant_6, /transformer/blocks.0/attn/Div, /transformer/blocks.0/attn/Mul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.0/attn/Div_output_0,/transformer/blocks.0/attn/Mul_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="141" name="Constant_915175" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="142" name="ScatterUpdate_915181" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="143" name="Constant_915184" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="144" name="/transformer/blocks.0/attn/Slice" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.0/attn/Slice_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="145" name="/transformer/blocks.0/attn/Shape" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Shape, /transformer/blocks.0/attn/Shape_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/blocks.0/attn/Shape_1_output_0,/transformer/blocks.0/attn/Shape_output_0"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="146" name="Constant_914360" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="807561" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Concat_5, /transformer/blocks.0/attn/Constant_23" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="147" name="Constant_914361" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Concat_5, /transformer/blocks.0/attn/Constant_23" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="148" name="Gather_914362" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Concat, /transformer/blocks.0/attn/Concat_1, /transformer/blocks.0/attn/Concat_2, /transformer/blocks.0/attn/Concat_5, /transformer/blocks.0/attn/Constant_10, /transformer/blocks.0/attn/Constant_11, /transformer/blocks.0/attn/Constant_12, /transformer/blocks.0/attn/Constant_13, /transformer/blocks.0/attn/Constant_14, /transformer/blocks.0/attn/Constant_23, /transformer/blocks.0/attn/Constant_9" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="149" name="/transformer/blocks.0/attn/Constant_9" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_9" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_9_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="150" name="/transformer/blocks.0/attn/Constant_10" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="807577" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_10" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_10_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="151" name="/transformer/blocks.0/attn/Concat" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Concat, /transformer/blocks.0/attn/Concat_1, /transformer/blocks.0/attn/Concat_2, /transformer/blocks.0/attn/Constant_10, /transformer/blocks.0/attn/Constant_11, /transformer/blocks.0/attn/Constant_12, /transformer/blocks.0/attn/Constant_13, /transformer/blocks.0/attn/Constant_14, /transformer/blocks.0/attn/Constant_9" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/blocks.0/attn/Concat_1_output_0,/transformer/blocks.0/attn/Concat_2_output_0,/transformer/blocks.0/attn/Concat_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="152" name="/transformer/blocks.0/attn/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Reshape" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Reshape_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="153" name="Constant_898818" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898818" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="154" name="/transformer/blocks.0/attn/Transpose" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Transpose" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Transpose_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="155" name="Constant_915232" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="156" name="Constant_915231" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="157" name="Constant_915230" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="158" name="ScatterUpdate_915233" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="159" name="Constant_915234" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="160" name="/transformer/blocks.0/attn/Constant_7" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_7" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_7_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="161" name="/transformer/blocks.0/attn/Mul_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_7, /transformer/blocks.0/attn/Mul_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.0/attn/Mul_1_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="162" name="ScatterUpdate_915235" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="163" name="Constant_915238" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="164" name="/transformer/blocks.0/attn/Slice_1" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.0/attn/Slice_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="165" name="/transformer/blocks.0/attn/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Reshape_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Reshape_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="166" name="Constant_898831" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898831" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="167" name="/transformer/blocks.0/attn/Transpose_1" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Transpose_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Transpose_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="168" name="present.0.key" type="Concat" version="opset1"> |
|
<data axis="2" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.0.key" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.0.key"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="169" name="Constant_917173_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1, 1, 1, 1" offset="807617" size="2" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_15" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="170" name="Constant_917173" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_15" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="171" name="Multiply_916962" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/MatMul, /transformer/blocks.0/attn/Mul_3, /transformer/blocks.0/attn/Transpose_3, present.0.key" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="172" name="/transformer/blocks.0/attn/Mul_3" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/MatMul, /transformer/blocks.0/attn/Mul_3, /transformer/blocks.0/attn/Transpose_3, present.0.key" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Mul_3_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="173" name="Constant_209_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="2, 1, 2048" offset="807619" size="8192" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_209" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>2048</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="174" name="Constant_209" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="Constant_209" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>2048</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="onnx::Slice_250"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>2048</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="175" name="Constant_915330" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="176" name="Constant_915329" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="177" name="/transformer/blocks.0/attn/Constant_17" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="815811" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_17" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_17_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="178" name="/transformer/blocks.0/attn/Shape_3" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Shape_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/blocks.0/attn/Shape_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="179" name="/transformer/blocks.0/attn/Constant_16" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_16" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_16_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="180" name="Constant_898855" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898855" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="181" name="/transformer/blocks.0/attn/Gather_3" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_16, /transformer/blocks.0/attn/Gather_3, Constant_898855" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/blocks.0/attn/Gather_3_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="182" name="/transformer/blocks.0/attn/Sub" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_17, /transformer/blocks.0/attn/Sub" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.0/attn/Sub_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="183" name="/transformer/blocks.0/attn/Constant_19" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_19" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_19_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="184" name="/transformer/blocks.0/attn/Unsqueeze_6" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_19, /transformer/blocks.0/attn/Unsqueeze_6" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.0/attn/Unsqueeze_6_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="185" name="Constant_915328" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="186" name="ScatterUpdate_915331" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Slice_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="187" name="Constant_915334" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="815819" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="188" name="Constant_915337" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="189" name="/transformer/blocks.0/attn/Slice_3" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Slice_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>2048</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.0/attn/Slice_3_output_0"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="190" name="/transformer/blocks.0/attn/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Add_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Add_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="191" name="/transformer/blocks.0/attn/Where" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Cast_1, /transformer/blocks.0/attn/Where" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32" /> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="/transformer/blocks.0/attn/Cast_1_output_0,/transformer/blocks.0/attn/Where_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="192" name="/transformer/blocks.0/attn/Softmax" type="SoftMax" version="opset8"> |
|
<data axis="-1" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Cast_2, /transformer/blocks.0/attn/Softmax" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="/transformer/blocks.0/attn/Cast_2_output_0,/transformer/blocks.0/attn/Softmax_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="193" name="Constant_915401" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="194" name="Constant_915400" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="195" name="Constant_915399" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="196" name="ScatterUpdate_915402" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="197" name="Constant_915403" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="198" name="/transformer/blocks.0/attn/Constant_8" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="807529" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_8" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_8_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="199" name="/transformer/blocks.0/attn/Mul_2" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_8, /transformer/blocks.0/attn/Mul_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.0/attn/Mul_2_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="200" name="ScatterUpdate_915404" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="201" name="Constant_915407" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="202" name="/transformer/blocks.0/attn/Slice_2" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_2, /transformer/blocks.0/attn/Slice_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.0/attn/Slice_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="203" name="/transformer/blocks.0/attn/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Reshape_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Reshape_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="204" name="Constant_898844" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898844" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="205" name="/transformer/blocks.0/attn/Transpose_2" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Transpose_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Transpose_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="206" name="present.0.value" type="Concat" version="opset1"> |
|
<data axis="2" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.0.value" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.0.value"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="207" name="/transformer/blocks.0/attn/MatMul_1" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="false" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/MatMul_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/MatMul_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="208" name="Constant_898934" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898934" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="209" name="/transformer/blocks.0/attn/Transpose_4" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Transpose_4" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Transpose_4_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="210" name="/transformer/blocks.0/attn/Constant_23" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Constant_23" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.0/attn/Constant_23_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="211" name="/transformer/blocks.0/attn/Concat_5" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Concat_5, /transformer/blocks.0/attn/Constant_23" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.0/attn/Concat_5_output_0"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="212" name="/transformer/blocks.0/attn/Reshape_3" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/Reshape_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/Reshape_3_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="213" name="Transpose_916933_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="8, 8" offset="815843" size="128" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/out_proj/MatMul, onnx::MatMul_465" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="214" name="Transpose_916933" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/out_proj/MatMul, onnx::MatMul_465" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="215" name="/transformer/blocks.0/attn/out_proj/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/attn/out_proj/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/attn/out_proj/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="216" name="/transformer/blocks.0/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/Add" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/Add_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="217" name="Constant_898955" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898955" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="218" name="/transformer/blocks.0/norm_2/Div" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/norm_2/Add, /transformer/blocks.0/norm_2/Div, /transformer/blocks.0/norm_2/Pow, /transformer/blocks.0/norm_2/ReduceMean, /transformer/blocks.0/norm_2/ReduceMean_1, /transformer/blocks.0/norm_2/Sqrt, /transformer/blocks.0/norm_2/Sub" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/norm_2/Div_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="219" name="Constant_917174_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1, 1, 8" offset="815971" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.0.norm_2.weight" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="220" name="Constant_917174" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.0.norm_2.weight" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="221" name="/transformer/blocks.0/norm_2/Mul" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/norm_2/Mul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/norm_2/Mul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="222" name="Transpose_916937_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="32, 8" offset="815987" size="512" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/up_proj/MatMul, onnx::MatMul_466" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="223" name="Transpose_916937" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/up_proj/MatMul, onnx::MatMul_466" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="224" name="/transformer/blocks.0/ffn/up_proj/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/up_proj/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/ffn/up_proj/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="225" name="/transformer/blocks.0/ffn/act/Mul_1" type="Gelu" version="opset7"> |
|
<data approximation_mode="ERF" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/act/Add, /transformer/blocks.0/ffn/act/Div, /transformer/blocks.0/ffn/act/Erf, /transformer/blocks.0/ffn/act/Mul, /transformer/blocks.0/ffn/act/Mul_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="/transformer/blocks.0/ffn/act/Mul_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="226" name="Transpose_916941_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="8, 32" offset="816499" size="512" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/down_proj/MatMul, onnx::MatMul_467" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="227" name="Transpose_916941" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/down_proj/MatMul, onnx::MatMul_467" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="228" name="/transformer/blocks.0/ffn/down_proj/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/down_proj/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/ffn/down_proj/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="229" name="/transformer/blocks.0/ffn/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.0/ffn/Add" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.0/ffn/Add_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="230" name="Constant_898978" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_898978" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="231" name="/transformer/blocks.1/norm_1/Div" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/norm_1/Add, /transformer/blocks.1/norm_1/Div, /transformer/blocks.1/norm_1/Pow, /transformer/blocks.1/norm_1/ReduceMean, /transformer/blocks.1/norm_1/ReduceMean_1, /transformer/blocks.1/norm_1/Sqrt, /transformer/blocks.1/norm_1/Sub" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/norm_1/Div_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="232" name="Constant_917175_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1, 1, 8" offset="817011" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.1.norm_1.weight" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="233" name="Constant_917175" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.1.norm_1.weight" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="234" name="/transformer/blocks.1/norm_1/Mul" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/norm_1/Mul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/norm_1/Mul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="235" name="Transpose_916945_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="24, 8" offset="817027" size="384" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Wqkv/MatMul, onnx::MatMul_468" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="236" name="Transpose_916945" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Wqkv/MatMul, onnx::MatMul_468" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="237" name="/transformer/blocks.1/attn/Wqkv/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Wqkv/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>24</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Wqkv/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="238" name="Constant_915499" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="239" name="Constant_915498" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="240" name="/transformer/blocks.1/attn/Shape_2" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Shape_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/blocks.1/attn/Shape_2_output_0"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="241" name="/transformer/blocks.1/attn/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_2_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="242" name="Constant_899001" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899001" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="243" name="/transformer/blocks.1/attn/Gather_2" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Gather_2, Constant_899001" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/blocks.1/attn/Gather_2_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="244" name="/transformer/blocks.1/attn/Constant_4" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_4" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_4_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="245" name="/transformer/blocks.1/attn/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Add, /transformer/blocks.1/attn/Constant_4" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.1/attn/Add_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="246" name="/transformer/blocks.1/attn/Constant_5" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="807529" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_5" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_5_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="247" name="/transformer/blocks.1/attn/Div" type="Divide" version="opset1"> |
|
<data auto_broadcast="numpy" m_pythondiv="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_5, /transformer/blocks.1/attn/Constant_6, /transformer/blocks.1/attn/Div, /transformer/blocks.1/attn/Mul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.1/attn/Div_output_0,/transformer/blocks.1/attn/Mul_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="248" name="/transformer/blocks.1/attn/Constant_7" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_7" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_7_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="249" name="/transformer/blocks.1/attn/Mul_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_7, /transformer/blocks.1/attn/Mul_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.1/attn/Mul_1_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="250" name="Constant_915497" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="251" name="ScatterUpdate_915500" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="252" name="Constant_915501" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="253" name="/transformer/blocks.1/attn/Constant_8" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="807529" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_8" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_8_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="254" name="/transformer/blocks.1/attn/Mul_2" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_8, /transformer/blocks.1/attn/Mul_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.1/attn/Mul_2_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="255" name="ScatterUpdate_915502" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="256" name="Constant_915505" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="257" name="/transformer/blocks.1/attn/Slice_2" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.1/attn/Slice_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="258" name="/transformer/blocks.1/attn/Shape" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Shape, /transformer/blocks.1/attn/Shape_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/blocks.1/attn/Shape_1_output_0,/transformer/blocks.1/attn/Shape_output_0"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="259" name="Constant_914365" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="807561" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Concat, /transformer/blocks.1/attn/Concat_1, /transformer/blocks.1/attn/Concat_2, /transformer/blocks.1/attn/Constant_10, /transformer/blocks.1/attn/Constant_11, /transformer/blocks.1/attn/Constant_12, /transformer/blocks.1/attn/Constant_13, /transformer/blocks.1/attn/Constant_14, /transformer/blocks.1/attn/Constant_9" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="260" name="Constant_914366" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Concat, /transformer/blocks.1/attn/Concat_1, /transformer/blocks.1/attn/Concat_2, /transformer/blocks.1/attn/Constant_10, /transformer/blocks.1/attn/Constant_11, /transformer/blocks.1/attn/Constant_12, /transformer/blocks.1/attn/Constant_13, /transformer/blocks.1/attn/Constant_14, /transformer/blocks.1/attn/Constant_9" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="261" name="Gather_914367" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Concat, /transformer/blocks.1/attn/Concat_1, /transformer/blocks.1/attn/Concat_2, /transformer/blocks.1/attn/Concat_5, /transformer/blocks.1/attn/Constant_10, /transformer/blocks.1/attn/Constant_11, /transformer/blocks.1/attn/Constant_12, /transformer/blocks.1/attn/Constant_13, /transformer/blocks.1/attn/Constant_14, /transformer/blocks.1/attn/Constant_23, /transformer/blocks.1/attn/Constant_9" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="262" name="/transformer/blocks.1/attn/Constant_13" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_13" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_13_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="263" name="/transformer/blocks.1/attn/Constant_14" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="807577" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_14" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_14_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="264" name="/transformer/blocks.1/attn/Concat_2" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Concat, /transformer/blocks.1/attn/Concat_1, /transformer/blocks.1/attn/Concat_2, /transformer/blocks.1/attn/Constant_10, /transformer/blocks.1/attn/Constant_11, /transformer/blocks.1/attn/Constant_12, /transformer/blocks.1/attn/Constant_13, /transformer/blocks.1/attn/Constant_14, /transformer/blocks.1/attn/Constant_9" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/blocks.1/attn/Concat_1_output_0,/transformer/blocks.1/attn/Concat_2_output_0,/transformer/blocks.1/attn/Concat_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="265" name="/transformer/blocks.1/attn/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Reshape_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Reshape_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="266" name="Constant_899229" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899229" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="267" name="/transformer/blocks.1/attn/Transpose_2" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Transpose_2" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Transpose_2_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="268" name="present.1.value" type="Concat" version="opset1"> |
|
<data axis="2" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.1.value" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.1.value"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="270" name="Constant_915597" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="271" name="Constant_915596" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="272" name="Constant_915595" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="273" name="ScatterUpdate_915598" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="274" name="Constant_915599" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="275" name="ScatterUpdate_915600" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="276" name="Constant_915603" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="277" name="/transformer/blocks.1/attn/Slice_1" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.1/attn/Slice_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="278" name="/transformer/blocks.1/attn/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Reshape_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Reshape_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="279" name="Constant_899216" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899216" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="280" name="/transformer/blocks.1/attn/Transpose_1" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Transpose_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Transpose_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="281" name="present.1.key" type="Concat" version="opset1"> |
|
<data axis="2" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.1.key" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.1.key"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="285" name="/transformer/blocks.1/attn/Constant_22" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="189" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_22" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP32" names="/transformer/blocks.1/attn/Constant_22_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="286" name="Constant_915697" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="287" name="Constant_915698" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="288" name="Constant_915694" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="289" name="Constant_915693" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="290" name="ScatterUpdate_915699" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="291" name="Constant_915702" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="292" name="/transformer/blocks.1/attn/Slice" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_2, /transformer/blocks.1/attn/Slice" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>24</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.1/attn/Slice_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="293" name="/transformer/blocks.1/attn/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Reshape" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Reshape_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="294" name="Constant_899203" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899203" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="295" name="/transformer/blocks.1/attn/Transpose" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Transpose" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Transpose_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="296" name="Constant_917176_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1, 1, 1, 1" offset="807617" size="2" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_15" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="297" name="Constant_917176" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_15" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="298" name="Multiply_916964" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/MatMul, /transformer/blocks.1/attn/Mul_3, /transformer/blocks.1/attn/Transpose_3, present.1.key" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="299" name="/transformer/blocks.1/attn/Mul_3" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/MatMul, /transformer/blocks.1/attn/Mul_3, /transformer/blocks.1/attn/Transpose_3, present.1.key" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Mul_3_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="300" name="Constant_915750" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807505" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="301" name="Constant_915749" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="302" name="/transformer/blocks.1/attn/Constant_17" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="815811" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_17" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_17_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="303" name="/transformer/blocks.1/attn/Shape_3" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Shape_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="/transformer/blocks.1/attn/Shape_3_output_0"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="304" name="/transformer/blocks.1/attn/Constant_16" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="8" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_16" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_16_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="305" name="Constant_899240" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899240" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="306" name="/transformer/blocks.1/attn/Gather_3" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_16, /transformer/blocks.1/attn/Gather_3, Constant_899240" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="/transformer/blocks.1/attn/Gather_3_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="307" name="/transformer/blocks.1/attn/Sub" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_17, /transformer/blocks.1/attn/Sub" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.1/attn/Sub_output_0" /> |
|
</output> |
|
</layer> |
|
<layer id="308" name="/transformer/blocks.1/attn/Constant_19" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="16" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_19" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_19_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="309" name="/transformer/blocks.1/attn/Unsqueeze_6" type="Unsqueeze" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_19, /transformer/blocks.1/attn/Unsqueeze_6" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.1/attn/Unsqueeze_6_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="310" name="Constant_915748" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="169" size="4" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="311" name="ScatterUpdate_915751" type="ScatterUpdate" version="opset3"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Slice_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="312" name="Constant_915754" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="815819" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="313" name="Constant_915757" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="807537" size="24" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Slice_3" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="314" name="/transformer/blocks.1/attn/Slice_3" type="StridedSlice" version="opset1"> |
|
<data begin_mask="1, 1, 0" end_mask="1, 1, 0" new_axis_mask="" shrink_axis_mask="" ellipsis_mask="" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Slice_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>2048</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="/transformer/blocks.1/attn/Slice_3_output_0"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="315" name="/transformer/blocks.1/attn/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Add_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>2</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Add_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="316" name="/transformer/blocks.1/attn/Where" type="Select" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Cast_1, /transformer/blocks.1/attn/Where" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32" /> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="/transformer/blocks.1/attn/Cast_1_output_0,/transformer/blocks.1/attn/Where_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="317" name="/transformer/blocks.1/attn/Softmax" type="SoftMax" version="opset8"> |
|
<data axis="-1" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Cast_2, /transformer/blocks.1/attn/Softmax" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="/transformer/blocks.1/attn/Cast_2_output_0,/transformer/blocks.1/attn/Softmax_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="318" name="/transformer/blocks.1/attn/MatMul_1" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="false" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/MatMul_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/MatMul_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="319" name="Constant_899318" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="807585" size="32" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899318" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="320" name="/transformer/blocks.1/attn/Transpose_4" type="Transpose" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Transpose_4" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Transpose_4_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="321" name="/transformer/blocks.1/attn/Constant_23" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Constant_23" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64" names="/transformer/blocks.1/attn/Constant_23_output_0"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="322" name="/transformer/blocks.1/attn/Concat_5" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Concat_5, /transformer/blocks.1/attn/Constant_23" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="/transformer/blocks.1/attn/Concat_5_output_0"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="323" name="/transformer/blocks.1/attn/Reshape_3" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/Reshape_3" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/Reshape_3_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="324" name="Transpose_916948_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="8, 8" offset="817411" size="128" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/out_proj/MatMul, onnx::MatMul_479" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="325" name="Transpose_916948" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/out_proj/MatMul, onnx::MatMul_479" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="326" name="/transformer/blocks.1/attn/out_proj/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/attn/out_proj/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/attn/out_proj/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="327" name="/transformer/blocks.1/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/Add" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/Add_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="328" name="Constant_899339" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899339" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="329" name="/transformer/blocks.1/norm_2/Div" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/norm_2/Add, /transformer/blocks.1/norm_2/Div, /transformer/blocks.1/norm_2/Pow, /transformer/blocks.1/norm_2/ReduceMean, /transformer/blocks.1/norm_2/ReduceMean_1, /transformer/blocks.1/norm_2/Sqrt, /transformer/blocks.1/norm_2/Sub" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/norm_2/Div_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="330" name="Constant_917177_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1, 1, 8" offset="817539" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.1.norm_2.weight" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="331" name="Constant_917177" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="transformer.blocks.1.norm_2.weight" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="332" name="/transformer/blocks.1/norm_2/Mul" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/norm_2/Mul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/norm_2/Mul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="333" name="Transpose_916952_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="32, 8" offset="817555" size="512" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/up_proj/MatMul, onnx::MatMul_480" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="334" name="Transpose_916952" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/up_proj/MatMul, onnx::MatMul_480" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="335" name="/transformer/blocks.1/ffn/up_proj/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/up_proj/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>32</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/ffn/up_proj/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="336" name="/transformer/blocks.1/ffn/act/Mul_1" type="Gelu" version="opset7"> |
|
<data approximation_mode="ERF" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/act/Add, /transformer/blocks.1/ffn/act/Div, /transformer/blocks.1/ffn/act/Erf, /transformer/blocks.1/ffn/act/Mul, /transformer/blocks.1/ffn/act/Mul_1" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="/transformer/blocks.1/ffn/act/Mul_1_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="337" name="Transpose_916956_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="8, 32" offset="818067" size="512" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/down_proj/MatMul, onnx::MatMul_481" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="338" name="Transpose_916956" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/down_proj/MatMul, onnx::MatMul_481" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="339" name="/transformer/blocks.1/ffn/down_proj/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/down_proj/MatMul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>32</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>8</dim> |
|
<dim>32</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/ffn/down_proj/MatMul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="340" name="/transformer/blocks.1/ffn/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/blocks.1/ffn/Add" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/blocks.1/ffn/Add_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="341" name="Constant_899362" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="24" size="8" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="Constant_899362" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="342" name="/transformer/norm_f/Div" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/norm_f/Add, /transformer/norm_f/Div, /transformer/norm_f/Pow, /transformer/norm_f/ReduceMean, /transformer/norm_f/ReduceMean_1, /transformer/norm_f/Sqrt, /transformer/norm_f/Sub" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/norm_f/Div_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="343" name="Constant_917178_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1, 1, 8" offset="818579" size="16" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="transformer.norm_f.weight" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="344" name="Constant_917178" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="transformer.norm_f.weight" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="345" name="/transformer/norm_f/Mul" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="/transformer/norm_f/Mul" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="/transformer/norm_f/Mul_output_0"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="346" name="Transpose_916960_compressed" type="Const" version="opset1"> |
|
<data element_type="f16" shape="50432, 8" offset="193" size="806912" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="logits, onnx::MatMul_482" /> |
|
</rt_info> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="347" name="Transpose_916960" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<rt_info> |
|
<attribute name="decompression" version="0" /> |
|
<attribute name="fused_names" version="0" value="logits, onnx::MatMul_482" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="348" name="logits" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="logits" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>8</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>50432</dim> |
|
<dim>8</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="logits"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>50432</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="349" name="logits/sink_port_0" type="Result" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="logits/sink_port_0" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>50432</dim> |
|
</port> |
|
</input> |
|
</layer> |
|
<layer id="284" name="present.0.key/sink_port_0" type="Result" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.0.key/sink_port_0" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
</layer> |
|
<layer id="283" name="present.0.value/sink_port_0" type="Result" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.0.value/sink_port_0" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
</layer> |
|
<layer id="282" name="present.1.key/sink_port_0" type="Result" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.1.key/sink_port_0" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
</layer> |
|
<layer id="269" name="present.1.value/sink_port_0" type="Result" version="opset1"> |
|
<rt_info> |
|
<attribute name="fused_names" version="0" value="present.1.value/sink_port_0" /> |
|
</rt_info> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>2</dim> |
|
<dim>-1</dim> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
</layer> |
|
</layers> |
|
<edges> |
|
<edge from-layer="0" from-port="0" to-layer="12" to-port="0" /> |
|
<edge from-layer="0" from-port="0" to-layer="7" to-port="0" /> |
|
<edge from-layer="1" from-port="0" to-layer="268" to-port="0" /> |
|
<edge from-layer="2" from-port="0" to-layer="281" to-port="0" /> |
|
<edge from-layer="3" from-port="0" to-layer="206" to-port="0" /> |
|
<edge from-layer="4" from-port="0" to-layer="35" to-port="0" /> |
|
<edge from-layer="4" from-port="0" to-layer="168" to-port="0" /> |
|
<edge from-layer="5" from-port="0" to-layer="17" to-port="0" /> |
|
<edge from-layer="5" from-port="0" to-layer="121" to-port="1" /> |
|
<edge from-layer="6" from-port="0" to-layer="7" to-port="1" /> |
|
<edge from-layer="7" from-port="2" to-layer="9" to-port="0" /> |
|
<edge from-layer="8" from-port="0" to-layer="9" to-port="1" /> |
|
<edge from-layer="9" from-port="2" to-layer="10" to-port="0" /> |
|
<edge from-layer="10" from-port="1" to-layer="11" to-port="0" /> |
|
<edge from-layer="11" from-port="1" to-layer="33" to-port="0" /> |
|
<edge from-layer="12" from-port="1" to-layer="25" to-port="0" /> |
|
<edge from-layer="12" from-port="1" to-layer="15" to-port="0" /> |
|
<edge from-layer="13" from-port="0" to-layer="15" to-port="1" /> |
|
<edge from-layer="14" from-port="0" to-layer="15" to-port="2" /> |
|
<edge from-layer="15" from-port="3" to-layer="26" to-port="0" /> |
|
<edge from-layer="16" from-port="0" to-layer="26" to-port="1" /> |
|
<edge from-layer="17" from-port="1" to-layer="106" to-port="0" /> |
|
<edge from-layer="17" from-port="1" to-layer="20" to-port="0" /> |
|
<edge from-layer="18" from-port="0" to-layer="20" to-port="1" /> |
|
<edge from-layer="19" from-port="0" to-layer="20" to-port="2" /> |
|
<edge from-layer="20" from-port="3" to-layer="22" to-port="0" /> |
|
<edge from-layer="20" from-port="3" to-layer="83" to-port="1" /> |
|
<edge from-layer="20" from-port="3" to-layer="39" to-port="0" /> |
|
<edge from-layer="21" from-port="0" to-layer="22" to-port="1" /> |
|
<edge from-layer="22" from-port="2" to-layer="42" to-port="0" /> |
|
<edge from-layer="22" from-port="2" to-layer="108" to-port="2" /> |
|
<edge from-layer="22" from-port="2" to-layer="26" to-port="2" /> |
|
<edge from-layer="23" from-port="0" to-layer="25" to-port="1" /> |
|
<edge from-layer="24" from-port="0" to-layer="25" to-port="2" /> |
|
<edge from-layer="25" from-port="3" to-layer="26" to-port="3" /> |
|
<edge from-layer="26" from-port="4" to-layer="28" to-port="0" /> |
|
<edge from-layer="27" from-port="0" to-layer="28" to-port="1" /> |
|
<edge from-layer="28" from-port="2" to-layer="32" to-port="2" /> |
|
<edge from-layer="28" from-port="2" to-layer="30" to-port="0" /> |
|
<edge from-layer="29" from-port="0" to-layer="30" to-port="1" /> |
|
<edge from-layer="30" from-port="2" to-layer="32" to-port="0" /> |
|
<edge from-layer="31" from-port="0" to-layer="32" to-port="1" /> |
|
<edge from-layer="32" from-port="3" to-layer="33" to-port="1" /> |
|
<edge from-layer="33" from-port="2" to-layer="116" to-port="0" /> |
|
<edge from-layer="34" from-port="0" to-layer="43" to-port="0" /> |
|
<edge from-layer="35" from-port="1" to-layer="38" to-port="0" /> |
|
<edge from-layer="36" from-port="0" to-layer="38" to-port="1" /> |
|
<edge from-layer="37" from-port="0" to-layer="38" to-port="2" /> |
|
<edge from-layer="38" from-port="3" to-layer="39" to-port="1" /> |
|
<edge from-layer="38" from-port="3" to-layer="60" to-port="0" /> |
|
<edge from-layer="39" from-port="2" to-layer="41" to-port="0" /> |
|
<edge from-layer="40" from-port="0" to-layer="41" to-port="1" /> |
|
<edge from-layer="41" from-port="2" to-layer="108" to-port="3" /> |
|
<edge from-layer="41" from-port="2" to-layer="42" to-port="1" /> |
|
<edge from-layer="42" from-port="2" to-layer="43" to-port="1" /> |
|
<edge from-layer="43" from-port="2" to-layer="99" to-port="0" /> |
|
<edge from-layer="43" from-port="2" to-layer="45" to-port="0" /> |
|
<edge from-layer="43" from-port="2" to-layer="95" to-port="0" /> |
|
<edge from-layer="44" from-port="0" to-layer="50" to-port="0" /> |
|
<edge from-layer="45" from-port="1" to-layer="56" to-port="0" /> |
|
<edge from-layer="45" from-port="1" to-layer="48" to-port="0" /> |
|
<edge from-layer="46" from-port="0" to-layer="48" to-port="1" /> |
|
<edge from-layer="47" from-port="0" to-layer="48" to-port="2" /> |
|
<edge from-layer="48" from-port="3" to-layer="50" to-port="1" /> |
|
<edge from-layer="49" from-port="0" to-layer="50" to-port="2" /> |
|
<edge from-layer="50" from-port="3" to-layer="52" to-port="0" /> |
|
<edge from-layer="51" from-port="0" to-layer="52" to-port="1" /> |
|
<edge from-layer="52" from-port="2" to-layer="70" to-port="0" /> |
|
<edge from-layer="52" from-port="2" to-layer="64" to-port="0" /> |
|
<edge from-layer="53" from-port="0" to-layer="58" to-port="0" /> |
|
<edge from-layer="54" from-port="0" to-layer="56" to-port="1" /> |
|
<edge from-layer="55" from-port="0" to-layer="56" to-port="2" /> |
|
<edge from-layer="56" from-port="3" to-layer="58" to-port="1" /> |
|
<edge from-layer="57" from-port="0" to-layer="58" to-port="2" /> |
|
<edge from-layer="58" from-port="3" to-layer="63" to-port="0" /> |
|
<edge from-layer="59" from-port="0" to-layer="60" to-port="1" /> |
|
<edge from-layer="60" from-port="2" to-layer="92" to-port="2" /> |
|
<edge from-layer="60" from-port="2" to-layer="63" to-port="1" /> |
|
<edge from-layer="61" from-port="0" to-layer="63" to-port="2" /> |
|
<edge from-layer="62" from-port="0" to-layer="63" to-port="3" /> |
|
<edge from-layer="63" from-port="4" to-layer="77" to-port="0" /> |
|
<edge from-layer="63" from-port="4" to-layer="64" to-port="1" /> |
|
<edge from-layer="64" from-port="2" to-layer="65" to-port="0" /> |
|
<edge from-layer="65" from-port="1" to-layer="74" to-port="0" /> |
|
<edge from-layer="65" from-port="1" to-layer="69" to-port="2" /> |
|
<edge from-layer="65" from-port="1" to-layer="76" to-port="2" /> |
|
<edge from-layer="65" from-port="1" to-layer="67" to-port="0" /> |
|
<edge from-layer="65" from-port="1" to-layer="98" to-port="1" /> |
|
<edge from-layer="66" from-port="0" to-layer="67" to-port="1" /> |
|
<edge from-layer="67" from-port="2" to-layer="69" to-port="0" /> |
|
<edge from-layer="68" from-port="0" to-layer="69" to-port="1" /> |
|
<edge from-layer="69" from-port="3" to-layer="70" to-port="1" /> |
|
<edge from-layer="70" from-port="2" to-layer="72" to-port="0" /> |
|
<edge from-layer="71" from-port="0" to-layer="72" to-port="1" /> |
|
<edge from-layer="72" from-port="2" to-layer="80" to-port="0" /> |
|
<edge from-layer="73" from-port="0" to-layer="74" to-port="1" /> |
|
<edge from-layer="74" from-port="2" to-layer="76" to-port="0" /> |
|
<edge from-layer="75" from-port="0" to-layer="76" to-port="1" /> |
|
<edge from-layer="76" from-port="3" to-layer="77" to-port="1" /> |
|
<edge from-layer="77" from-port="2" to-layer="79" to-port="0" /> |
|
<edge from-layer="78" from-port="0" to-layer="79" to-port="1" /> |
|
<edge from-layer="79" from-port="2" to-layer="80" to-port="1" /> |
|
<edge from-layer="80" from-port="2" to-layer="99" to-port="1" /> |
|
<edge from-layer="81" from-port="0" to-layer="83" to-port="0" /> |
|
<edge from-layer="82" from-port="0" to-layer="83" to-port="2" /> |
|
<edge from-layer="83" from-port="3" to-layer="87" to-port="0" /> |
|
<edge from-layer="83" from-port="3" to-layer="85" to-port="0" /> |
|
<edge from-layer="84" from-port="0" to-layer="85" to-port="1" /> |
|
<edge from-layer="85" from-port="2" to-layer="88" to-port="0" /> |
|
<edge from-layer="86" from-port="0" to-layer="87" to-port="1" /> |
|
<edge from-layer="87" from-port="2" to-layer="88" to-port="1" /> |
|
<edge from-layer="88" from-port="2" to-layer="97" to-port="0" /> |
|
<edge from-layer="89" from-port="0" to-layer="92" to-port="0" /> |
|
<edge from-layer="90" from-port="0" to-layer="92" to-port="1" /> |
|
<edge from-layer="91" from-port="0" to-layer="92" to-port="3" /> |
|
<edge from-layer="92" from-port="4" to-layer="95" to-port="1" /> |
|
<edge from-layer="93" from-port="0" to-layer="95" to-port="2" /> |
|
<edge from-layer="94" from-port="0" to-layer="95" to-port="3" /> |
|
<edge from-layer="95" from-port="4" to-layer="96" to-port="0" /> |
|
<edge from-layer="96" from-port="1" to-layer="97" to-port="1" /> |
|
<edge from-layer="97" from-port="2" to-layer="98" to-port="0" /> |
|
<edge from-layer="98" from-port="2" to-layer="99" to-port="2" /> |
|
<edge from-layer="99" from-port="3" to-layer="101" to-port="0" /> |
|
<edge from-layer="100" from-port="0" to-layer="101" to-port="1" /> |
|
<edge from-layer="101" from-port="2" to-layer="103" to-port="0" /> |
|
<edge from-layer="102" from-port="0" to-layer="103" to-port="1" /> |
|
<edge from-layer="103" from-port="2" to-layer="115" to-port="0" /> |
|
<edge from-layer="104" from-port="0" to-layer="106" to-port="1" /> |
|
<edge from-layer="105" from-port="0" to-layer="106" to-port="2" /> |
|
<edge from-layer="106" from-port="3" to-layer="108" to-port="0" /> |
|
<edge from-layer="107" from-port="0" to-layer="108" to-port="1" /> |
|
<edge from-layer="108" from-port="4" to-layer="110" to-port="0" /> |
|
<edge from-layer="109" from-port="0" to-layer="110" to-port="1" /> |
|
<edge from-layer="110" from-port="2" to-layer="112" to-port="0" /> |
|
<edge from-layer="110" from-port="2" to-layer="114" to-port="2" /> |
|
<edge from-layer="111" from-port="0" to-layer="112" to-port="1" /> |
|
<edge from-layer="112" from-port="2" to-layer="114" to-port="0" /> |
|
<edge from-layer="113" from-port="0" to-layer="114" to-port="1" /> |
|
<edge from-layer="114" from-port="3" to-layer="115" to-port="1" /> |
|
<edge from-layer="115" from-port="2" to-layer="116" to-port="1" /> |
|
<edge from-layer="116" from-port="2" to-layer="191" to-port="0" /> |
|
<edge from-layer="116" from-port="2" to-layer="316" to-port="0" /> |
|
<edge from-layer="117" from-port="0" to-layer="191" to-port="1" /> |
|
<edge from-layer="118" from-port="0" to-layer="119" to-port="0" /> |
|
<edge from-layer="119" from-port="1" to-layer="121" to-port="0" /> |
|
<edge from-layer="120" from-port="0" to-layer="121" to-port="2" /> |
|
<edge from-layer="121" from-port="3" to-layer="123" to-port="0" /> |
|
<edge from-layer="121" from-port="3" to-layer="216" to-port="1" /> |
|
<edge from-layer="122" from-port="0" to-layer="123" to-port="1" /> |
|
<edge from-layer="123" from-port="2" to-layer="126" to-port="0" /> |
|
<edge from-layer="124" from-port="0" to-layer="125" to-port="0" /> |
|
<edge from-layer="125" from-port="1" to-layer="126" to-port="1" /> |
|
<edge from-layer="126" from-port="2" to-layer="129" to-port="0" /> |
|
<edge from-layer="126" from-port="2" to-layer="145" to-port="0" /> |
|
<edge from-layer="127" from-port="0" to-layer="128" to-port="0" /> |
|
<edge from-layer="128" from-port="1" to-layer="129" to-port="1" /> |
|
<edge from-layer="129" from-port="2" to-layer="133" to-port="0" /> |
|
<edge from-layer="129" from-port="2" to-layer="164" to-port="0" /> |
|
<edge from-layer="129" from-port="2" to-layer="202" to-port="0" /> |
|
<edge from-layer="129" from-port="2" to-layer="144" to-port="0" /> |
|
<edge from-layer="130" from-port="0" to-layer="144" to-port="1" /> |
|
<edge from-layer="131" from-port="0" to-layer="142" to-port="0" /> |
|
<edge from-layer="132" from-port="0" to-layer="142" to-port="1" /> |
|
<edge from-layer="133" from-port="1" to-layer="136" to-port="0" /> |
|
<edge from-layer="134" from-port="0" to-layer="136" to-port="1" /> |
|
<edge from-layer="135" from-port="0" to-layer="136" to-port="2" /> |
|
<edge from-layer="136" from-port="3" to-layer="138" to-port="0" /> |
|
<edge from-layer="137" from-port="0" to-layer="138" to-port="1" /> |
|
<edge from-layer="138" from-port="2" to-layer="140" to-port="0" /> |
|
<edge from-layer="139" from-port="0" to-layer="140" to-port="1" /> |
|
<edge from-layer="140" from-port="2" to-layer="199" to-port="0" /> |
|
<edge from-layer="140" from-port="2" to-layer="158" to-port="2" /> |
|
<edge from-layer="140" from-port="2" to-layer="142" to-port="2" /> |
|
<edge from-layer="140" from-port="2" to-layer="161" to-port="0" /> |
|
<edge from-layer="141" from-port="0" to-layer="142" to-port="3" /> |
|
<edge from-layer="142" from-port="4" to-layer="144" to-port="2" /> |
|
<edge from-layer="143" from-port="0" to-layer="144" to-port="3" /> |
|
<edge from-layer="144" from-port="4" to-layer="152" to-port="0" /> |
|
<edge from-layer="145" from-port="1" to-layer="148" to-port="0" /> |
|
<edge from-layer="146" from-port="0" to-layer="148" to-port="1" /> |
|
<edge from-layer="147" from-port="0" to-layer="148" to-port="2" /> |
|
<edge from-layer="148" from-port="3" to-layer="211" to-port="0" /> |
|
<edge from-layer="148" from-port="3" to-layer="151" to-port="0" /> |
|
<edge from-layer="149" from-port="0" to-layer="151" to-port="1" /> |
|
<edge from-layer="150" from-port="0" to-layer="151" to-port="2" /> |
|
<edge from-layer="151" from-port="3" to-layer="203" to-port="1" /> |
|
<edge from-layer="151" from-port="3" to-layer="152" to-port="1" /> |
|
<edge from-layer="151" from-port="3" to-layer="165" to-port="1" /> |
|
<edge from-layer="152" from-port="2" to-layer="154" to-port="0" /> |
|
<edge from-layer="153" from-port="0" to-layer="154" to-port="1" /> |
|
<edge from-layer="154" from-port="2" to-layer="172" to-port="0" /> |
|
<edge from-layer="155" from-port="0" to-layer="158" to-port="0" /> |
|
<edge from-layer="156" from-port="0" to-layer="158" to-port="1" /> |
|
<edge from-layer="156" from-port="0" to-layer="162" to-port="1" /> |
|
<edge from-layer="157" from-port="0" to-layer="158" to-port="3" /> |
|
<edge from-layer="157" from-port="0" to-layer="162" to-port="3" /> |
|
<edge from-layer="158" from-port="4" to-layer="164" to-port="1" /> |
|
<edge from-layer="159" from-port="0" to-layer="162" to-port="0" /> |
|
<edge from-layer="160" from-port="0" to-layer="161" to-port="1" /> |
|
<edge from-layer="161" from-port="2" to-layer="196" to-port="2" /> |
|
<edge from-layer="161" from-port="2" to-layer="162" to-port="2" /> |
|
<edge from-layer="162" from-port="4" to-layer="164" to-port="2" /> |
|
<edge from-layer="163" from-port="0" to-layer="164" to-port="3" /> |
|
<edge from-layer="164" from-port="4" to-layer="165" to-port="0" /> |
|
<edge from-layer="165" from-port="2" to-layer="167" to-port="0" /> |
|
<edge from-layer="166" from-port="0" to-layer="167" to-port="1" /> |
|
<edge from-layer="167" from-port="2" to-layer="168" to-port="1" /> |
|
<edge from-layer="168" from-port="2" to-layer="178" to-port="0" /> |
|
<edge from-layer="168" from-port="2" to-layer="171" to-port="0" /> |
|
<edge from-layer="168" from-port="2" to-layer="284" to-port="0" /> |
|
<edge from-layer="169" from-port="0" to-layer="170" to-port="0" /> |
|
<edge from-layer="170" from-port="1" to-layer="171" to-port="1" /> |
|
<edge from-layer="171" from-port="2" to-layer="172" to-port="1" /> |
|
<edge from-layer="172" from-port="2" to-layer="190" to-port="0" /> |
|
<edge from-layer="173" from-port="0" to-layer="174" to-port="0" /> |
|
<edge from-layer="174" from-port="1" to-layer="189" to-port="0" /> |
|
<edge from-layer="174" from-port="1" to-layer="314" to-port="0" /> |
|
<edge from-layer="175" from-port="0" to-layer="186" to-port="0" /> |
|
<edge from-layer="176" from-port="0" to-layer="186" to-port="1" /> |
|
<edge from-layer="177" from-port="0" to-layer="182" to-port="0" /> |
|
<edge from-layer="178" from-port="1" to-layer="181" to-port="0" /> |
|
<edge from-layer="179" from-port="0" to-layer="181" to-port="1" /> |
|
<edge from-layer="180" from-port="0" to-layer="181" to-port="2" /> |
|
<edge from-layer="181" from-port="3" to-layer="182" to-port="1" /> |
|
<edge from-layer="182" from-port="2" to-layer="184" to-port="0" /> |
|
<edge from-layer="183" from-port="0" to-layer="184" to-port="1" /> |
|
<edge from-layer="184" from-port="2" to-layer="186" to-port="2" /> |
|
<edge from-layer="185" from-port="0" to-layer="186" to-port="3" /> |
|
<edge from-layer="186" from-port="4" to-layer="189" to-port="1" /> |
|
<edge from-layer="187" from-port="0" to-layer="189" to-port="2" /> |
|
<edge from-layer="188" from-port="0" to-layer="189" to-port="3" /> |
|
<edge from-layer="189" from-port="4" to-layer="190" to-port="1" /> |
|
<edge from-layer="190" from-port="2" to-layer="191" to-port="2" /> |
|
<edge from-layer="191" from-port="3" to-layer="192" to-port="0" /> |
|
<edge from-layer="192" from-port="1" to-layer="207" to-port="0" /> |
|
<edge from-layer="193" from-port="0" to-layer="196" to-port="0" /> |
|
<edge from-layer="194" from-port="0" to-layer="200" to-port="1" /> |
|
<edge from-layer="194" from-port="0" to-layer="196" to-port="1" /> |
|
<edge from-layer="195" from-port="0" to-layer="196" to-port="3" /> |
|
<edge from-layer="195" from-port="0" to-layer="200" to-port="3" /> |
|
<edge from-layer="196" from-port="4" to-layer="202" to-port="1" /> |
|
<edge from-layer="197" from-port="0" to-layer="200" to-port="0" /> |
|
<edge from-layer="198" from-port="0" to-layer="199" to-port="1" /> |
|
<edge from-layer="199" from-port="2" to-layer="200" to-port="2" /> |
|
<edge from-layer="200" from-port="4" to-layer="202" to-port="2" /> |
|
<edge from-layer="201" from-port="0" to-layer="202" to-port="3" /> |
|
<edge from-layer="202" from-port="4" to-layer="203" to-port="0" /> |
|
<edge from-layer="203" from-port="2" to-layer="205" to-port="0" /> |
|
<edge from-layer="204" from-port="0" to-layer="205" to-port="1" /> |
|
<edge from-layer="205" from-port="2" to-layer="206" to-port="1" /> |
|
<edge from-layer="206" from-port="2" to-layer="283" to-port="0" /> |
|
<edge from-layer="206" from-port="2" to-layer="207" to-port="1" /> |
|
<edge from-layer="207" from-port="2" to-layer="209" to-port="0" /> |
|
<edge from-layer="208" from-port="0" to-layer="209" to-port="1" /> |
|
<edge from-layer="209" from-port="2" to-layer="212" to-port="0" /> |
|
<edge from-layer="210" from-port="0" to-layer="211" to-port="1" /> |
|
<edge from-layer="211" from-port="2" to-layer="212" to-port="1" /> |
|
<edge from-layer="212" from-port="2" to-layer="215" to-port="0" /> |
|
<edge from-layer="213" from-port="0" to-layer="214" to-port="0" /> |
|
<edge from-layer="214" from-port="1" to-layer="215" to-port="1" /> |
|
<edge from-layer="215" from-port="2" to-layer="216" to-port="0" /> |
|
<edge from-layer="216" from-port="2" to-layer="229" to-port="1" /> |
|
<edge from-layer="216" from-port="2" to-layer="218" to-port="0" /> |
|
<edge from-layer="217" from-port="0" to-layer="218" to-port="1" /> |
|
<edge from-layer="218" from-port="2" to-layer="221" to-port="0" /> |
|
<edge from-layer="219" from-port="0" to-layer="220" to-port="0" /> |
|
<edge from-layer="220" from-port="1" to-layer="221" to-port="1" /> |
|
<edge from-layer="221" from-port="2" to-layer="224" to-port="0" /> |
|
<edge from-layer="222" from-port="0" to-layer="223" to-port="0" /> |
|
<edge from-layer="223" from-port="1" to-layer="224" to-port="1" /> |
|
<edge from-layer="224" from-port="2" to-layer="225" to-port="0" /> |
|
<edge from-layer="225" from-port="1" to-layer="228" to-port="0" /> |
|
<edge from-layer="226" from-port="0" to-layer="227" to-port="0" /> |
|
<edge from-layer="227" from-port="1" to-layer="228" to-port="1" /> |
|
<edge from-layer="228" from-port="2" to-layer="229" to-port="0" /> |
|
<edge from-layer="229" from-port="2" to-layer="231" to-port="0" /> |
|
<edge from-layer="229" from-port="2" to-layer="327" to-port="1" /> |
|
<edge from-layer="230" from-port="0" to-layer="231" to-port="1" /> |
|
<edge from-layer="231" from-port="2" to-layer="234" to-port="0" /> |
|
<edge from-layer="232" from-port="0" to-layer="233" to-port="0" /> |
|
<edge from-layer="233" from-port="1" to-layer="234" to-port="1" /> |
|
<edge from-layer="234" from-port="2" to-layer="258" to-port="0" /> |
|
<edge from-layer="234" from-port="2" to-layer="237" to-port="0" /> |
|
<edge from-layer="235" from-port="0" to-layer="236" to-port="0" /> |
|
<edge from-layer="236" from-port="1" to-layer="237" to-port="1" /> |
|
<edge from-layer="237" from-port="2" to-layer="292" to-port="0" /> |
|
<edge from-layer="237" from-port="2" to-layer="257" to-port="0" /> |
|
<edge from-layer="237" from-port="2" to-layer="277" to-port="0" /> |
|
<edge from-layer="237" from-port="2" to-layer="240" to-port="0" /> |
|
<edge from-layer="238" from-port="0" to-layer="251" to-port="0" /> |
|
<edge from-layer="239" from-port="0" to-layer="251" to-port="1" /> |
|
<edge from-layer="239" from-port="0" to-layer="255" to-port="1" /> |
|
<edge from-layer="240" from-port="1" to-layer="243" to-port="0" /> |
|
<edge from-layer="241" from-port="0" to-layer="243" to-port="1" /> |
|
<edge from-layer="242" from-port="0" to-layer="243" to-port="2" /> |
|
<edge from-layer="243" from-port="3" to-layer="245" to-port="0" /> |
|
<edge from-layer="244" from-port="0" to-layer="245" to-port="1" /> |
|
<edge from-layer="245" from-port="2" to-layer="247" to-port="0" /> |
|
<edge from-layer="246" from-port="0" to-layer="247" to-port="1" /> |
|
<edge from-layer="247" from-port="2" to-layer="290" to-port="2" /> |
|
<edge from-layer="247" from-port="2" to-layer="273" to-port="2" /> |
|
<edge from-layer="247" from-port="2" to-layer="249" to-port="0" /> |
|
<edge from-layer="247" from-port="2" to-layer="254" to-port="0" /> |
|
<edge from-layer="248" from-port="0" to-layer="249" to-port="1" /> |
|
<edge from-layer="249" from-port="2" to-layer="251" to-port="2" /> |
|
<edge from-layer="249" from-port="2" to-layer="275" to-port="2" /> |
|
<edge from-layer="250" from-port="0" to-layer="251" to-port="3" /> |
|
<edge from-layer="250" from-port="0" to-layer="255" to-port="3" /> |
|
<edge from-layer="251" from-port="4" to-layer="257" to-port="1" /> |
|
<edge from-layer="252" from-port="0" to-layer="255" to-port="0" /> |
|
<edge from-layer="253" from-port="0" to-layer="254" to-port="1" /> |
|
<edge from-layer="254" from-port="2" to-layer="255" to-port="2" /> |
|
<edge from-layer="255" from-port="4" to-layer="257" to-port="2" /> |
|
<edge from-layer="256" from-port="0" to-layer="257" to-port="3" /> |
|
<edge from-layer="257" from-port="4" to-layer="265" to-port="0" /> |
|
<edge from-layer="258" from-port="1" to-layer="261" to-port="0" /> |
|
<edge from-layer="259" from-port="0" to-layer="261" to-port="1" /> |
|
<edge from-layer="260" from-port="0" to-layer="261" to-port="2" /> |
|
<edge from-layer="261" from-port="3" to-layer="322" to-port="0" /> |
|
<edge from-layer="261" from-port="3" to-layer="264" to-port="0" /> |
|
<edge from-layer="262" from-port="0" to-layer="264" to-port="1" /> |
|
<edge from-layer="263" from-port="0" to-layer="264" to-port="2" /> |
|
<edge from-layer="264" from-port="3" to-layer="265" to-port="1" /> |
|
<edge from-layer="264" from-port="3" to-layer="278" to-port="1" /> |
|
<edge from-layer="264" from-port="3" to-layer="293" to-port="1" /> |
|
<edge from-layer="265" from-port="2" to-layer="267" to-port="0" /> |
|
<edge from-layer="266" from-port="0" to-layer="267" to-port="1" /> |
|
<edge from-layer="267" from-port="2" to-layer="268" to-port="1" /> |
|
<edge from-layer="268" from-port="2" to-layer="318" to-port="1" /> |
|
<edge from-layer="268" from-port="2" to-layer="269" to-port="0" /> |
|
<edge from-layer="270" from-port="0" to-layer="273" to-port="0" /> |
|
<edge from-layer="271" from-port="0" to-layer="275" to-port="1" /> |
|
<edge from-layer="271" from-port="0" to-layer="273" to-port="1" /> |
|
<edge from-layer="272" from-port="0" to-layer="275" to-port="3" /> |
|
<edge from-layer="272" from-port="0" to-layer="273" to-port="3" /> |
|
<edge from-layer="273" from-port="4" to-layer="277" to-port="1" /> |
|
<edge from-layer="274" from-port="0" to-layer="275" to-port="0" /> |
|
<edge from-layer="275" from-port="4" to-layer="277" to-port="2" /> |
|
<edge from-layer="276" from-port="0" to-layer="277" to-port="3" /> |
|
<edge from-layer="277" from-port="4" to-layer="278" to-port="0" /> |
|
<edge from-layer="278" from-port="2" to-layer="280" to-port="0" /> |
|
<edge from-layer="279" from-port="0" to-layer="280" to-port="1" /> |
|
<edge from-layer="280" from-port="2" to-layer="281" to-port="1" /> |
|
<edge from-layer="281" from-port="2" to-layer="282" to-port="0" /> |
|
<edge from-layer="281" from-port="2" to-layer="303" to-port="0" /> |
|
<edge from-layer="281" from-port="2" to-layer="298" to-port="0" /> |
|
<edge from-layer="285" from-port="0" to-layer="316" to-port="1" /> |
|
<edge from-layer="286" from-port="0" to-layer="292" to-port="1" /> |
|
<edge from-layer="287" from-port="0" to-layer="290" to-port="0" /> |
|
<edge from-layer="288" from-port="0" to-layer="290" to-port="1" /> |
|
<edge from-layer="289" from-port="0" to-layer="290" to-port="3" /> |
|
<edge from-layer="290" from-port="4" to-layer="292" to-port="2" /> |
|
<edge from-layer="291" from-port="0" to-layer="292" to-port="3" /> |
|
<edge from-layer="292" from-port="4" to-layer="293" to-port="0" /> |
|
<edge from-layer="293" from-port="2" to-layer="295" to-port="0" /> |
|
<edge from-layer="294" from-port="0" to-layer="295" to-port="1" /> |
|
<edge from-layer="295" from-port="2" to-layer="299" to-port="0" /> |
|
<edge from-layer="296" from-port="0" to-layer="297" to-port="0" /> |
|
<edge from-layer="297" from-port="1" to-layer="298" to-port="1" /> |
|
<edge from-layer="298" from-port="2" to-layer="299" to-port="1" /> |
|
<edge from-layer="299" from-port="2" to-layer="315" to-port="0" /> |
|
<edge from-layer="300" from-port="0" to-layer="311" to-port="0" /> |
|
<edge from-layer="301" from-port="0" to-layer="311" to-port="1" /> |
|
<edge from-layer="302" from-port="0" to-layer="307" to-port="0" /> |
|
<edge from-layer="303" from-port="1" to-layer="306" to-port="0" /> |
|
<edge from-layer="304" from-port="0" to-layer="306" to-port="1" /> |
|
<edge from-layer="305" from-port="0" to-layer="306" to-port="2" /> |
|
<edge from-layer="306" from-port="3" to-layer="307" to-port="1" /> |
|
<edge from-layer="307" from-port="2" to-layer="309" to-port="0" /> |
|
<edge from-layer="308" from-port="0" to-layer="309" to-port="1" /> |
|
<edge from-layer="309" from-port="2" to-layer="311" to-port="2" /> |
|
<edge from-layer="310" from-port="0" to-layer="311" to-port="3" /> |
|
<edge from-layer="311" from-port="4" to-layer="314" to-port="1" /> |
|
<edge from-layer="312" from-port="0" to-layer="314" to-port="2" /> |
|
<edge from-layer="313" from-port="0" to-layer="314" to-port="3" /> |
|
<edge from-layer="314" from-port="4" to-layer="315" to-port="1" /> |
|
<edge from-layer="315" from-port="2" to-layer="316" to-port="2" /> |
|
<edge from-layer="316" from-port="3" to-layer="317" to-port="0" /> |
|
<edge from-layer="317" from-port="1" to-layer="318" to-port="0" /> |
|
<edge from-layer="318" from-port="2" to-layer="320" to-port="0" /> |
|
<edge from-layer="319" from-port="0" to-layer="320" to-port="1" /> |
|
<edge from-layer="320" from-port="2" to-layer="323" to-port="0" /> |
|
<edge from-layer="321" from-port="0" to-layer="322" to-port="1" /> |
|
<edge from-layer="322" from-port="2" to-layer="323" to-port="1" /> |
|
<edge from-layer="323" from-port="2" to-layer="326" to-port="0" /> |
|
<edge from-layer="324" from-port="0" to-layer="325" to-port="0" /> |
|
<edge from-layer="325" from-port="1" to-layer="326" to-port="1" /> |
|
<edge from-layer="326" from-port="2" to-layer="327" to-port="0" /> |
|
<edge from-layer="327" from-port="2" to-layer="329" to-port="0" /> |
|
<edge from-layer="327" from-port="2" to-layer="340" to-port="1" /> |
|
<edge from-layer="328" from-port="0" to-layer="329" to-port="1" /> |
|
<edge from-layer="329" from-port="2" to-layer="332" to-port="0" /> |
|
<edge from-layer="330" from-port="0" to-layer="331" to-port="0" /> |
|
<edge from-layer="331" from-port="1" to-layer="332" to-port="1" /> |
|
<edge from-layer="332" from-port="2" to-layer="335" to-port="0" /> |
|
<edge from-layer="333" from-port="0" to-layer="334" to-port="0" /> |
|
<edge from-layer="334" from-port="1" to-layer="335" to-port="1" /> |
|
<edge from-layer="335" from-port="2" to-layer="336" to-port="0" /> |
|
<edge from-layer="336" from-port="1" to-layer="339" to-port="0" /> |
|
<edge from-layer="337" from-port="0" to-layer="338" to-port="0" /> |
|
<edge from-layer="338" from-port="1" to-layer="339" to-port="1" /> |
|
<edge from-layer="339" from-port="2" to-layer="340" to-port="0" /> |
|
<edge from-layer="340" from-port="2" to-layer="342" to-port="0" /> |
|
<edge from-layer="341" from-port="0" to-layer="342" to-port="1" /> |
|
<edge from-layer="342" from-port="2" to-layer="345" to-port="0" /> |
|
<edge from-layer="343" from-port="0" to-layer="344" to-port="0" /> |
|
<edge from-layer="344" from-port="1" to-layer="345" to-port="1" /> |
|
<edge from-layer="345" from-port="2" to-layer="348" to-port="0" /> |
|
<edge from-layer="346" from-port="0" to-layer="347" to-port="0" /> |
|
<edge from-layer="347" from-port="1" to-layer="348" to-port="1" /> |
|
<edge from-layer="348" from-port="2" to-layer="349" to-port="0" /> |
|
</edges> |
|
<rt_info /> |
|
</net> |
|
|