|
<?xml version="1.0"?> |
|
<net name="Model3" version="11"> |
|
<layers> |
|
<layer id="3" name="decoder_input_ids" type="Parameter" version="opset1"> |
|
<data shape="?,?" element_type="i64" /> |
|
<output> |
|
<port id="0" precision="I64" names="input_ids"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="2" name="Parameter_20565" type="Parameter" version="opset1"> |
|
<data shape="?,?,1024" element_type="f32" /> |
|
<output> |
|
<port id="0" precision="FP32" names="encoder_hidden_states"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="1" name="cache_position" type="Parameter" version="opset1"> |
|
<data shape="?" element_type="i64" /> |
|
<output> |
|
<port id="0" precision="I64" names="cache_position"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="0" name="beam_idx" type="Parameter" version="opset1"> |
|
<data shape="?" element_type="i32" /> |
|
<output> |
|
<port id="0" precision="I32" names="beam_idx"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="4" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="0" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="5" name="Convert_690996" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="6" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="524288" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="7" name="Convert_690999" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="8" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="9" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="528384" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="10" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="11" name="Constant_691004" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="12" name="Reshape_691005" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="13" name="self.model.model.decoder.layers.0.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="14" name="__module.model.model.decoder.layers.0.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="183,tensor.9"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="15" name="Constant_27338" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="16" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="185"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="17" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="18" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="186"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="19" name="ReadValue_29849" type="ReadValue" version="opset6"> |
|
<data variable_id="186" variable_type="dynamic" variable_shape="..." /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="21" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="544832" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="22" name="Convert_695295" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="23" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="1069120" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="24" name="Convert_695298" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="25" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="26" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="1073216" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="27" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="28" name="Constant_695303" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="29" name="Reshape_695304" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="30" name="self.model.model.decoder.layers.1.encoder_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="31" name="__module.model.model.decoder.layers.1.encoder_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="299,tensor.21"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="32" name="Constant_27346" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="33" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="301"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="34" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="35" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="302"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="36" name="ReadValue_29847" type="ReadValue" version="opset6"> |
|
<data variable_id="302" variable_type="dynamic" variable_shape="..." /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="38" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="1089600" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="39" name="Convert_699594" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="40" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="1613888" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="41" name="Convert_699597" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="42" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="43" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="1617984" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="44" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="45" name="Constant_699602" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="46" name="Reshape_699603" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="47" name="self.model.model.decoder.layers.0.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="48" name="__module.model.model.decoder.layers.0.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="49" name="Constant_26715" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="1634368" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="50" name="__module.model.model.decoder.layers.0.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="190,tensor.11"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="51" name="Constant_27339" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="52" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="192"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="53" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="54" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="193"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="55" name="ReadValue_29845" type="ReadValue" version="opset6"> |
|
<data variable_id="193" variable_type="dynamic" variable_shape="..." /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="57" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="1638464" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="58" name="Convert_703893" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="59" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="2162752" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="60" name="Convert_703896" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="61" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="62" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="2166848" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="63" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="64" name="Constant_703901" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="65" name="Reshape_703902" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="66" name="self.model.model.decoder.layers.1.encoder_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="67" name="__module.model.model.decoder.layers.1.encoder_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="68" name="Constant_26729" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="2183232" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="69" name="__module.model.model.decoder.layers.1.encoder_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="306,tensor"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="70" name="Constant_27347" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="71" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="308"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="72" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="73" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="309"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="74" name="ReadValue_29843" type="ReadValue" version="opset6"> |
|
<data variable_id="309" variable_type="dynamic" variable_shape="..." /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="76" name="Constant_29413" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="77" name="ShapeOf_29399" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="78" name="Constant_29401" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="79" name="Constant_29403" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="80" name="Gather_29404" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="81" name="Constant_29406" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187340" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="82" name="Constant_29408" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="83" name="Constant_29410" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187348" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="84" name="Concat_29411" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="85" name="Broadcast_29414" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="86" name="ReadValue_29015" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.1.decoder.valuepresent.1.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.1.decoder.value"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="87" name="Constant_28625" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="88" name="Gather_28626" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="89" name="self.model.model.decoder.embed_tokens.weight" type="Const" version="opset1"> |
|
<data element_type="u8" shape="51864, 1024" offset="2187356" size="53108736" /> |
|
<output> |
|
<port id="0" precision="U8"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="90" name="Convert_669503" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U8"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="91" name="self.model.model.decoder.embed_tokens.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u8" shape="51864, 1" offset="55296092" size="51864" /> |
|
<output> |
|
<port id="0" precision="U8"> |
|
<dim>51864</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="92" name="Convert_669506" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U8"> |
|
<dim>51864</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="93" name="self.model.model.decoder.embed_tokens.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="94" name="self.model.model.decoder.embed_tokens.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="51864, 1" offset="55347956" size="103728" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="95" name="self.model.model.decoder.embed_tokens.weight/fq_weights_0" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="96" name="self.model.model.decoder.embed_tokens.weight/fq_weights_0/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="97" name="__module.model.model.decoder/prim::ListConstruct" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="55451684" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="98" name="__module.model.model.decoder/aten::view/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="69"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="99" name="__module.model.model.decoder.embed_tokens/aten::embedding/Convert" type="Convert" version="opset1"> |
|
<data destination_type="i32" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="100" name="__module.model.model.decoder.embed_tokens/aten::embedding/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="101" name="__module.model.model.decoder.embed_tokens/aten::embedding/Gather" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="71,inputs_embeds"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="102" name="self.model.model.decoder.embed_positions.weight" type="Const" version="opset1"> |
|
<data element_type="u8" shape="448, 1024" offset="55451700" size="458752" /> |
|
<output> |
|
<port id="0" precision="U8"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="103" name="Convert_759778" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U8"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="104" name="self.model.model.decoder.embed_positions.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u8" shape="448, 1" offset="55910452" size="448" /> |
|
<output> |
|
<port id="0" precision="U8"> |
|
<dim>448</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="105" name="Convert_759781" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U8"> |
|
<dim>448</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="106" name="self.model.model.decoder.embed_positions.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="107" name="self.model.model.decoder.embed_positions.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="448, 1" offset="55910900" size="896" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="108" name="self.model.model.decoder.embed_positions.weight/fq_weights_0" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="109" name="self.model.model.decoder.embed_positions.weight/fq_weights_0/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="110" name="45" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="45" /> |
|
</output> |
|
</layer> |
|
<layer id="111" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="72"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="112" name="ShapeOf_27123" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="113" name="Constant_27124" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="114" name="Constant_27125" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="115" name="Gather_27126" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="118,173,237,289,66,89"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="116" name="Constant_20870" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="117" name="__module.model.model.decoder/prim::ListConstruct/Concat" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="73"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="118" name="__module.model.model.decoder/aten::repeat/Tile" type="Tile" version="opset1"> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="74,position_ids"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="119" name="__module.model.model.decoder.embed_positions/aten::index/Convert" type="Convert" version="opset1"> |
|
<data destination_type="i32" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="120" name="__module.model.model.decoder.embed_positions/aten::index/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="121" name="__module.model.model.decoder.embed_positions/aten::index/Gather" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>448</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="77,78,positions,positions.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="122" name="__module.model.model.decoder/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="79,input.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="123" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="55911804" size="4" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="124" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="125" name="Constant_26706" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="55911808" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="126" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="127" name="Constant_26707" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="55915904" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="128" name="__module.model.model.decoder.layers.0.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="113,hidden_states.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="129" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="55920000" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="130" name="Convert_716790" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="131" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="56444288" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="132" name="Convert_716793" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="133" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="134" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="56448384" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="135" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="136" name="Constant_716798" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="137" name="Reshape_716799" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="138" name="self.model.model.decoder.layers.0.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="139" name="__module.model.model.decoder.layers.0.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="140" name="Constant_26708" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="56464768" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="141" name="__module.model.model.decoder.layers.0.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="122,tensor.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="142" name="Constant_27333" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="143" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="124"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="144" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="145" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="125"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="146" name="Constant_29425" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="147" name="Constant_29418" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187340" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="148" name="Constant_29420" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="149" name="Constant_29422" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187348" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="150" name="Concat_29423" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="151" name="Broadcast_29426" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="152" name="ReadValue_29009" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.0.decoder.keypresent.0.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.0.decoder.key"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="153" name="Constant_28616" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="154" name="Gather_28617" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="155" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="56468864" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="156" name="Convert_712491" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="157" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="56993152" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="158" name="Convert_712494" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="159" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="160" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="56997248" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="161" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="162" name="Constant_712499" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="163" name="Reshape_712500" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="164" name="self.model.model.decoder.layers.0.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="165" name="__module.model.model.decoder.layers.0.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="128,tensor.3"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="166" name="Constant_27334" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="167" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="130"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="168" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="169" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="131"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="170" name="__module.model.model.decoder.layers.0.self_attn/aten::cat/Concat" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="key_states.7"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="171" name="Constant_29437" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="172" name="Constant_29430" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187340" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="173" name="Constant_29432" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="174" name="Constant_29434" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187348" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="175" name="Concat_29435" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="176" name="Broadcast_29438" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="177" name="ReadValue_29011" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.0.decoder.valuepresent.0.decoder.value" variable_type="f32" variable_shape="?,16,?,64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.0.decoder.value"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="178" name="Constant_28619" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="179" name="Gather_28620" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="180" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="57013632" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="181" name="Convert_708192" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="182" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="57537920" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="183" name="Convert_708195" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="184" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="185" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="57542016" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="186" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="187" name="Constant_708200" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="188" name="Reshape_708201" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="189" name="self.model.model.decoder.layers.0.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="190" name="__module.model.model.decoder.layers.0.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="191" name="Constant_26709" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="57558400" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="192" name="__module.model.model.decoder.layers.0.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="135,tensor.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="193" name="Constant_27335" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="194" name="__module.model.model.decoder.layers.0.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="137"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="195" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="196" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="138"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="197" name="__module.model.model.decoder.layers.0.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="198" name="Constant_26710" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1" offset="57562496" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="199" name="__module.model.model.decoder/aten::arange/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="200" name="ShapeOf_27139" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="201" name="Constant_27140" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="57562500" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="202" name="Constant_27141" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="203" name="Gather_27142" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="81" /> |
|
</output> |
|
</layer> |
|
<layer id="204" name="Constant_27148" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="205" name="Constant_27149" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="206" name="Gather_27150" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="I64" names="83" /> |
|
</output> |
|
</layer> |
|
<layer id="207" name="__module.model.model.decoder/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="85" /> |
|
</output> |
|
</layer> |
|
<layer id="208" name="__module.model.model.decoder/aten::add/Multiply_2" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="209" name="__module.model.model.decoder/aten::add/Add_2" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="86,88" /> |
|
</output> |
|
</layer> |
|
<layer id="210" name="__module.model.model.decoder/aten::arange/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="57562508" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="211" name="__module.model.model.decoder/aten::arange/Range" type="Range" version="opset4"> |
|
<data output_type="f32" /> |
|
<input> |
|
<port id="0" precision="I32" /> |
|
<port id="1" precision="I64" /> |
|
<port id="2" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="212" name="__module.model.model.decoder/aten::arange/ConvertLike" type="Convert" version="opset1"> |
|
<data destination_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64" names="92"> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="213" name="Constant_19310" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="57562512" size="16" /> |
|
<output> |
|
<port id="0" precision="I64" names="93"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="214" name="__module.model.model.decoder/aten::reshape/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="94"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="215" name="__module.model.model.decoder/aten::gt/Greater" type="Greater" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="BOOL" names="95"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="216" name="__module.model.model.decoder/aten::mul_/ConvertLike" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="BOOL"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="217" name="Multiply_25574" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="218" name="ShapeOf_25575" type="ShapeOf" version="opset3"> |
|
<data output_type="i64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="219" name="Constant_27153" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="220" name="Reshape_27154" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="221" name="Constant_19296" type="Const" version="opset1"> |
|
<data element_type="i32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="I32" /> |
|
</output> |
|
</layer> |
|
<layer id="222" name="Unsqueeze_19297" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I32" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="223" name="__module.model.model.decoder/prim::ListConstruct_1" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="224" name="Maximum_25576" type="Maximum" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="225" name="__module.model.model.decoder/aten::mul_/Multiply" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="91,causal_mask.1"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="226" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="97"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="227" name="46" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" names="46" /> |
|
</output> |
|
</layer> |
|
<layer id="228" name="__module.model.model.decoder/aten::unsqueeze/Unsqueeze_2" type="Unsqueeze" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="100,98,99"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="229" name="Constant_25009" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="230" name="Constant_25011" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="231" name="Constant_25013" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="232" name="__module.model.model.decoder/prim::ListConstruct_2" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="233" name="__module.model.model.decoder/aten::expand/Broadcast" type="Broadcast" version="opset3"> |
|
<data mode="bidirectional" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="102,148,149,150,264,265,266,attention_mask"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="234" name="Constant_19593" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="235" name="Constant_27161" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="236" name="Reshape_27162" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="I64" /> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="237" name="Add_27165" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="I64" names="147,263"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="238" name="Constant_19596" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="55911796" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="239" name="Constant_19591" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="57562528" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="240" name="__module.model.model.decoder.layers.0.self_attn/aten::slice/Slice_3" type="Slice" version="opset8"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="4" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="5" precision="FP32" names="151,267"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="241" name="__module.model.model.decoder.layers.0.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> |
|
<data causal="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="152,attn_output.1"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="242" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="243" name="__module.model.model.decoder.layers.0.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="153,attn_output.3"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="244" name="Constant_27336" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="57562536" size="24" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="245" name="__module.model.model.decoder.layers.0.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="155"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="246" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="57562560" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="247" name="Convert_721089" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="248" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="58086848" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="249" name="Convert_721092" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="250" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="251" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="58090944" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="252" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="253" name="Constant_721097" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="254" name="Reshape_721098" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="255" name="self.model.model.decoder.layers.0.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="256" name="__module.model.model.decoder.layers.0.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="257" name="Constant_26711" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="58107328" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="258" name="__module.model.model.decoder.layers.0.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="158,160,input.3"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="259" name="__module.model.model.decoder.layers.0/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="164,residual.3"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="260" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="55911804" size="4" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="261" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="262" name="Constant_26712" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="58111424" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="263" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="264" name="Constant_26713" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="58115520" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="265" name="__module.model.model.decoder.layers.0.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="168,hidden_states.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="266" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="58119616" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="267" name="Convert_725388" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="268" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="58643904" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="269" name="Convert_725391" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="270" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="271" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="58648000" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="272" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="273" name="Constant_725396" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="274" name="Reshape_725397" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="275" name="self.model.model.decoder.layers.0.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="276" name="__module.model.model.decoder.layers.0.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="277" name="Constant_26714" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="58664384" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="278" name="__module.model.model.decoder.layers.0.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="177,tensor.7"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="279" name="Constant_27337" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="280" name="__module.model.model.decoder.layers.0.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="179"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="281" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="282" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="180"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="283" name="__module.model.model.decoder.layers.0.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> |
|
<data causal="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="195,attn_output.5"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="284" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="285" name="__module.model.model.decoder.layers.0.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="196,attn_output.7"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="286" name="Constant_27340" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="57562536" size="24" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="287" name="__module.model.model.decoder.layers.0.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="198"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="288" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="58668480" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="289" name="Convert_729687" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="290" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="59192768" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="291" name="Convert_729690" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="292" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="293" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="59196864" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="294" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="295" name="Constant_729695" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="296" name="Reshape_729696" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="297" name="self.model.model.decoder.layers.0.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="298" name="__module.model.model.decoder.layers.0.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="299" name="Constant_26716" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="59213248" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="300" name="__module.model.model.decoder.layers.0.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="201,input.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="301" name="__module.model.model.decoder.layers.0/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="203,residual.5"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="302" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="55911804" size="4" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="303" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="304" name="Constant_26717" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="59217344" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="305" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="306" name="Constant_26718" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="59221440" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="307" name="__module.model.model.decoder.layers.0.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="207"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="308" name="self.model.model.decoder.layers.0.fc1.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="4096, 8, 128" offset="59225536" size="2097152" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="309" name="Convert_673800" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="310" name="self.model.model.decoder.layers.0.fc1.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="4096, 8, 1" offset="61322688" size="16384" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="311" name="Convert_673803" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="312" name="self.model.model.decoder.layers.0.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="313" name="self.model.model.decoder.layers.0.fc1.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="4096, 8, 1" offset="61339072" size="65536" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="314" name="self.model.model.decoder.layers.0.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="315" name="Constant_673808" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="61404608" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="316" name="Reshape_673809" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="317" name="self.model.model.decoder.layers.0.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="318" name="__module.model.model.decoder.layers.0.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="319" name="Constant_26719" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 4096" offset="61404624" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="320" name="__module.model.model.decoder.layers.0.fc1/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="210"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="321" name="__module.model.model.decoder.layers.0.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> |
|
<data approximation_mode="ERF" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="211,input.7"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="322" name="self.model.model.decoder.layers.0.fc2.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 32, 128" offset="61421008" size="2097152" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="323" name="Convert_678099" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="324" name="self.model.model.decoder.layers.0.fc2.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 32, 1" offset="63518160" size="16384" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="325" name="Convert_678102" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="326" name="self.model.model.decoder.layers.0.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="327" name="self.model.model.decoder.layers.0.fc2.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 32, 1" offset="63534544" size="65536" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="328" name="self.model.model.decoder.layers.0.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="329" name="Constant_678107" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="63600080" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="330" name="Reshape_678108" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="331" name="self.model.model.decoder.layers.0.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="332" name="__module.model.model.decoder.layers.0.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="333" name="Constant_26720" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="63600096" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="334" name="__module.model.model.decoder.layers.0.fc2/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="215,input.9"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="335" name="__module.model.model.decoder.layers.0/aten::add/Add_2" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="217,219,residual.7"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="336" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="55911804" size="4" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="337" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="338" name="Constant_26721" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="63604192" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="339" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="340" name="Constant_26722" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="63608288" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="341" name="__module.model.model.decoder.layers.1.self_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="232,hidden_states.11"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="342" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="63612384" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="343" name="Convert_733986" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="344" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="64136672" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="345" name="Convert_733989" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="346" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="347" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="64140768" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="348" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="349" name="Constant_733994" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="350" name="Reshape_733995" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="351" name="self.model.model.decoder.layers.1.self_attn.v_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="352" name="__module.model.model.decoder.layers.1.self_attn.v_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="353" name="Constant_26723" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="64157152" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="354" name="__module.model.model.decoder.layers.1.self_attn.v_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="254,tensor.17"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="355" name="Constant_27341" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="356" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="256"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="357" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="358" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="257"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="359" name="__module.model.model.decoder.layers.1.self_attn/aten::cat/Concat" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="present.1.decoder.value"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="361" name="Constant_29449" type="Const" version="opset1"> |
|
<data element_type="f32" shape="" offset="2187328" size="4" /> |
|
<output> |
|
<port id="0" precision="FP32" /> |
|
</output> |
|
</layer> |
|
<layer id="362" name="Constant_29442" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187340" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="363" name="Constant_29444" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="364" name="Constant_29446" type="Const" version="opset1"> |
|
<data element_type="i64" shape="1" offset="2187348" size="8" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="365" name="Concat_29447" type="Concat" version="opset1"> |
|
<data axis="0" /> |
|
<input> |
|
<port id="0" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="2" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
<port id="3" precision="I64"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="366" name="Broadcast_29450" type="Broadcast" version="opset3"> |
|
<data mode="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32" /> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="367" name="ReadValue_29013" type="ReadValue" version="opset6"> |
|
<data variable_id="past_key_values.1.decoder.keypresent.1.decoder.key" variable_type="f32" variable_shape="?,16,?,64" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>0</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="past_key_values.1.decoder.key"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="368" name="Constant_28622" type="Const" version="opset1"> |
|
<data element_type="i64" shape="" offset="2187332" size="8" /> |
|
<output> |
|
<port id="0" precision="I64" /> |
|
</output> |
|
</layer> |
|
<layer id="369" name="Gather_28623" type="Gather" version="opset8"> |
|
<data batch_dims="0" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>-1</dim> |
|
</port> |
|
<port id="2" precision="I64" /> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="370" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="64161248" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="371" name="Convert_738285" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="372" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="64685536" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="373" name="Convert_738288" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="374" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="375" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="64689632" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="376" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="377" name="Constant_738293" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="378" name="Reshape_738294" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="379" name="self.model.model.decoder.layers.1.self_attn.k_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="380" name="__module.model.model.decoder.layers.1.self_attn.k_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="247,tensor.15"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="381" name="Constant_27342" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="382" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape_1" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="249"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="383" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_1" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="384" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_1" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="250"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="385" name="__module.model.model.decoder.layers.1.self_attn/aten::cat/Concat_1" type="Concat" version="opset1"> |
|
<data axis="-2" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="key_states"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="389" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="64706016" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="390" name="Convert_742584" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="391" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="65230304" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="392" name="Convert_742587" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="393" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="394" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="65234400" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="395" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="396" name="Constant_742592" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="397" name="Reshape_742593" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="398" name="self.model.model.decoder.layers.1.self_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="399" name="__module.model.model.decoder.layers.1.self_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="400" name="Constant_26724" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="65250784" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="401" name="__module.model.model.decoder.layers.1.self_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="241,tensor.13"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="402" name="Constant_27343" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="403" name="__module.model.model.decoder.layers.1.self_attn/aten::view/Reshape_2" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="243"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="404" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_2" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="405" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_2" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="244"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="406" name="__module.model.model.decoder.layers.1.self_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> |
|
<data causal="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="3" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>1</dim> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="4" precision="FP32" names="268,attn_output.9"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="407" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Constant_3" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="408" name="__module.model.model.decoder.layers.1.self_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="269,attn_output.11"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="409" name="Constant_27344" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="57562536" size="24" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="410" name="__module.model.model.decoder.layers.1.self_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="271"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="411" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="65254880" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="412" name="Convert_746883" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="413" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="65779168" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="414" name="Convert_746886" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="415" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="416" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="65783264" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="417" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="418" name="Constant_746891" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="419" name="Reshape_746892" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="420" name="self.model.model.decoder.layers.1.self_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="421" name="__module.model.model.decoder.layers.1.self_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="422" name="Constant_26725" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="65799648" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="423" name="__module.model.model.decoder.layers.1.self_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="274,276,input.11"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="424" name="__module.model.model.decoder.layers.1/aten::add/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="280,residual.9"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="425" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="55911804" size="4" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="426" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="427" name="Constant_26726" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="65803744" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="428" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="429" name="Constant_26727" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="65807840" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="430" name="__module.model.model.decoder.layers.1.encoder_attn_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="284,hidden_states.15"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="431" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="65811936" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="432" name="Convert_751182" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="433" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="66336224" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="434" name="Convert_751185" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="435" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="436" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="66340320" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="437" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="438" name="Constant_751190" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="439" name="Reshape_751191" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="440" name="self.model.model.decoder.layers.1.encoder_attn.q_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="441" name="__module.model.model.decoder.layers.1.encoder_attn.q_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="442" name="Constant_26728" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="66356704" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="443" name="__module.model.model.decoder.layers.1.encoder_attn.q_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="293,tensor.19"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="444" name="Constant_27345" type="Const" version="opset1"> |
|
<data element_type="i64" shape="4" offset="544784" size="32" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="445" name="__module.model.model.decoder.layers.1.encoder_attn/aten::view/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="295"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="446" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="447" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="296"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="448" name="__module.model.model.decoder.layers.1.encoder_attn/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13"> |
|
<data causal="false" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="3" precision="FP32" names="311,attn_output.13"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="449" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Constant_3" type="Const" version="opset1"> |
|
<data element_type="i32" shape="4" offset="544816" size="16" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="450" name="__module.model.model.decoder.layers.1.encoder_attn/aten::transpose/Transpose_3" type="Transpose" version="opset1"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>4</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="312,attn_output"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="451" name="Constant_27348" type="Const" version="opset1"> |
|
<data element_type="i64" shape="3" offset="57562536" size="24" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="452" name="__module.model.model.decoder.layers.1.encoder_attn/aten::reshape/Reshape" type="Reshape" version="opset1"> |
|
<data special_zero="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>64</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>3</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="314"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="453" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 128" offset="66360800" size="524288" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="454" name="Convert_755481" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="455" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 8, 1" offset="66885088" size="4096" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="456" name="Convert_755484" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="457" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="458" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 8, 1" offset="66889184" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="459" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="460" name="Constant_755489" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="544768" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="461" name="Reshape_755490" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="462" name="self.model.model.decoder.layers.1.encoder_attn.out_proj.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="463" name="__module.model.model.decoder.layers.1.encoder_attn.out_proj/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="464" name="Constant_26730" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="66905568" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="465" name="__module.model.model.decoder.layers.1.encoder_attn.out_proj/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="317,input.13"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="466" name="__module.model.model.decoder.layers.1/aten::add/Add_1" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="319,residual"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="467" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="55911804" size="4" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="468" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="469" name="Constant_26731" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="66909664" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="470" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="471" name="Constant_26732" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="66913760" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="472" name="__module.model.model.decoder.layers.1.final_layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="323"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="473" name="self.model.model.decoder.layers.1.fc1.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="4096, 8, 128" offset="66917856" size="2097152" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="474" name="Convert_682398" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="475" name="self.model.model.decoder.layers.1.fc1.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="4096, 8, 1" offset="69015008" size="16384" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="476" name="Convert_682401" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="477" name="self.model.model.decoder.layers.1.fc1.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="478" name="self.model.model.decoder.layers.1.fc1.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="4096, 8, 1" offset="69031392" size="65536" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="479" name="self.model.model.decoder.layers.1.fc1.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="480" name="Constant_682406" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="61404608" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="481" name="Reshape_682407" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>8</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="482" name="self.model.model.decoder.layers.1.fc1.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="483" name="__module.model.model.decoder.layers.1.fc1/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>4096</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="484" name="Constant_26733" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 4096" offset="69096928" size="16384" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="485" name="__module.model.model.decoder.layers.1.fc1/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="326"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="486" name="__module.model.model.decoder.layers.1.activation_fn/aten::gelu/Gelu" type="Gelu" version="opset7"> |
|
<data approximation_mode="ERF" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32" names="327,input.15"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="487" name="self.model.model.decoder.layers.1.fc2.weight" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 32, 128" offset="69113312" size="2097152" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="488" name="Convert_686697" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="489" name="self.model.model.decoder.layers.1.fc2.weight/zero_point" type="Const" version="opset1"> |
|
<data element_type="u4" shape="1024, 32, 1" offset="71210464" size="16384" /> |
|
<output> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="490" name="Convert_686700" type="Convert" version="opset1"> |
|
<data destination_type="f16" /> |
|
<input> |
|
<port id="0" precision="U4"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="491" name="self.model.model.decoder.layers.1.fc2.weight/zero_point/subtract" type="Subtract" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="492" name="self.model.model.decoder.layers.1.fc2.weight/scale" type="Const" version="opset1"> |
|
<data element_type="f16" shape="1024, 32, 1" offset="71226848" size="65536" /> |
|
<output> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="493" name="self.model.model.decoder.layers.1.fc2.weight/fq_weights_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="494" name="Constant_686705" type="Const" version="opset1"> |
|
<data element_type="i64" shape="2" offset="63600080" size="16" /> |
|
<output> |
|
<port id="0" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="495" name="Reshape_686706" type="Reshape" version="opset1"> |
|
<data special_zero="false" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>32</dim> |
|
<dim>128</dim> |
|
</port> |
|
<port id="1" precision="I64"> |
|
<dim>2</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="496" name="self.model.model.decoder.layers.1.fc2.weight/fq_weights_1/convert" type="Convert" version="opset1"> |
|
<data destination_type="f32" /> |
|
<input> |
|
<port id="0" precision="FP16"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="497" name="__module.model.model.decoder.layers.1.fc2/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>4096</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1024</dim> |
|
<dim>4096</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="498" name="Constant_26734" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="71292384" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="499" name="__module.model.model.decoder.layers.1.fc2/aten::linear/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="331,input"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="500" name="__module.model.model.decoder.layers.1/aten::add/Add_2" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="333,335"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="501" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Multiply" type="Const" version="opset1"> |
|
<data element_type="i32" shape="1" offset="55911804" size="4" /> |
|
<output> |
|
<port id="0" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="502" name="__module.model.model.decoder.layer_norm/aten::layer_norm/MVN" type="MVN" version="opset6"> |
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="I32"> |
|
<dim>1</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="503" name="Constant_26735" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="71296480" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="504" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="505" name="Constant_26736" type="Const" version="opset1"> |
|
<data element_type="f32" shape="1, 1, 1024" offset="71300576" size="4096" /> |
|
<output> |
|
<port id="0" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="506" name="__module.model.model.decoder.layer_norm/aten::layer_norm/Add" type="Add" version="opset1"> |
|
<data auto_broadcast="numpy" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>1</dim> |
|
<dim>1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="341,343,349"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="507" name="__module.model.proj_out/aten::linear/MatMul" type="MatMul" version="opset1"> |
|
<data transpose_a="false" transpose_b="true" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>1024</dim> |
|
</port> |
|
<port id="1" precision="FP32"> |
|
<dim>51864</dim> |
|
<dim>1024</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="2" precision="FP32" names="logits"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>51864</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="388" name="Assign_29010" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.0.decoder.keypresent.0.decoder.key" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="387" name="Assign_29012" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.0.decoder.valuepresent.0.decoder.value" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="386" name="Assign_29014" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.1.decoder.keypresent.1.decoder.key" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="360" name="Assign_29016" type="Assign" version="opset6"> |
|
<data variable_id="past_key_values.1.decoder.valuepresent.1.decoder.value" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="75" name="Assign_29844" type="Assign" version="opset6"> |
|
<data variable_id="309" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="56" name="Assign_29846" type="Assign" version="opset6"> |
|
<data variable_id="193" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="37" name="Assign_29848" type="Assign" version="opset6"> |
|
<data variable_id="302" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="20" name="Assign_29850" type="Assign" version="opset6"> |
|
<data variable_id="186" /> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</input> |
|
<output> |
|
<port id="1" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>16</dim> |
|
<dim>-1</dim> |
|
<dim>64</dim> |
|
</port> |
|
</output> |
|
</layer> |
|
<layer id="508" name="Result_20558" type="Result" version="opset1" output_names="logits"> |
|
<input> |
|
<port id="0" precision="FP32"> |
|
<dim>-1</dim> |
|
<dim>-1</dim> |
|
<dim>51864</dim> |
|
</port> |
|
</input> |
|
</layer> |
|
</layers> |
|
<edges> |
|
<edge from-layer="0" from-port="0" to-layer="88" to-port="1" /> |
|
<edge from-layer="0" from-port="0" to-layer="369" to-port="1" /> |
|
<edge from-layer="0" from-port="0" to-layer="179" to-port="1" /> |
|
<edge from-layer="0" from-port="0" to-layer="154" to-port="1" /> |
|
<edge from-layer="1" from-port="0" to-layer="111" to-port="0" /> |
|
<edge from-layer="1" from-port="0" to-layer="214" to-port="0" /> |
|
<edge from-layer="2" from-port="0" to-layer="14" to-port="0" /> |
|
<edge from-layer="2" from-port="0" to-layer="67" to-port="0" /> |
|
<edge from-layer="2" from-port="0" to-layer="48" to-port="0" /> |
|
<edge from-layer="2" from-port="0" to-layer="31" to-port="0" /> |
|
<edge from-layer="3" from-port="0" to-layer="98" to-port="0" /> |
|
<edge from-layer="3" from-port="0" to-layer="112" to-port="0" /> |
|
<edge from-layer="3" from-port="0" to-layer="77" to-port="0" /> |
|
<edge from-layer="4" from-port="0" to-layer="5" to-port="0" /> |
|
<edge from-layer="5" from-port="1" to-layer="8" to-port="0" /> |
|
<edge from-layer="6" from-port="0" to-layer="7" to-port="0" /> |
|
<edge from-layer="7" from-port="1" to-layer="8" to-port="1" /> |
|
<edge from-layer="8" from-port="2" to-layer="10" to-port="0" /> |
|
<edge from-layer="9" from-port="0" to-layer="10" to-port="1" /> |
|
<edge from-layer="10" from-port="2" to-layer="12" to-port="0" /> |
|
<edge from-layer="11" from-port="0" to-layer="12" to-port="1" /> |
|
<edge from-layer="12" from-port="2" to-layer="13" to-port="0" /> |
|
<edge from-layer="13" from-port="1" to-layer="14" to-port="1" /> |
|
<edge from-layer="14" from-port="2" to-layer="16" to-port="0" /> |
|
<edge from-layer="15" from-port="0" to-layer="16" to-port="1" /> |
|
<edge from-layer="16" from-port="2" to-layer="18" to-port="0" /> |
|
<edge from-layer="17" from-port="0" to-layer="18" to-port="1" /> |
|
<edge from-layer="18" from-port="2" to-layer="19" to-port="0" /> |
|
<edge from-layer="19" from-port="1" to-layer="283" to-port="1" /> |
|
<edge from-layer="19" from-port="1" to-layer="20" to-port="0" /> |
|
<edge from-layer="21" from-port="0" to-layer="22" to-port="0" /> |
|
<edge from-layer="22" from-port="1" to-layer="25" to-port="0" /> |
|
<edge from-layer="23" from-port="0" to-layer="24" to-port="0" /> |
|
<edge from-layer="24" from-port="1" to-layer="25" to-port="1" /> |
|
<edge from-layer="25" from-port="2" to-layer="27" to-port="0" /> |
|
<edge from-layer="26" from-port="0" to-layer="27" to-port="1" /> |
|
<edge from-layer="27" from-port="2" to-layer="29" to-port="0" /> |
|
<edge from-layer="28" from-port="0" to-layer="29" to-port="1" /> |
|
<edge from-layer="29" from-port="2" to-layer="30" to-port="0" /> |
|
<edge from-layer="30" from-port="1" to-layer="31" to-port="1" /> |
|
<edge from-layer="31" from-port="2" to-layer="33" to-port="0" /> |
|
<edge from-layer="32" from-port="0" to-layer="33" to-port="1" /> |
|
<edge from-layer="33" from-port="2" to-layer="35" to-port="0" /> |
|
<edge from-layer="34" from-port="0" to-layer="35" to-port="1" /> |
|
<edge from-layer="35" from-port="2" to-layer="36" to-port="0" /> |
|
<edge from-layer="36" from-port="1" to-layer="448" to-port="1" /> |
|
<edge from-layer="36" from-port="1" to-layer="37" to-port="0" /> |
|
<edge from-layer="38" from-port="0" to-layer="39" to-port="0" /> |
|
<edge from-layer="39" from-port="1" to-layer="42" to-port="0" /> |
|
<edge from-layer="40" from-port="0" to-layer="41" to-port="0" /> |
|
<edge from-layer="41" from-port="1" to-layer="42" to-port="1" /> |
|
<edge from-layer="42" from-port="2" to-layer="44" to-port="0" /> |
|
<edge from-layer="43" from-port="0" to-layer="44" to-port="1" /> |
|
<edge from-layer="44" from-port="2" to-layer="46" to-port="0" /> |
|
<edge from-layer="45" from-port="0" to-layer="46" to-port="1" /> |
|
<edge from-layer="46" from-port="2" to-layer="47" to-port="0" /> |
|
<edge from-layer="47" from-port="1" to-layer="48" to-port="1" /> |
|
<edge from-layer="48" from-port="2" to-layer="50" to-port="0" /> |
|
<edge from-layer="49" from-port="0" to-layer="50" to-port="1" /> |
|
<edge from-layer="50" from-port="2" to-layer="52" to-port="0" /> |
|
<edge from-layer="51" from-port="0" to-layer="52" to-port="1" /> |
|
<edge from-layer="52" from-port="2" to-layer="54" to-port="0" /> |
|
<edge from-layer="53" from-port="0" to-layer="54" to-port="1" /> |
|
<edge from-layer="54" from-port="2" to-layer="55" to-port="0" /> |
|
<edge from-layer="55" from-port="1" to-layer="56" to-port="0" /> |
|
<edge from-layer="55" from-port="1" to-layer="283" to-port="2" /> |
|
<edge from-layer="57" from-port="0" to-layer="58" to-port="0" /> |
|
<edge from-layer="58" from-port="1" to-layer="61" to-port="0" /> |
|
<edge from-layer="59" from-port="0" to-layer="60" to-port="0" /> |
|
<edge from-layer="60" from-port="1" to-layer="61" to-port="1" /> |
|
<edge from-layer="61" from-port="2" to-layer="63" to-port="0" /> |
|
<edge from-layer="62" from-port="0" to-layer="63" to-port="1" /> |
|
<edge from-layer="63" from-port="2" to-layer="65" to-port="0" /> |
|
<edge from-layer="64" from-port="0" to-layer="65" to-port="1" /> |
|
<edge from-layer="65" from-port="2" to-layer="66" to-port="0" /> |
|
<edge from-layer="66" from-port="1" to-layer="67" to-port="1" /> |
|
<edge from-layer="67" from-port="2" to-layer="69" to-port="0" /> |
|
<edge from-layer="68" from-port="0" to-layer="69" to-port="1" /> |
|
<edge from-layer="69" from-port="2" to-layer="71" to-port="0" /> |
|
<edge from-layer="70" from-port="0" to-layer="71" to-port="1" /> |
|
<edge from-layer="71" from-port="2" to-layer="73" to-port="0" /> |
|
<edge from-layer="72" from-port="0" to-layer="73" to-port="1" /> |
|
<edge from-layer="73" from-port="2" to-layer="74" to-port="0" /> |
|
<edge from-layer="74" from-port="1" to-layer="75" to-port="0" /> |
|
<edge from-layer="74" from-port="1" to-layer="448" to-port="2" /> |
|
<edge from-layer="76" from-port="0" to-layer="85" to-port="0" /> |
|
<edge from-layer="77" from-port="1" to-layer="80" to-port="0" /> |
|
<edge from-layer="78" from-port="0" to-layer="80" to-port="1" /> |
|
<edge from-layer="79" from-port="0" to-layer="80" to-port="2" /> |
|
<edge from-layer="80" from-port="3" to-layer="150" to-port="0" /> |
|
<edge from-layer="80" from-port="3" to-layer="175" to-port="0" /> |
|
<edge from-layer="80" from-port="3" to-layer="365" to-port="0" /> |
|
<edge from-layer="80" from-port="3" to-layer="84" to-port="0" /> |
|
<edge from-layer="81" from-port="0" to-layer="84" to-port="1" /> |
|
<edge from-layer="82" from-port="0" to-layer="84" to-port="2" /> |
|
<edge from-layer="83" from-port="0" to-layer="84" to-port="3" /> |
|
<edge from-layer="84" from-port="4" to-layer="85" to-port="1" /> |
|
<edge from-layer="85" from-port="2" to-layer="86" to-port="0" /> |
|
<edge from-layer="86" from-port="1" to-layer="88" to-port="0" /> |
|
<edge from-layer="87" from-port="0" to-layer="88" to-port="2" /> |
|
<edge from-layer="88" from-port="3" to-layer="359" to-port="0" /> |
|
<edge from-layer="89" from-port="0" to-layer="90" to-port="0" /> |
|
<edge from-layer="90" from-port="1" to-layer="93" to-port="0" /> |
|
<edge from-layer="91" from-port="0" to-layer="92" to-port="0" /> |
|
<edge from-layer="92" from-port="1" to-layer="93" to-port="1" /> |
|
<edge from-layer="93" from-port="2" to-layer="95" to-port="0" /> |
|
<edge from-layer="94" from-port="0" to-layer="95" to-port="1" /> |
|
<edge from-layer="95" from-port="2" to-layer="96" to-port="0" /> |
|
<edge from-layer="96" from-port="1" to-layer="101" to-port="0" /> |
|
<edge from-layer="96" from-port="1" to-layer="507" to-port="1" /> |
|
<edge from-layer="97" from-port="0" to-layer="98" to-port="1" /> |
|
<edge from-layer="98" from-port="2" to-layer="99" to-port="0" /> |
|
<edge from-layer="99" from-port="1" to-layer="101" to-port="1" /> |
|
<edge from-layer="100" from-port="0" to-layer="101" to-port="2" /> |
|
<edge from-layer="101" from-port="3" to-layer="122" to-port="0" /> |
|
<edge from-layer="102" from-port="0" to-layer="103" to-port="0" /> |
|
<edge from-layer="103" from-port="1" to-layer="106" to-port="0" /> |
|
<edge from-layer="104" from-port="0" to-layer="105" to-port="0" /> |
|
<edge from-layer="105" from-port="1" to-layer="106" to-port="1" /> |
|
<edge from-layer="106" from-port="2" to-layer="108" to-port="0" /> |
|
<edge from-layer="107" from-port="0" to-layer="108" to-port="1" /> |
|
<edge from-layer="108" from-port="2" to-layer="109" to-port="0" /> |
|
<edge from-layer="109" from-port="1" to-layer="121" to-port="0" /> |
|
<edge from-layer="110" from-port="0" to-layer="226" to-port="1" /> |
|
<edge from-layer="110" from-port="0" to-layer="111" to-port="1" /> |
|
<edge from-layer="111" from-port="2" to-layer="118" to-port="0" /> |
|
<edge from-layer="112" from-port="1" to-layer="206" to-port="0" /> |
|
<edge from-layer="112" from-port="1" to-layer="115" to-port="0" /> |
|
<edge from-layer="113" from-port="0" to-layer="115" to-port="1" /> |
|
<edge from-layer="114" from-port="0" to-layer="115" to-port="2" /> |
|
<edge from-layer="115" from-port="3" to-layer="232" to-port="0" /> |
|
<edge from-layer="115" from-port="3" to-layer="117" to-port="0" /> |
|
<edge from-layer="116" from-port="0" to-layer="117" to-port="1" /> |
|
<edge from-layer="117" from-port="2" to-layer="118" to-port="1" /> |
|
<edge from-layer="118" from-port="2" to-layer="119" to-port="0" /> |
|
<edge from-layer="119" from-port="1" to-layer="121" to-port="1" /> |
|
<edge from-layer="120" from-port="0" to-layer="121" to-port="2" /> |
|
<edge from-layer="121" from-port="3" to-layer="122" to-port="1" /> |
|
<edge from-layer="122" from-port="2" to-layer="259" to-port="0" /> |
|
<edge from-layer="122" from-port="2" to-layer="124" to-port="0" /> |
|
<edge from-layer="123" from-port="0" to-layer="124" to-port="1" /> |
|
<edge from-layer="124" from-port="2" to-layer="126" to-port="0" /> |
|
<edge from-layer="125" from-port="0" to-layer="126" to-port="1" /> |
|
<edge from-layer="126" from-port="2" to-layer="128" to-port="0" /> |
|
<edge from-layer="127" from-port="0" to-layer="128" to-port="1" /> |
|
<edge from-layer="128" from-port="2" to-layer="165" to-port="0" /> |
|
<edge from-layer="128" from-port="2" to-layer="190" to-port="0" /> |
|
<edge from-layer="128" from-port="2" to-layer="139" to-port="0" /> |
|
<edge from-layer="129" from-port="0" to-layer="130" to-port="0" /> |
|
<edge from-layer="130" from-port="1" to-layer="133" to-port="0" /> |
|
<edge from-layer="131" from-port="0" to-layer="132" to-port="0" /> |
|
<edge from-layer="132" from-port="1" to-layer="133" to-port="1" /> |
|
<edge from-layer="133" from-port="2" to-layer="135" to-port="0" /> |
|
<edge from-layer="134" from-port="0" to-layer="135" to-port="1" /> |
|
<edge from-layer="135" from-port="2" to-layer="137" to-port="0" /> |
|
<edge from-layer="136" from-port="0" to-layer="137" to-port="1" /> |
|
<edge from-layer="137" from-port="2" to-layer="138" to-port="0" /> |
|
<edge from-layer="138" from-port="1" to-layer="139" to-port="1" /> |
|
<edge from-layer="139" from-port="2" to-layer="141" to-port="0" /> |
|
<edge from-layer="140" from-port="0" to-layer="141" to-port="1" /> |
|
<edge from-layer="141" from-port="2" to-layer="143" to-port="0" /> |
|
<edge from-layer="142" from-port="0" to-layer="143" to-port="1" /> |
|
<edge from-layer="143" from-port="2" to-layer="145" to-port="0" /> |
|
<edge from-layer="144" from-port="0" to-layer="145" to-port="1" /> |
|
<edge from-layer="145" from-port="2" to-layer="241" to-port="0" /> |
|
<edge from-layer="146" from-port="0" to-layer="151" to-port="0" /> |
|
<edge from-layer="147" from-port="0" to-layer="150" to-port="1" /> |
|
<edge from-layer="148" from-port="0" to-layer="150" to-port="2" /> |
|
<edge from-layer="149" from-port="0" to-layer="150" to-port="3" /> |
|
<edge from-layer="150" from-port="4" to-layer="151" to-port="1" /> |
|
<edge from-layer="151" from-port="2" to-layer="152" to-port="0" /> |
|
<edge from-layer="152" from-port="1" to-layer="154" to-port="0" /> |
|
<edge from-layer="153" from-port="0" to-layer="154" to-port="2" /> |
|
<edge from-layer="154" from-port="3" to-layer="170" to-port="0" /> |
|
<edge from-layer="154" from-port="3" to-layer="200" to-port="0" /> |
|
<edge from-layer="155" from-port="0" to-layer="156" to-port="0" /> |
|
<edge from-layer="156" from-port="1" to-layer="159" to-port="0" /> |
|
<edge from-layer="157" from-port="0" to-layer="158" to-port="0" /> |
|
<edge from-layer="158" from-port="1" to-layer="159" to-port="1" /> |
|
<edge from-layer="159" from-port="2" to-layer="161" to-port="0" /> |
|
<edge from-layer="160" from-port="0" to-layer="161" to-port="1" /> |
|
<edge from-layer="161" from-port="2" to-layer="163" to-port="0" /> |
|
<edge from-layer="162" from-port="0" to-layer="163" to-port="1" /> |
|
<edge from-layer="163" from-port="2" to-layer="164" to-port="0" /> |
|
<edge from-layer="164" from-port="1" to-layer="165" to-port="1" /> |
|
<edge from-layer="165" from-port="2" to-layer="167" to-port="0" /> |
|
<edge from-layer="166" from-port="0" to-layer="167" to-port="1" /> |
|
<edge from-layer="167" from-port="2" to-layer="169" to-port="0" /> |
|
<edge from-layer="168" from-port="0" to-layer="169" to-port="1" /> |
|
<edge from-layer="169" from-port="2" to-layer="170" to-port="1" /> |
|
<edge from-layer="170" from-port="2" to-layer="388" to-port="0" /> |
|
<edge from-layer="170" from-port="2" to-layer="241" to-port="1" /> |
|
<edge from-layer="171" from-port="0" to-layer="176" to-port="0" /> |
|
<edge from-layer="172" from-port="0" to-layer="175" to-port="1" /> |
|
<edge from-layer="173" from-port="0" to-layer="175" to-port="2" /> |
|
<edge from-layer="174" from-port="0" to-layer="175" to-port="3" /> |
|
<edge from-layer="175" from-port="4" to-layer="176" to-port="1" /> |
|
<edge from-layer="176" from-port="2" to-layer="177" to-port="0" /> |
|
<edge from-layer="177" from-port="1" to-layer="179" to-port="0" /> |
|
<edge from-layer="178" from-port="0" to-layer="179" to-port="2" /> |
|
<edge from-layer="179" from-port="3" to-layer="197" to-port="0" /> |
|
<edge from-layer="180" from-port="0" to-layer="181" to-port="0" /> |
|
<edge from-layer="181" from-port="1" to-layer="184" to-port="0" /> |
|
<edge from-layer="182" from-port="0" to-layer="183" to-port="0" /> |
|
<edge from-layer="183" from-port="1" to-layer="184" to-port="1" /> |
|
<edge from-layer="184" from-port="2" to-layer="186" to-port="0" /> |
|
<edge from-layer="185" from-port="0" to-layer="186" to-port="1" /> |
|
<edge from-layer="186" from-port="2" to-layer="188" to-port="0" /> |
|
<edge from-layer="187" from-port="0" to-layer="188" to-port="1" /> |
|
<edge from-layer="188" from-port="2" to-layer="189" to-port="0" /> |
|
<edge from-layer="189" from-port="1" to-layer="190" to-port="1" /> |
|
<edge from-layer="190" from-port="2" to-layer="192" to-port="0" /> |
|
<edge from-layer="191" from-port="0" to-layer="192" to-port="1" /> |
|
<edge from-layer="192" from-port="2" to-layer="194" to-port="0" /> |
|
<edge from-layer="193" from-port="0" to-layer="194" to-port="1" /> |
|
<edge from-layer="194" from-port="2" to-layer="196" to-port="0" /> |
|
<edge from-layer="195" from-port="0" to-layer="196" to-port="1" /> |
|
<edge from-layer="196" from-port="2" to-layer="197" to-port="1" /> |
|
<edge from-layer="197" from-port="2" to-layer="387" to-port="0" /> |
|
<edge from-layer="197" from-port="2" to-layer="241" to-port="2" /> |
|
<edge from-layer="198" from-port="0" to-layer="217" to-port="0" /> |
|
<edge from-layer="199" from-port="0" to-layer="211" to-port="0" /> |
|
<edge from-layer="200" from-port="1" to-layer="203" to-port="0" /> |
|
<edge from-layer="201" from-port="0" to-layer="203" to-port="1" /> |
|
<edge from-layer="202" from-port="0" to-layer="203" to-port="2" /> |
|
<edge from-layer="203" from-port="3" to-layer="207" to-port="0" /> |
|
<edge from-layer="203" from-port="3" to-layer="236" to-port="0" /> |
|
<edge from-layer="204" from-port="0" to-layer="206" to-port="1" /> |
|
<edge from-layer="205" from-port="0" to-layer="206" to-port="2" /> |
|
<edge from-layer="206" from-port="3" to-layer="220" to-port="0" /> |
|
<edge from-layer="206" from-port="3" to-layer="207" to-port="1" /> |
|
<edge from-layer="207" from-port="2" to-layer="209" to-port="0" /> |
|
<edge from-layer="208" from-port="0" to-layer="209" to-port="1" /> |
|
<edge from-layer="209" from-port="2" to-layer="211" to-port="1" /> |
|
<edge from-layer="209" from-port="2" to-layer="222" to-port="0" /> |
|
<edge from-layer="210" from-port="0" to-layer="211" to-port="2" /> |
|
<edge from-layer="211" from-port="3" to-layer="212" to-port="0" /> |
|
<edge from-layer="212" from-port="1" to-layer="215" to-port="0" /> |
|
<edge from-layer="213" from-port="0" to-layer="214" to-port="1" /> |
|
<edge from-layer="214" from-port="2" to-layer="215" to-port="1" /> |
|
<edge from-layer="215" from-port="2" to-layer="216" to-port="0" /> |
|
<edge from-layer="216" from-port="1" to-layer="217" to-port="1" /> |
|
<edge from-layer="217" from-port="2" to-layer="225" to-port="0" /> |
|
<edge from-layer="217" from-port="2" to-layer="218" to-port="0" /> |
|
<edge from-layer="218" from-port="1" to-layer="224" to-port="0" /> |
|
<edge from-layer="219" from-port="0" to-layer="220" to-port="1" /> |
|
<edge from-layer="220" from-port="2" to-layer="237" to-port="1" /> |
|
<edge from-layer="220" from-port="2" to-layer="223" to-port="0" /> |
|
<edge from-layer="221" from-port="0" to-layer="222" to-port="1" /> |
|
<edge from-layer="222" from-port="2" to-layer="223" to-port="1" /> |
|
<edge from-layer="223" from-port="2" to-layer="224" to-port="1" /> |
|
<edge from-layer="224" from-port="2" to-layer="225" to-port="1" /> |
|
<edge from-layer="225" from-port="2" to-layer="226" to-port="0" /> |
|
<edge from-layer="226" from-port="2" to-layer="228" to-port="0" /> |
|
<edge from-layer="227" from-port="0" to-layer="228" to-port="1" /> |
|
<edge from-layer="228" from-port="2" to-layer="233" to-port="0" /> |
|
<edge from-layer="229" from-port="0" to-layer="232" to-port="1" /> |
|
<edge from-layer="230" from-port="0" to-layer="232" to-port="2" /> |
|
<edge from-layer="231" from-port="0" to-layer="232" to-port="3" /> |
|
<edge from-layer="232" from-port="4" to-layer="233" to-port="1" /> |
|
<edge from-layer="233" from-port="2" to-layer="240" to-port="0" /> |
|
<edge from-layer="234" from-port="0" to-layer="240" to-port="1" /> |
|
<edge from-layer="235" from-port="0" to-layer="236" to-port="1" /> |
|
<edge from-layer="236" from-port="2" to-layer="237" to-port="0" /> |
|
<edge from-layer="237" from-port="2" to-layer="240" to-port="2" /> |
|
<edge from-layer="238" from-port="0" to-layer="240" to-port="3" /> |
|
<edge from-layer="239" from-port="0" to-layer="240" to-port="4" /> |
|
<edge from-layer="240" from-port="5" to-layer="406" to-port="3" /> |
|
<edge from-layer="240" from-port="5" to-layer="241" to-port="3" /> |
|
<edge from-layer="241" from-port="4" to-layer="243" to-port="0" /> |
|
<edge from-layer="242" from-port="0" to-layer="243" to-port="1" /> |
|
<edge from-layer="243" from-port="2" to-layer="245" to-port="0" /> |
|
<edge from-layer="244" from-port="0" to-layer="245" to-port="1" /> |
|
<edge from-layer="245" from-port="2" to-layer="256" to-port="0" /> |
|
<edge from-layer="246" from-port="0" to-layer="247" to-port="0" /> |
|
<edge from-layer="247" from-port="1" to-layer="250" to-port="0" /> |
|
<edge from-layer="248" from-port="0" to-layer="249" to-port="0" /> |
|
<edge from-layer="249" from-port="1" to-layer="250" to-port="1" /> |
|
<edge from-layer="250" from-port="2" to-layer="252" to-port="0" /> |
|
<edge from-layer="251" from-port="0" to-layer="252" to-port="1" /> |
|
<edge from-layer="252" from-port="2" to-layer="254" to-port="0" /> |
|
<edge from-layer="253" from-port="0" to-layer="254" to-port="1" /> |
|
<edge from-layer="254" from-port="2" to-layer="255" to-port="0" /> |
|
<edge from-layer="255" from-port="1" to-layer="256" to-port="1" /> |
|
<edge from-layer="256" from-port="2" to-layer="258" to-port="0" /> |
|
<edge from-layer="257" from-port="0" to-layer="258" to-port="1" /> |
|
<edge from-layer="258" from-port="2" to-layer="259" to-port="1" /> |
|
<edge from-layer="259" from-port="2" to-layer="261" to-port="0" /> |
|
<edge from-layer="259" from-port="2" to-layer="301" to-port="0" /> |
|
<edge from-layer="260" from-port="0" to-layer="261" to-port="1" /> |
|
<edge from-layer="261" from-port="2" to-layer="263" to-port="0" /> |
|
<edge from-layer="262" from-port="0" to-layer="263" to-port="1" /> |
|
<edge from-layer="263" from-port="2" to-layer="265" to-port="0" /> |
|
<edge from-layer="264" from-port="0" to-layer="265" to-port="1" /> |
|
<edge from-layer="265" from-port="2" to-layer="276" to-port="0" /> |
|
<edge from-layer="266" from-port="0" to-layer="267" to-port="0" /> |
|
<edge from-layer="267" from-port="1" to-layer="270" to-port="0" /> |
|
<edge from-layer="268" from-port="0" to-layer="269" to-port="0" /> |
|
<edge from-layer="269" from-port="1" to-layer="270" to-port="1" /> |
|
<edge from-layer="270" from-port="2" to-layer="272" to-port="0" /> |
|
<edge from-layer="271" from-port="0" to-layer="272" to-port="1" /> |
|
<edge from-layer="272" from-port="2" to-layer="274" to-port="0" /> |
|
<edge from-layer="273" from-port="0" to-layer="274" to-port="1" /> |
|
<edge from-layer="274" from-port="2" to-layer="275" to-port="0" /> |
|
<edge from-layer="275" from-port="1" to-layer="276" to-port="1" /> |
|
<edge from-layer="276" from-port="2" to-layer="278" to-port="0" /> |
|
<edge from-layer="277" from-port="0" to-layer="278" to-port="1" /> |
|
<edge from-layer="278" from-port="2" to-layer="280" to-port="0" /> |
|
<edge from-layer="279" from-port="0" to-layer="280" to-port="1" /> |
|
<edge from-layer="280" from-port="2" to-layer="282" to-port="0" /> |
|
<edge from-layer="281" from-port="0" to-layer="282" to-port="1" /> |
|
<edge from-layer="282" from-port="2" to-layer="283" to-port="0" /> |
|
<edge from-layer="283" from-port="3" to-layer="285" to-port="0" /> |
|
<edge from-layer="284" from-port="0" to-layer="285" to-port="1" /> |
|
<edge from-layer="285" from-port="2" to-layer="287" to-port="0" /> |
|
<edge from-layer="286" from-port="0" to-layer="287" to-port="1" /> |
|
<edge from-layer="287" from-port="2" to-layer="298" to-port="0" /> |
|
<edge from-layer="288" from-port="0" to-layer="289" to-port="0" /> |
|
<edge from-layer="289" from-port="1" to-layer="292" to-port="0" /> |
|
<edge from-layer="290" from-port="0" to-layer="291" to-port="0" /> |
|
<edge from-layer="291" from-port="1" to-layer="292" to-port="1" /> |
|
<edge from-layer="292" from-port="2" to-layer="294" to-port="0" /> |
|
<edge from-layer="293" from-port="0" to-layer="294" to-port="1" /> |
|
<edge from-layer="294" from-port="2" to-layer="296" to-port="0" /> |
|
<edge from-layer="295" from-port="0" to-layer="296" to-port="1" /> |
|
<edge from-layer="296" from-port="2" to-layer="297" to-port="0" /> |
|
<edge from-layer="297" from-port="1" to-layer="298" to-port="1" /> |
|
<edge from-layer="298" from-port="2" to-layer="300" to-port="0" /> |
|
<edge from-layer="299" from-port="0" to-layer="300" to-port="1" /> |
|
<edge from-layer="300" from-port="2" to-layer="301" to-port="1" /> |
|
<edge from-layer="301" from-port="2" to-layer="335" to-port="0" /> |
|
<edge from-layer="301" from-port="2" to-layer="303" to-port="0" /> |
|
<edge from-layer="302" from-port="0" to-layer="303" to-port="1" /> |
|
<edge from-layer="303" from-port="2" to-layer="305" to-port="0" /> |
|
<edge from-layer="304" from-port="0" to-layer="305" to-port="1" /> |
|
<edge from-layer="305" from-port="2" to-layer="307" to-port="0" /> |
|
<edge from-layer="306" from-port="0" to-layer="307" to-port="1" /> |
|
<edge from-layer="307" from-port="2" to-layer="318" to-port="0" /> |
|
<edge from-layer="308" from-port="0" to-layer="309" to-port="0" /> |
|
<edge from-layer="309" from-port="1" to-layer="312" to-port="0" /> |
|
<edge from-layer="310" from-port="0" to-layer="311" to-port="0" /> |
|
<edge from-layer="311" from-port="1" to-layer="312" to-port="1" /> |
|
<edge from-layer="312" from-port="2" to-layer="314" to-port="0" /> |
|
<edge from-layer="313" from-port="0" to-layer="314" to-port="1" /> |
|
<edge from-layer="314" from-port="2" to-layer="316" to-port="0" /> |
|
<edge from-layer="315" from-port="0" to-layer="316" to-port="1" /> |
|
<edge from-layer="316" from-port="2" to-layer="317" to-port="0" /> |
|
<edge from-layer="317" from-port="1" to-layer="318" to-port="1" /> |
|
<edge from-layer="318" from-port="2" to-layer="320" to-port="0" /> |
|
<edge from-layer="319" from-port="0" to-layer="320" to-port="1" /> |
|
<edge from-layer="320" from-port="2" to-layer="321" to-port="0" /> |
|
<edge from-layer="321" from-port="1" to-layer="332" to-port="0" /> |
|
<edge from-layer="322" from-port="0" to-layer="323" to-port="0" /> |
|
<edge from-layer="323" from-port="1" to-layer="326" to-port="0" /> |
|
<edge from-layer="324" from-port="0" to-layer="325" to-port="0" /> |
|
<edge from-layer="325" from-port="1" to-layer="326" to-port="1" /> |
|
<edge from-layer="326" from-port="2" to-layer="328" to-port="0" /> |
|
<edge from-layer="327" from-port="0" to-layer="328" to-port="1" /> |
|
<edge from-layer="328" from-port="2" to-layer="330" to-port="0" /> |
|
<edge from-layer="329" from-port="0" to-layer="330" to-port="1" /> |
|
<edge from-layer="330" from-port="2" to-layer="331" to-port="0" /> |
|
<edge from-layer="331" from-port="1" to-layer="332" to-port="1" /> |
|
<edge from-layer="332" from-port="2" to-layer="334" to-port="0" /> |
|
<edge from-layer="333" from-port="0" to-layer="334" to-port="1" /> |
|
<edge from-layer="334" from-port="2" to-layer="335" to-port="1" /> |
|
<edge from-layer="335" from-port="2" to-layer="424" to-port="0" /> |
|
<edge from-layer="335" from-port="2" to-layer="337" to-port="0" /> |
|
<edge from-layer="336" from-port="0" to-layer="337" to-port="1" /> |
|
<edge from-layer="337" from-port="2" to-layer="339" to-port="0" /> |
|
<edge from-layer="338" from-port="0" to-layer="339" to-port="1" /> |
|
<edge from-layer="339" from-port="2" to-layer="341" to-port="0" /> |
|
<edge from-layer="340" from-port="0" to-layer="341" to-port="1" /> |
|
<edge from-layer="341" from-port="2" to-layer="352" to-port="0" /> |
|
<edge from-layer="341" from-port="2" to-layer="399" to-port="0" /> |
|
<edge from-layer="341" from-port="2" to-layer="380" to-port="0" /> |
|
<edge from-layer="342" from-port="0" to-layer="343" to-port="0" /> |
|
<edge from-layer="343" from-port="1" to-layer="346" to-port="0" /> |
|
<edge from-layer="344" from-port="0" to-layer="345" to-port="0" /> |
|
<edge from-layer="345" from-port="1" to-layer="346" to-port="1" /> |
|
<edge from-layer="346" from-port="2" to-layer="348" to-port="0" /> |
|
<edge from-layer="347" from-port="0" to-layer="348" to-port="1" /> |
|
<edge from-layer="348" from-port="2" to-layer="350" to-port="0" /> |
|
<edge from-layer="349" from-port="0" to-layer="350" to-port="1" /> |
|
<edge from-layer="350" from-port="2" to-layer="351" to-port="0" /> |
|
<edge from-layer="351" from-port="1" to-layer="352" to-port="1" /> |
|
<edge from-layer="352" from-port="2" to-layer="354" to-port="0" /> |
|
<edge from-layer="353" from-port="0" to-layer="354" to-port="1" /> |
|
<edge from-layer="354" from-port="2" to-layer="356" to-port="0" /> |
|
<edge from-layer="355" from-port="0" to-layer="356" to-port="1" /> |
|
<edge from-layer="356" from-port="2" to-layer="358" to-port="0" /> |
|
<edge from-layer="357" from-port="0" to-layer="358" to-port="1" /> |
|
<edge from-layer="358" from-port="2" to-layer="359" to-port="1" /> |
|
<edge from-layer="359" from-port="2" to-layer="406" to-port="2" /> |
|
<edge from-layer="359" from-port="2" to-layer="360" to-port="0" /> |
|
<edge from-layer="361" from-port="0" to-layer="366" to-port="0" /> |
|
<edge from-layer="362" from-port="0" to-layer="365" to-port="1" /> |
|
<edge from-layer="363" from-port="0" to-layer="365" to-port="2" /> |
|
<edge from-layer="364" from-port="0" to-layer="365" to-port="3" /> |
|
<edge from-layer="365" from-port="4" to-layer="366" to-port="1" /> |
|
<edge from-layer="366" from-port="2" to-layer="367" to-port="0" /> |
|
<edge from-layer="367" from-port="1" to-layer="369" to-port="0" /> |
|
<edge from-layer="368" from-port="0" to-layer="369" to-port="2" /> |
|
<edge from-layer="369" from-port="3" to-layer="385" to-port="0" /> |
|
<edge from-layer="370" from-port="0" to-layer="371" to-port="0" /> |
|
<edge from-layer="371" from-port="1" to-layer="374" to-port="0" /> |
|
<edge from-layer="372" from-port="0" to-layer="373" to-port="0" /> |
|
<edge from-layer="373" from-port="1" to-layer="374" to-port="1" /> |
|
<edge from-layer="374" from-port="2" to-layer="376" to-port="0" /> |
|
<edge from-layer="375" from-port="0" to-layer="376" to-port="1" /> |
|
<edge from-layer="376" from-port="2" to-layer="378" to-port="0" /> |
|
<edge from-layer="377" from-port="0" to-layer="378" to-port="1" /> |
|
<edge from-layer="378" from-port="2" to-layer="379" to-port="0" /> |
|
<edge from-layer="379" from-port="1" to-layer="380" to-port="1" /> |
|
<edge from-layer="380" from-port="2" to-layer="382" to-port="0" /> |
|
<edge from-layer="381" from-port="0" to-layer="382" to-port="1" /> |
|
<edge from-layer="382" from-port="2" to-layer="384" to-port="0" /> |
|
<edge from-layer="383" from-port="0" to-layer="384" to-port="1" /> |
|
<edge from-layer="384" from-port="2" to-layer="385" to-port="1" /> |
|
<edge from-layer="385" from-port="2" to-layer="386" to-port="0" /> |
|
<edge from-layer="385" from-port="2" to-layer="406" to-port="1" /> |
|
<edge from-layer="389" from-port="0" to-layer="390" to-port="0" /> |
|
<edge from-layer="390" from-port="1" to-layer="393" to-port="0" /> |
|
<edge from-layer="391" from-port="0" to-layer="392" to-port="0" /> |
|
<edge from-layer="392" from-port="1" to-layer="393" to-port="1" /> |
|
<edge from-layer="393" from-port="2" to-layer="395" to-port="0" /> |
|
<edge from-layer="394" from-port="0" to-layer="395" to-port="1" /> |
|
<edge from-layer="395" from-port="2" to-layer="397" to-port="0" /> |
|
<edge from-layer="396" from-port="0" to-layer="397" to-port="1" /> |
|
<edge from-layer="397" from-port="2" to-layer="398" to-port="0" /> |
|
<edge from-layer="398" from-port="1" to-layer="399" to-port="1" /> |
|
<edge from-layer="399" from-port="2" to-layer="401" to-port="0" /> |
|
<edge from-layer="400" from-port="0" to-layer="401" to-port="1" /> |
|
<edge from-layer="401" from-port="2" to-layer="403" to-port="0" /> |
|
<edge from-layer="402" from-port="0" to-layer="403" to-port="1" /> |
|
<edge from-layer="403" from-port="2" to-layer="405" to-port="0" /> |
|
<edge from-layer="404" from-port="0" to-layer="405" to-port="1" /> |
|
<edge from-layer="405" from-port="2" to-layer="406" to-port="0" /> |
|
<edge from-layer="406" from-port="4" to-layer="408" to-port="0" /> |
|
<edge from-layer="407" from-port="0" to-layer="408" to-port="1" /> |
|
<edge from-layer="408" from-port="2" to-layer="410" to-port="0" /> |
|
<edge from-layer="409" from-port="0" to-layer="410" to-port="1" /> |
|
<edge from-layer="410" from-port="2" to-layer="421" to-port="0" /> |
|
<edge from-layer="411" from-port="0" to-layer="412" to-port="0" /> |
|
<edge from-layer="412" from-port="1" to-layer="415" to-port="0" /> |
|
<edge from-layer="413" from-port="0" to-layer="414" to-port="0" /> |
|
<edge from-layer="414" from-port="1" to-layer="415" to-port="1" /> |
|
<edge from-layer="415" from-port="2" to-layer="417" to-port="0" /> |
|
<edge from-layer="416" from-port="0" to-layer="417" to-port="1" /> |
|
<edge from-layer="417" from-port="2" to-layer="419" to-port="0" /> |
|
<edge from-layer="418" from-port="0" to-layer="419" to-port="1" /> |
|
<edge from-layer="419" from-port="2" to-layer="420" to-port="0" /> |
|
<edge from-layer="420" from-port="1" to-layer="421" to-port="1" /> |
|
<edge from-layer="421" from-port="2" to-layer="423" to-port="0" /> |
|
<edge from-layer="422" from-port="0" to-layer="423" to-port="1" /> |
|
<edge from-layer="423" from-port="2" to-layer="424" to-port="1" /> |
|
<edge from-layer="424" from-port="2" to-layer="426" to-port="0" /> |
|
<edge from-layer="424" from-port="2" to-layer="466" to-port="0" /> |
|
<edge from-layer="425" from-port="0" to-layer="426" to-port="1" /> |
|
<edge from-layer="426" from-port="2" to-layer="428" to-port="0" /> |
|
<edge from-layer="427" from-port="0" to-layer="428" to-port="1" /> |
|
<edge from-layer="428" from-port="2" to-layer="430" to-port="0" /> |
|
<edge from-layer="429" from-port="0" to-layer="430" to-port="1" /> |
|
<edge from-layer="430" from-port="2" to-layer="441" to-port="0" /> |
|
<edge from-layer="431" from-port="0" to-layer="432" to-port="0" /> |
|
<edge from-layer="432" from-port="1" to-layer="435" to-port="0" /> |
|
<edge from-layer="433" from-port="0" to-layer="434" to-port="0" /> |
|
<edge from-layer="434" from-port="1" to-layer="435" to-port="1" /> |
|
<edge from-layer="435" from-port="2" to-layer="437" to-port="0" /> |
|
<edge from-layer="436" from-port="0" to-layer="437" to-port="1" /> |
|
<edge from-layer="437" from-port="2" to-layer="439" to-port="0" /> |
|
<edge from-layer="438" from-port="0" to-layer="439" to-port="1" /> |
|
<edge from-layer="439" from-port="2" to-layer="440" to-port="0" /> |
|
<edge from-layer="440" from-port="1" to-layer="441" to-port="1" /> |
|
<edge from-layer="441" from-port="2" to-layer="443" to-port="0" /> |
|
<edge from-layer="442" from-port="0" to-layer="443" to-port="1" /> |
|
<edge from-layer="443" from-port="2" to-layer="445" to-port="0" /> |
|
<edge from-layer="444" from-port="0" to-layer="445" to-port="1" /> |
|
<edge from-layer="445" from-port="2" to-layer="447" to-port="0" /> |
|
<edge from-layer="446" from-port="0" to-layer="447" to-port="1" /> |
|
<edge from-layer="447" from-port="2" to-layer="448" to-port="0" /> |
|
<edge from-layer="448" from-port="3" to-layer="450" to-port="0" /> |
|
<edge from-layer="449" from-port="0" to-layer="450" to-port="1" /> |
|
<edge from-layer="450" from-port="2" to-layer="452" to-port="0" /> |
|
<edge from-layer="451" from-port="0" to-layer="452" to-port="1" /> |
|
<edge from-layer="452" from-port="2" to-layer="463" to-port="0" /> |
|
<edge from-layer="453" from-port="0" to-layer="454" to-port="0" /> |
|
<edge from-layer="454" from-port="1" to-layer="457" to-port="0" /> |
|
<edge from-layer="455" from-port="0" to-layer="456" to-port="0" /> |
|
<edge from-layer="456" from-port="1" to-layer="457" to-port="1" /> |
|
<edge from-layer="457" from-port="2" to-layer="459" to-port="0" /> |
|
<edge from-layer="458" from-port="0" to-layer="459" to-port="1" /> |
|
<edge from-layer="459" from-port="2" to-layer="461" to-port="0" /> |
|
<edge from-layer="460" from-port="0" to-layer="461" to-port="1" /> |
|
<edge from-layer="461" from-port="2" to-layer="462" to-port="0" /> |
|
<edge from-layer="462" from-port="1" to-layer="463" to-port="1" /> |
|
<edge from-layer="463" from-port="2" to-layer="465" to-port="0" /> |
|
<edge from-layer="464" from-port="0" to-layer="465" to-port="1" /> |
|
<edge from-layer="465" from-port="2" to-layer="466" to-port="1" /> |
|
<edge from-layer="466" from-port="2" to-layer="500" to-port="0" /> |
|
<edge from-layer="466" from-port="2" to-layer="468" to-port="0" /> |
|
<edge from-layer="467" from-port="0" to-layer="468" to-port="1" /> |
|
<edge from-layer="468" from-port="2" to-layer="470" to-port="0" /> |
|
<edge from-layer="469" from-port="0" to-layer="470" to-port="1" /> |
|
<edge from-layer="470" from-port="2" to-layer="472" to-port="0" /> |
|
<edge from-layer="471" from-port="0" to-layer="472" to-port="1" /> |
|
<edge from-layer="472" from-port="2" to-layer="483" to-port="0" /> |
|
<edge from-layer="473" from-port="0" to-layer="474" to-port="0" /> |
|
<edge from-layer="474" from-port="1" to-layer="477" to-port="0" /> |
|
<edge from-layer="475" from-port="0" to-layer="476" to-port="0" /> |
|
<edge from-layer="476" from-port="1" to-layer="477" to-port="1" /> |
|
<edge from-layer="477" from-port="2" to-layer="479" to-port="0" /> |
|
<edge from-layer="478" from-port="0" to-layer="479" to-port="1" /> |
|
<edge from-layer="479" from-port="2" to-layer="481" to-port="0" /> |
|
<edge from-layer="480" from-port="0" to-layer="481" to-port="1" /> |
|
<edge from-layer="481" from-port="2" to-layer="482" to-port="0" /> |
|
<edge from-layer="482" from-port="1" to-layer="483" to-port="1" /> |
|
<edge from-layer="483" from-port="2" to-layer="485" to-port="0" /> |
|
<edge from-layer="484" from-port="0" to-layer="485" to-port="1" /> |
|
<edge from-layer="485" from-port="2" to-layer="486" to-port="0" /> |
|
<edge from-layer="486" from-port="1" to-layer="497" to-port="0" /> |
|
<edge from-layer="487" from-port="0" to-layer="488" to-port="0" /> |
|
<edge from-layer="488" from-port="1" to-layer="491" to-port="0" /> |
|
<edge from-layer="489" from-port="0" to-layer="490" to-port="0" /> |
|
<edge from-layer="490" from-port="1" to-layer="491" to-port="1" /> |
|
<edge from-layer="491" from-port="2" to-layer="493" to-port="0" /> |
|
<edge from-layer="492" from-port="0" to-layer="493" to-port="1" /> |
|
<edge from-layer="493" from-port="2" to-layer="495" to-port="0" /> |
|
<edge from-layer="494" from-port="0" to-layer="495" to-port="1" /> |
|
<edge from-layer="495" from-port="2" to-layer="496" to-port="0" /> |
|
<edge from-layer="496" from-port="1" to-layer="497" to-port="1" /> |
|
<edge from-layer="497" from-port="2" to-layer="499" to-port="0" /> |
|
<edge from-layer="498" from-port="0" to-layer="499" to-port="1" /> |
|
<edge from-layer="499" from-port="2" to-layer="500" to-port="1" /> |
|
<edge from-layer="500" from-port="2" to-layer="502" to-port="0" /> |
|
<edge from-layer="501" from-port="0" to-layer="502" to-port="1" /> |
|
<edge from-layer="502" from-port="2" to-layer="504" to-port="0" /> |
|
<edge from-layer="503" from-port="0" to-layer="504" to-port="1" /> |
|
<edge from-layer="504" from-port="2" to-layer="506" to-port="0" /> |
|
<edge from-layer="505" from-port="0" to-layer="506" to-port="1" /> |
|
<edge from-layer="506" from-port="2" to-layer="507" to-port="0" /> |
|
<edge from-layer="507" from-port="2" to-layer="508" to-port="0" /> |
|
</edges> |
|
<rt_info> |
|
<Runtime_version value="2025.2.0-19120-87425bc78ca-releases/2025/2" /> |
|
<conversion_parameters> |
|
<framework value="pytorch" /> |
|
<is_python_object value="True" /> |
|
</conversion_parameters> |
|
<nncf> |
|
<friendly_names_were_updated value="True" /> |
|
<weight_compression> |
|
<advanced_parameters value="{'statistics_path': None, 'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}, 'lora_adapter_rank': 256}" /> |
|
<all_layers value="False" /> |
|
<awq value="False" /> |
|
<backup_mode value="int8_asym" /> |
|
<compression_format value="dequantize" /> |
|
<gptq value="False" /> |
|
<group_size value="128" /> |
|
<ignored_scope value="[]" /> |
|
<lora_correction value="False" /> |
|
<mode value="int4_asym" /> |
|
<ratio value="1.0" /> |
|
<scale_estimation value="False" /> |
|
<sensitivity_metric value="weight_quantization_error" /> |
|
</weight_compression> |
|
</nncf> |
|
<optimum> |
|
<nncf_version value="2.16.0" /> |
|
<optimum_intel_version value="1.24.0.dev0+08e3008" /> |
|
<optimum_version value="1.25.3" /> |
|
<pytorch_version value="2.7.0+cpu" /> |
|
<transformers_version value="4.51.3" /> |
|
</optimum> |
|
<runtime_options> |
|
<ACTIVATIONS_SCALE_FACTOR value="8.0" /> |
|
</runtime_options> |
|
</rt_info> |
|
</net> |
|
|