<?xml version="1.0"?>
<net name="Model0" version="11">
<layers>
<layer id="2" name="input_ids" type="Parameter" version="opset1">
<data shape="?,?" element_type="i64" />
<output>
<port id="0" precision="I64" names="input_ids">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="1" name="attention_mask" type="Parameter" version="opset1">
<data shape="?,?" element_type="i64" />
<output>
<port id="0" precision="I64" names="attention_mask">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="0" name="token_type_ids" type="Parameter" version="opset1">
<data shape="?,?" element_type="i64" />
<output>
<port id="0" precision="I64" names="token_type_ids">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="3" name="Constant_74601" type="Const" version="opset1">
<data element_type="i8" shape="30522, 128" offset="0" size="3906816" />
<output>
<port id="0" precision="I8">
<dim>30522</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="4" name="Convert_74602" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>30522</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>30522</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="5" name="Constant_74603" type="Const" version="opset1">
<data element_type="f32" shape="30522, 1" offset="3906816" size="122088" />
<output>
<port id="0" precision="FP32">
<dim>30522</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="6" name="__module.embeddings.word_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>30522</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP32">
<dim>30522</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>30522</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="7" name="__module.embeddings.word_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="8" name="__module.embeddings.word_embeddings/aten::embedding/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="4028904" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="9" name="__module.embeddings.word_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>30522</dim>
<dim>128</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="79,inputs_embeds">
<dim>-1</dim>
<dim>-1</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="10" name="Constant_74605" type="Const" version="opset1">
<data element_type="i8" shape="2, 128" offset="4028908" size="256" />
<output>
<port id="0" precision="I8">
<dim>2</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="11" name="Convert_74606" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>2</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>2</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="12" name="Constant_74607" type="Const" version="opset1">
<data element_type="f32" shape="2, 1" offset="4029164" size="8" />
<output>
<port id="0" precision="FP32">
<dim>2</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="13" name="__module.embeddings.token_type_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>2</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP32">
<dim>2</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>2</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="14" name="__module.embeddings.token_type_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="15" name="__module.embeddings.token_type_embeddings/aten::embedding/Constant" type="Const" version="opset1">
<data element_type="i32" shape="" offset="4028904" size="4" />
<output>
<port id="0" precision="I32" />
</output>
</layer>
<layer id="16" name="__module.embeddings.token_type_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="FP32">
<dim>2</dim>
<dim>128</dim>
</port>
<port id="1" precision="I32">
<dim>-1</dim>
<dim>-1</dim>
</port>
<port id="2" precision="I32" />
</input>
<output>
<port id="3" precision="FP32" names="81,token_type_embeddings.1">
<dim>-1</dim>
<dim>-1</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="17" name="__module.embeddings/aten::add/Add" type="Add" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP32">
<dim>-1</dim>
<dim>-1</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="2" precision="FP32" names="82_1">
<dim>-1</dim>
<dim>-1</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="18" name="Constant_74609" type="Const" version="opset1">
<data element_type="i8" shape="512, 128" offset="4029172" size="65536" />
<output>
<port id="0" precision="I8">
<dim>512</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="19" name="Convert_74610" type="Convert" version="opset1">
<data destination_type="f32" />
<input>
<port id="0" precision="I8">
<dim>512</dim>
<dim>128</dim>
</port>
</input>
<output>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="20" name="Constant_74611" type="Const" version="opset1">
<data element_type="f32" shape="512, 1" offset="4094708" size="2048" />
<output>
<port id="0" precision="FP32">
<dim>512</dim>
<dim>1</dim>
</port>
</output>
</layer>
<layer id="21" name="__module.embeddings.position_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
<data auto_broadcast="numpy" />
<input>
<port id="0" precision="FP32">
<dim>512</dim>
<dim>128</dim>
</port>
<port id="1" precision="FP32">
<dim>512</dim>
<dim>1</dim>
</port>
</input>
<output>
<port id="2" precision="FP32">
<dim>512</dim>
<dim>128</dim>
</port>
</output>
</layer>
<layer id="22" name="__module.embeddings/aten::slice/Slice" type="Const" version="opset1">
<data element_type="i64" shape="1, 512" offset="4096756" size="4096" />
<output>
<port id="0" precision="I64" names="76">
<dim>1</dim>
<dim>512</dim>
</port>
</output>
</layer>
<layer id="23" name="__module.embeddings/aten::slice/Reshape" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="4100852" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="24" name="ShapeOf_4186" type="ShapeOf" version="opset3">
<data output_type="i64" />
<input>
<port id="0" precision="I64">
<dim>-1</dim>
<dim>-1</dim>
</port>
</input>
<output>
<port id="1" precision="I64">
<dim>2</dim>
</port>
</output>
</layer>
<layer id="25" name="Constant_4304" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="4100860" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="26" name="Constant_4188" type="Const" version="opset1">
<data element_type="i64" shape="" offset="4100852" size="8" />
<output>
<port id="0" precision="I64" />
</output>
</layer>
<layer id="27" name="Gather_4189" type="Gather" version="opset8">
<data batch_dims="0" />
<input>
<port id="0" precision="I64">
<dim>2</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64" />
</input>
<output>
<port id="3" precision="I64" names="10,17,19,72,74,75,8">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="28" name="__module.embeddings/aten::slice/Reshape_2" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="4100860" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="29" name="__module.embeddings/aten::slice/Reshape_3" type="Const" version="opset1">
<data element_type="i64" shape="1" offset="4100860" size="8" />
<output>
<port id="0" precision="I64">
<dim>1</dim>
</port>
</output>
</layer>
<layer id="30" name="__module.embeddings/aten::slice/Slice_1" type="Slice" version="opset8">
<input>
<port id="0" precision="I64">
<dim>1</dim>
<dim>512</dim>
</port>
<port id="1" precision="I64">
<dim>1</dim>
</port>
<port id="2" precision="I64">
<dim>1</dim>
</port>
<port id="3" precision="I64">
<dim>1</dim>
</port>
<port id="4" precision="I64">
<dim>1</dim>
</port>
</input>
<output>
<port id="5" precision="I64" names="77">
<dim>1</dim>
<dim>-1</dim>
</port>
</output>
</layer>
<layer id="31" name="__module.embeddings.position_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
<data destination_type="i32" />
<input>
<port id="0" precision="I64">
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="32" name="__module.embeddings.position_embeddings/aten::embedding/Constant" type="Const" version="opset1">
|
|
<data element_type="i32" shape="" offset="4028904" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="33" name="__module.embeddings.position_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="2" precision="I32" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="FP32" names="84,position_embeddings.1">
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="34" name="__module.embeddings/aten::add_/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="82,embeddings.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="35" name="__module.embeddings.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="4100868" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="36" name="__module.embeddings.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="37" name="Constant_4129" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4100872" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="38" name="__module.embeddings.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="39" name="Constant_4130" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4101384" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="40" name="__module.embeddings.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="89,input.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="41" name="__module.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4101896" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="42" name="__module.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="43" name="__module.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4102408" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="44" name="__module.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4102412" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="45" name="__module.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4102408" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="46" name="__module.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4102412" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="47" name="__module.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="48" name="Constant_74613" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4102416" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="49" name="Convert_74614" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="50" name="Constant_74615" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4118800" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="51" name="__module.encoder.layer.0.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="52" name="__module.encoder.layer.0.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="53" name="Constant_4131" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4119312" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="54" name="__module.encoder.layer.0.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="120,x.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="55" name="__module.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4119824" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="56" name="__module.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4119828" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="57" name="__module.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4119824" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="58" name="__module.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4119828" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="59" name="__module.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="60" name="__module.encoder.layer.0.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119832" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="61" name="__module.encoder.layer.0.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="124,x.3">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="62" name="Constant_238" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119864" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="125">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="63" name="__module.encoder.layer.0.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="126">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="64" name="Constant_74617" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4119896" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="65" name="Convert_74618" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="66" name="Constant_74619" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4136280" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="67" name="__module.encoder.layer.0.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="68" name="__module.encoder.layer.0.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="69" name="Constant_4132" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4136792" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="70" name="__module.encoder.layer.0.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="129,x.5">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="71" name="__module.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4137304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="72" name="__module.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4137308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="73" name="__module.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4137304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="74" name="__module.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4137308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="75" name="__module.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="76" name="__module.encoder.layer.0.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119832" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="77" name="__module.encoder.layer.0.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="133,x.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="78" name="Constant_263" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119864" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="134">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="79" name="__module.encoder.layer.0.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="135">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="80" name="Constant_74621" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4137312" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="81" name="Convert_74622" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="82" name="Constant_74623" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4153696" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="83" name="__module.encoder.layer.0.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="84" name="__module.encoder.layer.0.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="85" name="Constant_4133" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4154208" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="86" name="__module.encoder.layer.0.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="138,x.9">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="87" name="__module.encoder.layer.0.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119832" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="88" name="__module.encoder.layer.0.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="142,x.11">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="89" name="Constant_288" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119864" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="143">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="90" name="__module.encoder.layer.0.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="144">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="91" name="Constant_4135" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1, 1" offset="4154720" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="92" name="25" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="4100860" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" names="25" />
|
|
</output>
|
|
</layer>
|
|
<layer id="93" name="aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1">
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="26">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="94" name="27" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="4154724" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" names="27" />
|
|
</output>
|
|
</layer>
|
|
<layer id="95" name="aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1">
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="28,33">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="96" name="Constant_4307" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="4100852" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="97" name="Constant_4196" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="4100852" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" />
|
|
</output>
|
|
</layer>
|
|
<layer id="98" name="Gather_4197" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="2" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="I64" names="13,15">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="99" name="Constant_3763" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="4100860" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="100" name="Constant_4309" type="Const" version="opset1">
|
|
<data element_type="i64" shape="2" offset="4154732" size="16" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="101" name="Constant_4310" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="4100852" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" />
|
|
</output>
|
|
</layer>
|
|
<layer id="102" name="Gather_4311" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
<port id="2" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="103" name="prim::ListConstruct/Concat" type="Concat" version="opset1">
|
|
<data axis="0" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="2" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="I64" names="35">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="104" name="aten::expand/Broadcast" type="Broadcast" version="opset3">
|
|
<data mode="bidirectional" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="37">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="105" name="aten::to/Convert" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="42">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="106" name="Constant_4134" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1, 1" offset="4154720" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="107" name="aten::rsub/Multiply" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="108" name="aten::rsub/Subtract" type="Subtract" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="45,inverted_mask">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="109" name="aten::to/Convert_1" type="Convert" version="opset1">
|
|
<data destination_type="boolean" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="BOOL" names="50">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="110" name="aten::masked_fill/ConvertLike" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4154748" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="111" name="aten::masked_fill/Select" type="Select" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="BOOL">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="FP32" names="52">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="112" name="__module.encoder.layer.0.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="145,attn_output.1">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="113" name="__module.encoder.layer.0.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="4154752" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="114" name="__module.encoder.layer.0.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="146,attn_output.3">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="115" name="Constant_4205" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="4154768" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="116" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="148">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="117" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4154792" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="118" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="119" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4155304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="120" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4155308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="121" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4155304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="122" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4155308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="123" name="__module.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="124" name="Constant_74625" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4155312" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="125" name="Convert_74626" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="126" name="Constant_74627" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4171696" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="127" name="__module.encoder.layer.0.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="128" name="__module.encoder.layer.0.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="129" name="Constant_4136" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4172208" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="130" name="__module.encoder.layer.0.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="154,input.3">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="131" name="__module.encoder.layer.0.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="156">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="132" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="4100868" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="133" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="134" name="Constant_4137" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4172720" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="135" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="136" name="Constant_4138" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4173232" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="137" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="160,input_tensor.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="138" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4173744" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="139" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="140" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4174256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="141" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4174260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="142" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4174256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="143" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4174260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="144" name="__module.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="145" name="Constant_74629" type="Const" version="opset1">
|
|
<data element_type="i8" shape="512, 128" offset="4174264" size="65536" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="146" name="Convert_74630" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="147" name="Constant_74631" type="Const" version="opset1">
|
|
<data element_type="f32" shape="512, 1" offset="4239800" size="2048" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="148" name="__module.encoder.layer.0.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="149" name="__module.encoder.layer.0.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="150" name="Constant_4139" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 512" offset="4241848" size="2048" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="151" name="__module.encoder.layer.0.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="165">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="152" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="166">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="153" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 512" offset="4243896" size="2048" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="154" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="155" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4245944" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="156" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4245948" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="157" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4245944" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="158" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4245948" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="159" name="__module.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="160" name="Constant_74633" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 512" offset="4245952" size="65536" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="161" name="Convert_74634" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="162" name="Constant_74635" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4311488" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="163" name="__module.encoder.layer.0.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="164" name="__module.encoder.layer.0.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="165" name="Constant_4140" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4312000" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="166" name="__module.encoder.layer.0.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="172,input.5">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="167" name="__module.encoder.layer.0.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="174">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="168" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="4100868" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="169" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="170" name="Constant_4141" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4312512" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="171" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="172" name="Constant_4142" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4313024" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="173" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="178,hidden_states.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="174" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4313536" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="175" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="176" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4314048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="177" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4314052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="178" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4314048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="179" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4314052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="180" name="__module.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="181" name="Constant_74637" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4314056" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="182" name="Convert_74638" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="183" name="Constant_74639" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4330440" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="184" name="__module.encoder.layer.1.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="185" name="__module.encoder.layer.1.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="186" name="Constant_4143" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4330952" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="187" name="__module.encoder.layer.1.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="191,x.13">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="188" name="__module.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4331464" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="189" name="__module.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4331468" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="190" name="__module.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4331464" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="191" name="__module.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4331468" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="192" name="__module.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="193" name="__module.encoder.layer.1.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119832" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="194" name="__module.encoder.layer.1.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="195,x.15">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="195" name="Constant_470" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119864" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="196">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="196" name="__module.encoder.layer.1.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="197">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="197" name="Constant_74641" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4331472" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="198" name="Convert_74642" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="199" name="Constant_74643" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4347856" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="200" name="__module.encoder.layer.1.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="201" name="__module.encoder.layer.1.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="202" name="Constant_4144" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4348368" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="203" name="__module.encoder.layer.1.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="200,x.17">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="204" name="__module.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4348880" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="205" name="__module.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4348884" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="206" name="__module.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4348880" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="207" name="__module.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4348884" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="208" name="__module.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="209" name="__module.encoder.layer.1.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119832" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="210" name="__module.encoder.layer.1.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="204,x.19">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="211" name="Constant_493" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119864" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="205">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="212" name="__module.encoder.layer.1.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="206">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="213" name="Constant_74645" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4348888" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="214" name="Convert_74646" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="215" name="Constant_74647" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4365272" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="216" name="__module.encoder.layer.1.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="217" name="__module.encoder.layer.1.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="218" name="Constant_4145" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4365784" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="219" name="__module.encoder.layer.1.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="209,x.21">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="220" name="__module.encoder.layer.1.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119832" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="221" name="__module.encoder.layer.1.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="213,x">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="222" name="Constant_516" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="4119864" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="214">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="223" name="__module.encoder.layer.1.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="215">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="224" name="__module.encoder.layer.1.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="216,attn_output.5">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="225" name="__module.encoder.layer.1.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="4154752" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="226" name="__module.encoder.layer.1.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="217,attn_output">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="227" name="Constant_4206" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="4154768" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="228" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>2</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="219">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="229" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4366296" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="230" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="231" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4366808" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="232" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4366812" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="233" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4366808" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="234" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4366812" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="235" name="__module.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="236" name="Constant_74649" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 128" offset="4366816" size="16384" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="237" name="Convert_74650" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="238" name="Constant_74651" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4383200" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="239" name="__module.encoder.layer.1.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="240" name="__module.encoder.layer.1.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="241" name="Constant_4146" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4383712" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="242" name="__module.encoder.layer.1.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="225,input.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="243" name="__module.encoder.layer.1.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="227">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="244" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="4100868" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="245" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="246" name="Constant_4147" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4384224" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="247" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="248" name="Constant_4148" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4384736" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="249" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="231,input_tensor">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="250" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4385248" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="251" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="252" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4385760" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="253" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4385764" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="254" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4385760" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="255" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4385764" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="256" name="__module.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="257" name="Constant_74653" type="Const" version="opset1">
|
|
<data element_type="i8" shape="512, 128" offset="4385768" size="65536" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="258" name="Convert_74654" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="259" name="Constant_74655" type="Const" version="opset1">
|
|
<data element_type="f32" shape="512, 1" offset="4451304" size="2048" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="260" name="__module.encoder.layer.1.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="261" name="__module.encoder.layer.1.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>512</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="262" name="Constant_4149" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 512" offset="4453352" size="2048" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="263" name="__module.encoder.layer.1.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="236">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="264" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="237">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="265" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 512" offset="4455400" size="2048" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="266" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="267" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4457448" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="268" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4457452" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="269" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4457448" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="270" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="4457452" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="271" name="__module.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="272" name="Constant_74657" type="Const" version="opset1">
|
|
<data element_type="i8" shape="128, 512" offset="4457456" size="65536" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="273" name="Convert_74658" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="274" name="Constant_74659" type="Const" version="opset1">
|
|
<data element_type="f32" shape="128, 1" offset="4522992" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="275" name="__module.encoder.layer.1.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="276" name="__module.encoder.layer.1.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>128</dim>
|
|
<dim>512</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="277" name="Constant_4150" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4523504" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="278" name="__module.encoder.layer.1.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="243,input">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="279" name="__module.encoder.layer.1.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="245">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="280" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="4100868" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="281" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.999999960041972e-13" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="282" name="Constant_4151" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4524016" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="283" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="284" name="Constant_4152" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 128" offset="4524528" size="512" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="285" name="__module.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="last_hidden_state">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="286" name="Result_1358" type="Result" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>128</dim>
|
|
</port>
|
|
</input>
|
|
</layer>
|
|
</layers>
|
|
<edges>
<edge from-layer="0" from-port="0" to-layer="14" to-port="0" />
<edge from-layer="1" from-port="0" to-layer="93" to-port="0" />
<edge from-layer="2" from-port="0" to-layer="7" to-port="0" />
<edge from-layer="2" from-port="0" to-layer="24" to-port="0" />
<edge from-layer="3" from-port="0" to-layer="4" to-port="0" />
<edge from-layer="4" from-port="1" to-layer="6" to-port="0" />
<edge from-layer="5" from-port="0" to-layer="6" to-port="1" />
<edge from-layer="6" from-port="2" to-layer="9" to-port="0" />
<edge from-layer="7" from-port="1" to-layer="9" to-port="1" />
<edge from-layer="8" from-port="0" to-layer="9" to-port="2" />
<edge from-layer="9" from-port="3" to-layer="17" to-port="0" />
<edge from-layer="10" from-port="0" to-layer="11" to-port="0" />
<edge from-layer="11" from-port="1" to-layer="13" to-port="0" />
<edge from-layer="12" from-port="0" to-layer="13" to-port="1" />
<edge from-layer="13" from-port="2" to-layer="16" to-port="0" />
<edge from-layer="14" from-port="1" to-layer="16" to-port="1" />
<edge from-layer="15" from-port="0" to-layer="16" to-port="2" />
<edge from-layer="16" from-port="3" to-layer="17" to-port="1" />
<edge from-layer="17" from-port="2" to-layer="34" to-port="0" />
<edge from-layer="18" from-port="0" to-layer="19" to-port="0" />
<edge from-layer="19" from-port="1" to-layer="21" to-port="0" />
<edge from-layer="20" from-port="0" to-layer="21" to-port="1" />
<edge from-layer="21" from-port="2" to-layer="33" to-port="0" />
<edge from-layer="22" from-port="0" to-layer="30" to-port="0" />
<edge from-layer="23" from-port="0" to-layer="30" to-port="1" />
<edge from-layer="24" from-port="1" to-layer="102" to-port="0" />
<edge from-layer="24" from-port="1" to-layer="27" to-port="0" />
<edge from-layer="24" from-port="1" to-layer="98" to-port="0" />
<edge from-layer="25" from-port="0" to-layer="27" to-port="1" />
<edge from-layer="26" from-port="0" to-layer="27" to-port="2" />
<edge from-layer="27" from-port="3" to-layer="30" to-port="2" />
<edge from-layer="28" from-port="0" to-layer="30" to-port="3" />
<edge from-layer="29" from-port="0" to-layer="30" to-port="4" />
<edge from-layer="30" from-port="5" to-layer="31" to-port="0" />
<edge from-layer="31" from-port="1" to-layer="33" to-port="1" />
<edge from-layer="32" from-port="0" to-layer="33" to-port="2" />
<edge from-layer="33" from-port="3" to-layer="34" to-port="1" />
<edge from-layer="34" from-port="2" to-layer="36" to-port="0" />
<edge from-layer="35" from-port="0" to-layer="36" to-port="1" />
<edge from-layer="36" from-port="2" to-layer="38" to-port="0" />
<edge from-layer="37" from-port="0" to-layer="38" to-port="1" />
<edge from-layer="38" from-port="2" to-layer="40" to-port="0" />
<edge from-layer="39" from-port="0" to-layer="40" to-port="1" />
<edge from-layer="40" from-port="2" to-layer="131" to-port="1" />
<edge from-layer="40" from-port="2" to-layer="42" to-port="0" />
<edge from-layer="41" from-port="0" to-layer="42" to-port="1" />
<edge from-layer="42" from-port="2" to-layer="47" to-port="0" />
<edge from-layer="43" from-port="0" to-layer="47" to-port="1" />
<edge from-layer="44" from-port="0" to-layer="47" to-port="2" />
<edge from-layer="45" from-port="0" to-layer="47" to-port="3" />
<edge from-layer="46" from-port="0" to-layer="47" to-port="4" />
<edge from-layer="47" from-port="5" to-layer="52" to-port="0" />
<edge from-layer="47" from-port="5" to-layer="68" to-port="0" />
<edge from-layer="47" from-port="5" to-layer="84" to-port="0" />
<edge from-layer="48" from-port="0" to-layer="49" to-port="0" />
<edge from-layer="49" from-port="1" to-layer="51" to-port="0" />
<edge from-layer="50" from-port="0" to-layer="51" to-port="1" />
<edge from-layer="51" from-port="2" to-layer="52" to-port="1" />
<edge from-layer="52" from-port="2" to-layer="54" to-port="0" />
<edge from-layer="53" from-port="0" to-layer="54" to-port="1" />
<edge from-layer="54" from-port="2" to-layer="59" to-port="0" />
<edge from-layer="55" from-port="0" to-layer="59" to-port="1" />
<edge from-layer="56" from-port="0" to-layer="59" to-port="2" />
<edge from-layer="57" from-port="0" to-layer="59" to-port="3" />
<edge from-layer="58" from-port="0" to-layer="59" to-port="4" />
<edge from-layer="59" from-port="5" to-layer="61" to-port="0" />
<edge from-layer="60" from-port="0" to-layer="61" to-port="1" />
<edge from-layer="61" from-port="2" to-layer="63" to-port="0" />
<edge from-layer="62" from-port="0" to-layer="63" to-port="1" />
<edge from-layer="63" from-port="2" to-layer="112" to-port="0" />
<edge from-layer="64" from-port="0" to-layer="65" to-port="0" />
<edge from-layer="65" from-port="1" to-layer="67" to-port="0" />
<edge from-layer="66" from-port="0" to-layer="67" to-port="1" />
<edge from-layer="67" from-port="2" to-layer="68" to-port="1" />
<edge from-layer="68" from-port="2" to-layer="70" to-port="0" />
<edge from-layer="69" from-port="0" to-layer="70" to-port="1" />
<edge from-layer="70" from-port="2" to-layer="75" to-port="0" />
<edge from-layer="71" from-port="0" to-layer="75" to-port="1" />
<edge from-layer="72" from-port="0" to-layer="75" to-port="2" />
<edge from-layer="73" from-port="0" to-layer="75" to-port="3" />
<edge from-layer="74" from-port="0" to-layer="75" to-port="4" />
<edge from-layer="75" from-port="5" to-layer="77" to-port="0" />
<edge from-layer="76" from-port="0" to-layer="77" to-port="1" />
<edge from-layer="77" from-port="2" to-layer="79" to-port="0" />
<edge from-layer="78" from-port="0" to-layer="79" to-port="1" />
<edge from-layer="79" from-port="2" to-layer="112" to-port="1" />
<edge from-layer="80" from-port="0" to-layer="81" to-port="0" />
<edge from-layer="81" from-port="1" to-layer="83" to-port="0" />
<edge from-layer="82" from-port="0" to-layer="83" to-port="1" />
<edge from-layer="83" from-port="2" to-layer="84" to-port="1" />
<edge from-layer="84" from-port="2" to-layer="86" to-port="0" />
<edge from-layer="85" from-port="0" to-layer="86" to-port="1" />
<edge from-layer="86" from-port="2" to-layer="88" to-port="0" />
<edge from-layer="87" from-port="0" to-layer="88" to-port="1" />
<edge from-layer="88" from-port="2" to-layer="90" to-port="0" />
<edge from-layer="89" from-port="0" to-layer="90" to-port="1" />
<edge from-layer="90" from-port="2" to-layer="112" to-port="2" />
<edge from-layer="91" from-port="0" to-layer="108" to-port="0" />
<edge from-layer="92" from-port="0" to-layer="93" to-port="1" />
<edge from-layer="93" from-port="2" to-layer="95" to-port="0" />
<edge from-layer="94" from-port="0" to-layer="95" to-port="1" />
<edge from-layer="95" from-port="2" to-layer="104" to-port="0" />
<edge from-layer="96" from-port="0" to-layer="98" to-port="1" />
<edge from-layer="97" from-port="0" to-layer="98" to-port="2" />
<edge from-layer="98" from-port="3" to-layer="103" to-port="0" />
<edge from-layer="99" from-port="0" to-layer="103" to-port="1" />
<edge from-layer="100" from-port="0" to-layer="102" to-port="1" />
<edge from-layer="101" from-port="0" to-layer="102" to-port="2" />
<edge from-layer="102" from-port="3" to-layer="103" to-port="2" />
<edge from-layer="103" from-port="3" to-layer="104" to-port="1" />
<edge from-layer="104" from-port="2" to-layer="105" to-port="0" />
<edge from-layer="105" from-port="1" to-layer="107" to-port="0" />
<edge from-layer="106" from-port="0" to-layer="107" to-port="1" />
<edge from-layer="107" from-port="2" to-layer="108" to-port="1" />
<edge from-layer="108" from-port="2" to-layer="109" to-port="0" />
<edge from-layer="108" from-port="2" to-layer="111" to-port="2" />
<edge from-layer="109" from-port="1" to-layer="111" to-port="0" />
<edge from-layer="110" from-port="0" to-layer="111" to-port="1" />
<edge from-layer="111" from-port="3" to-layer="112" to-port="3" />
<edge from-layer="111" from-port="3" to-layer="224" to-port="3" />
<edge from-layer="112" from-port="4" to-layer="114" to-port="0" />
<edge from-layer="113" from-port="0" to-layer="114" to-port="1" />
<edge from-layer="114" from-port="2" to-layer="116" to-port="0" />
<edge from-layer="115" from-port="0" to-layer="116" to-port="1" />
<edge from-layer="116" from-port="2" to-layer="118" to-port="0" />
<edge from-layer="117" from-port="0" to-layer="118" to-port="1" />
<edge from-layer="118" from-port="2" to-layer="123" to-port="0" />
<edge from-layer="119" from-port="0" to-layer="123" to-port="1" />
<edge from-layer="120" from-port="0" to-layer="123" to-port="2" />
<edge from-layer="121" from-port="0" to-layer="123" to-port="3" />
<edge from-layer="122" from-port="0" to-layer="123" to-port="4" />
<edge from-layer="123" from-port="5" to-layer="128" to-port="0" />
<edge from-layer="124" from-port="0" to-layer="125" to-port="0" />
<edge from-layer="125" from-port="1" to-layer="127" to-port="0" />
<edge from-layer="126" from-port="0" to-layer="127" to-port="1" />
<edge from-layer="127" from-port="2" to-layer="128" to-port="1" />
<edge from-layer="128" from-port="2" to-layer="130" to-port="0" />
<edge from-layer="129" from-port="0" to-layer="130" to-port="1" />
<edge from-layer="130" from-port="2" to-layer="131" to-port="0" />
<edge from-layer="131" from-port="2" to-layer="133" to-port="0" />
<edge from-layer="132" from-port="0" to-layer="133" to-port="1" />
<edge from-layer="133" from-port="2" to-layer="135" to-port="0" />
<edge from-layer="134" from-port="0" to-layer="135" to-port="1" />
<edge from-layer="135" from-port="2" to-layer="137" to-port="0" />
<edge from-layer="136" from-port="0" to-layer="137" to-port="1" />
<edge from-layer="137" from-port="2" to-layer="167" to-port="1" />
<edge from-layer="137" from-port="2" to-layer="139" to-port="0" />
<edge from-layer="138" from-port="0" to-layer="139" to-port="1" />
<edge from-layer="139" from-port="2" to-layer="144" to-port="0" />
<edge from-layer="140" from-port="0" to-layer="144" to-port="1" />
<edge from-layer="141" from-port="0" to-layer="144" to-port="2" />
<edge from-layer="142" from-port="0" to-layer="144" to-port="3" />
<edge from-layer="143" from-port="0" to-layer="144" to-port="4" />
<edge from-layer="144" from-port="5" to-layer="149" to-port="0" />
<edge from-layer="145" from-port="0" to-layer="146" to-port="0" />
<edge from-layer="146" from-port="1" to-layer="148" to-port="0" />
<edge from-layer="147" from-port="0" to-layer="148" to-port="1" />
<edge from-layer="148" from-port="2" to-layer="149" to-port="1" />
<edge from-layer="149" from-port="2" to-layer="151" to-port="0" />
<edge from-layer="150" from-port="0" to-layer="151" to-port="1" />
<edge from-layer="151" from-port="2" to-layer="152" to-port="0" />
<edge from-layer="152" from-port="1" to-layer="154" to-port="0" />
<edge from-layer="153" from-port="0" to-layer="154" to-port="1" />
<edge from-layer="154" from-port="2" to-layer="159" to-port="0" />
<edge from-layer="155" from-port="0" to-layer="159" to-port="1" />
<edge from-layer="156" from-port="0" to-layer="159" to-port="2" />
<edge from-layer="157" from-port="0" to-layer="159" to-port="3" />
<edge from-layer="158" from-port="0" to-layer="159" to-port="4" />
<edge from-layer="159" from-port="5" to-layer="164" to-port="0" />
<edge from-layer="160" from-port="0" to-layer="161" to-port="0" />
<edge from-layer="161" from-port="1" to-layer="163" to-port="0" />
<edge from-layer="162" from-port="0" to-layer="163" to-port="1" />
<edge from-layer="163" from-port="2" to-layer="164" to-port="1" />
<edge from-layer="164" from-port="2" to-layer="166" to-port="0" />
<edge from-layer="165" from-port="0" to-layer="166" to-port="1" />
<edge from-layer="166" from-port="2" to-layer="167" to-port="0" />
<edge from-layer="167" from-port="2" to-layer="169" to-port="0" />
<edge from-layer="168" from-port="0" to-layer="169" to-port="1" />
<edge from-layer="169" from-port="2" to-layer="171" to-port="0" />
<edge from-layer="170" from-port="0" to-layer="171" to-port="1" />
<edge from-layer="171" from-port="2" to-layer="173" to-port="0" />
<edge from-layer="172" from-port="0" to-layer="173" to-port="1" />
<edge from-layer="173" from-port="2" to-layer="175" to-port="0" />
<edge from-layer="173" from-port="2" to-layer="243" to-port="1" />
<edge from-layer="174" from-port="0" to-layer="175" to-port="1" />
<edge from-layer="175" from-port="2" to-layer="180" to-port="0" />
<edge from-layer="176" from-port="0" to-layer="180" to-port="1" />
<edge from-layer="177" from-port="0" to-layer="180" to-port="2" />
<edge from-layer="178" from-port="0" to-layer="180" to-port="3" />
<edge from-layer="179" from-port="0" to-layer="180" to-port="4" />
<edge from-layer="180" from-port="5" to-layer="185" to-port="0" />
<edge from-layer="180" from-port="5" to-layer="201" to-port="0" />
<edge from-layer="180" from-port="5" to-layer="217" to-port="0" />
<edge from-layer="181" from-port="0" to-layer="182" to-port="0" />
<edge from-layer="182" from-port="1" to-layer="184" to-port="0" />
<edge from-layer="183" from-port="0" to-layer="184" to-port="1" />
<edge from-layer="184" from-port="2" to-layer="185" to-port="1" />
<edge from-layer="185" from-port="2" to-layer="187" to-port="0" />
<edge from-layer="186" from-port="0" to-layer="187" to-port="1" />
<edge from-layer="187" from-port="2" to-layer="192" to-port="0" />
<edge from-layer="188" from-port="0" to-layer="192" to-port="1" />
<edge from-layer="189" from-port="0" to-layer="192" to-port="2" />
<edge from-layer="190" from-port="0" to-layer="192" to-port="3" />
<edge from-layer="191" from-port="0" to-layer="192" to-port="4" />
<edge from-layer="192" from-port="5" to-layer="194" to-port="0" />
<edge from-layer="193" from-port="0" to-layer="194" to-port="1" />
<edge from-layer="194" from-port="2" to-layer="196" to-port="0" />
<edge from-layer="195" from-port="0" to-layer="196" to-port="1" />
<edge from-layer="196" from-port="2" to-layer="224" to-port="0" />
<edge from-layer="197" from-port="0" to-layer="198" to-port="0" />
<edge from-layer="198" from-port="1" to-layer="200" to-port="0" />
<edge from-layer="199" from-port="0" to-layer="200" to-port="1" />
<edge from-layer="200" from-port="2" to-layer="201" to-port="1" />
<edge from-layer="201" from-port="2" to-layer="203" to-port="0" />
<edge from-layer="202" from-port="0" to-layer="203" to-port="1" />
<edge from-layer="203" from-port="2" to-layer="208" to-port="0" />
<edge from-layer="204" from-port="0" to-layer="208" to-port="1" />
<edge from-layer="205" from-port="0" to-layer="208" to-port="2" />
<edge from-layer="206" from-port="0" to-layer="208" to-port="3" />
<edge from-layer="207" from-port="0" to-layer="208" to-port="4" />
<edge from-layer="208" from-port="5" to-layer="210" to-port="0" />
<edge from-layer="209" from-port="0" to-layer="210" to-port="1" />
<edge from-layer="210" from-port="2" to-layer="212" to-port="0" />
<edge from-layer="211" from-port="0" to-layer="212" to-port="1" />
<edge from-layer="212" from-port="2" to-layer="224" to-port="1" />
<edge from-layer="213" from-port="0" to-layer="214" to-port="0" />
<edge from-layer="214" from-port="1" to-layer="216" to-port="0" />
<edge from-layer="215" from-port="0" to-layer="216" to-port="1" />
<edge from-layer="216" from-port="2" to-layer="217" to-port="1" />
<edge from-layer="217" from-port="2" to-layer="219" to-port="0" />
<edge from-layer="218" from-port="0" to-layer="219" to-port="1" />
<edge from-layer="219" from-port="2" to-layer="221" to-port="0" />
<edge from-layer="220" from-port="0" to-layer="221" to-port="1" />
<edge from-layer="221" from-port="2" to-layer="223" to-port="0" />
<edge from-layer="222" from-port="0" to-layer="223" to-port="1" />
<edge from-layer="223" from-port="2" to-layer="224" to-port="2" />
<edge from-layer="224" from-port="4" to-layer="226" to-port="0" />
<edge from-layer="225" from-port="0" to-layer="226" to-port="1" />
<edge from-layer="226" from-port="2" to-layer="228" to-port="0" />
<edge from-layer="227" from-port="0" to-layer="228" to-port="1" />
<edge from-layer="228" from-port="2" to-layer="230" to-port="0" />
<edge from-layer="229" from-port="0" to-layer="230" to-port="1" />
<edge from-layer="230" from-port="2" to-layer="235" to-port="0" />
<edge from-layer="231" from-port="0" to-layer="235" to-port="1" />
<edge from-layer="232" from-port="0" to-layer="235" to-port="2" />
<edge from-layer="233" from-port="0" to-layer="235" to-port="3" />
<edge from-layer="234" from-port="0" to-layer="235" to-port="4" />
<edge from-layer="235" from-port="5" to-layer="240" to-port="0" />
<edge from-layer="236" from-port="0" to-layer="237" to-port="0" />
<edge from-layer="237" from-port="1" to-layer="239" to-port="0" />
<edge from-layer="238" from-port="0" to-layer="239" to-port="1" />
<edge from-layer="239" from-port="2" to-layer="240" to-port="1" />
<edge from-layer="240" from-port="2" to-layer="242" to-port="0" />
<edge from-layer="241" from-port="0" to-layer="242" to-port="1" />
<edge from-layer="242" from-port="2" to-layer="243" to-port="0" />
<edge from-layer="243" from-port="2" to-layer="245" to-port="0" />
<edge from-layer="244" from-port="0" to-layer="245" to-port="1" />
<edge from-layer="245" from-port="2" to-layer="247" to-port="0" />
<edge from-layer="246" from-port="0" to-layer="247" to-port="1" />
<edge from-layer="247" from-port="2" to-layer="249" to-port="0" />
<edge from-layer="248" from-port="0" to-layer="249" to-port="1" />
<edge from-layer="249" from-port="2" to-layer="251" to-port="0" />
<edge from-layer="249" from-port="2" to-layer="279" to-port="1" />
<edge from-layer="250" from-port="0" to-layer="251" to-port="1" />
<edge from-layer="251" from-port="2" to-layer="256" to-port="0" />
<edge from-layer="252" from-port="0" to-layer="256" to-port="1" />
<edge from-layer="253" from-port="0" to-layer="256" to-port="2" />
<edge from-layer="254" from-port="0" to-layer="256" to-port="3" />
<edge from-layer="255" from-port="0" to-layer="256" to-port="4" />
<edge from-layer="256" from-port="5" to-layer="261" to-port="0" />
<edge from-layer="257" from-port="0" to-layer="258" to-port="0" />
<edge from-layer="258" from-port="1" to-layer="260" to-port="0" />
<edge from-layer="259" from-port="0" to-layer="260" to-port="1" />
<edge from-layer="260" from-port="2" to-layer="261" to-port="1" />
<edge from-layer="261" from-port="2" to-layer="263" to-port="0" />
<edge from-layer="262" from-port="0" to-layer="263" to-port="1" />
<edge from-layer="263" from-port="2" to-layer="264" to-port="0" />
<edge from-layer="264" from-port="1" to-layer="266" to-port="0" />
<edge from-layer="265" from-port="0" to-layer="266" to-port="1" />
<edge from-layer="266" from-port="2" to-layer="271" to-port="0" />
<edge from-layer="267" from-port="0" to-layer="271" to-port="1" />
<edge from-layer="268" from-port="0" to-layer="271" to-port="2" />
<edge from-layer="269" from-port="0" to-layer="271" to-port="3" />
<edge from-layer="270" from-port="0" to-layer="271" to-port="4" />
<edge from-layer="271" from-port="5" to-layer="276" to-port="0" />
<edge from-layer="272" from-port="0" to-layer="273" to-port="0" />
<edge from-layer="273" from-port="1" to-layer="275" to-port="0" />
<edge from-layer="274" from-port="0" to-layer="275" to-port="1" />
<edge from-layer="275" from-port="2" to-layer="276" to-port="1" />
<edge from-layer="276" from-port="2" to-layer="278" to-port="0" />
<edge from-layer="277" from-port="0" to-layer="278" to-port="1" />
<edge from-layer="278" from-port="2" to-layer="279" to-port="0" />
<edge from-layer="279" from-port="2" to-layer="281" to-port="0" />
<edge from-layer="280" from-port="0" to-layer="281" to-port="1" />
<edge from-layer="281" from-port="2" to-layer="283" to-port="0" />
<edge from-layer="282" from-port="0" to-layer="283" to-port="1" />
<edge from-layer="283" from-port="2" to-layer="285" to-port="0" />
<edge from-layer="284" from-port="0" to-layer="285" to-port="1" />
<edge from-layer="285" from-port="2" to-layer="286" to-port="0" />
</edges>
<rt_info>
<Runtime_version value="2024.4.1-16618-643f23d1318-releases/2024/4" />
<conversion_parameters>
<framework value="pytorch" />
<is_python_object value="True" />
</conversion_parameters>
<nncf>
<friendly_names_were_updated value="True" />
<quantization>
<advanced_parameters value="{'overflow_fix': 'disable', 'quantize_outputs': False, 'inplace_statistics': True, 'disable_channel_alignment': True, 'disable_bias_correction': False, 'batchwise_statistics': None, 'activations_quantization_params': None, 'weights_quantization_params': None, 'activations_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'weights_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'bias_correction_params': {'apply_for_all_nodes': False, 'threshold': None}, 'smooth_quant_alphas': {'convolution': -1, 'matmul': 0.95}, 'smooth_quant_alpha': None, 'backend_params': {}}" />
<fast_bias_correction value="True" />
<ignored_scope>
<types value="['GroupNormalization']" />
</ignored_scope>
<model_type value="transformer" />
<preset value="mixed" />
<subset_size value="300" />
<target_device value="ANY" />
</quantization>
</nncf>
<optimum>
<optimum_intel_version value="1.20.1" />
<optimum_version value="1.23.3" />
<pytorch_version value="2.5.0+cu121" />
<transformers_version value="4.46.2" />
</optimum>
</rt_info>
</net>