41330 lines
1.3 MiB
41330 lines
1.3 MiB
<?xml version="1.0"?>
|
|
<net name="Model786" version="11">
|
|
<layers>
|
|
<layer id="1" name="input_ids" type="Parameter" version="opset1">
|
|
<data shape="?,?" element_type="i64" />
|
|
<output>
|
|
<port id="0" precision="I64" names="input_ids">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="0" name="attention_mask" type="Parameter" version="opset1">
|
|
<data shape="?,?" element_type="i64" />
|
|
<output>
|
|
<port id="0" precision="I64" names="attention_mask">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2" name="Constant_1974064" type="Const" version="opset1">
|
|
<data element_type="i8" shape="50265, 1024" offset="0" size="51471360" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>50265</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="3" name="Convert_1974065" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>50265</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>50265</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="4" name="Constant_1974066" type="Const" version="opset1">
|
|
<data element_type="f32" shape="50265, 1" offset="51471360" size="201060" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>50265</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="5" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>50265</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>50265</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>50265</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="6" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
|
|
<data destination_type="i32" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="7" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Constant" type="Const" version="opset1">
|
|
<data element_type="i32" shape="" offset="51672420" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="8" name="__module.roberta.embeddings.word_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>50265</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="2" precision="I32" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="FP32" names="54,inputs_embeds">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="9" name="Constant_1974068" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1, 1024" offset="51672424" size="1024" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="10" name="Convert_1974069" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="11" name="Constant_1974070" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1" offset="51673448" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="12" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="13" name="__module.roberta/aten::slice/Slice" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1, 514" offset="51673452" size="4112" />
|
|
<output>
|
|
<port id="0" precision="I64" names="37">
|
|
<dim>1</dim>
|
|
<dim>514</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="14" name="__module.roberta/aten::slice/Reshape" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="51677564" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="15" name="__module.roberta/aten::size/ShapeOf_1" type="ShapeOf" version="opset3">
|
|
<data output_type="i64" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="I64" names="39">
|
|
<dim>2</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="16" name="Constant_857969" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="17" name="Constant_857970" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="51677564" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" />
|
|
</output>
|
|
</layer>
|
|
<layer id="18" name="Gather_857971" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="2" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="I64" names="36,67">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="19" name="__module.roberta/aten::slice/Reshape_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="20" name="__module.roberta/aten::slice/Reshape_3" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="21" name="__module.roberta/aten::slice/Slice_1" type="Slice" version="opset8">
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
<dim>514</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="2" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="3" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="4" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="I64" names="38,buffered_token_type_ids">
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="22" name="__module.roberta/aten::expand/Broadcast" type="Broadcast" version="opset3">
|
|
<data mode="bidirectional" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="40">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="23" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
|
|
<data destination_type="i32" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="24" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Constant" type="Const" version="opset1">
|
|
<data element_type="i32" shape="" offset="51672420" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="25" name="__module.roberta.embeddings.token_type_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="2" precision="I32" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="FP32" names="56,token_type_embeddings.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="26" name="__module.roberta.embeddings/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="57_1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="27" name="Constant_1974072" type="Const" version="opset1">
|
|
<data element_type="i8" shape="514, 1024" offset="51677580" size="526336" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>514</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="28" name="Convert_1974073" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>514</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>514</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="29" name="Constant_1974074" type="Const" version="opset1">
|
|
<data element_type="f32" shape="514, 1" offset="52203916" size="2056" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>514</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="30" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Gather/fq_weights_0" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>514</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>514</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>514</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="31" name="Constant_857534" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1, 1" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="32" name="__module.roberta.embeddings/aten::ne/NotEqual" type="NotEqual" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="BOOL" names="45">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="33" name="__module.roberta.embeddings/aten::to/Convert" type="Convert" version="opset1">
|
|
<data destination_type="i32" />
|
|
<input>
|
|
<port id="0" precision="BOOL">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="I32" names="46,mask">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="34" name="29" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" names="29" />
|
|
</output>
|
|
</layer>
|
|
<layer id="35" name="__module.roberta.embeddings/aten::cumsum/CumSum" type="CumSum" version="opset3">
|
|
<data exclusive="false" reverse="false" />
|
|
<input>
|
|
<port id="0" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I32" names="47,48,49">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="36" name="__module.roberta.embeddings/aten::mul/Multiply" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I32" names="50,incremental_indices">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="37" name="__module.roberta.embeddings/aten::to/Convert_1" type="Convert" version="opset1">
|
|
<data destination_type="i64" />
|
|
<input>
|
|
<port id="0" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="I64" names="51">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="38" name="Constant_857535" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1, 1" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="39" name="__module.roberta.embeddings/aten::add/Add_2" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="52">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="40" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Convert" type="Convert" version="opset1">
|
|
<data destination_type="i32" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="41" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Constant" type="Const" version="opset1">
|
|
<data element_type="i32" shape="" offset="51672420" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="42" name="__module.roberta.embeddings.position_embeddings/aten::embedding/Gather" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>514</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="2" precision="I32" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="FP32" names="59,position_embeddings.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="43" name="__module.roberta.embeddings/aten::add_/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="57,embeddings.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="44" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="45" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="46" name="Constant_857536" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="52205976" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="47" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="48" name="Constant_857537" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="52210072" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="49" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="64,input.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="50" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="52214168" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="51" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="52" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="52218264" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="53" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="52218268" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="54" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="52218264" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="55" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="52218268" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="56" name="__module.roberta.embeddings.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="57" name="Constant_1974076" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="52218272" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="58" name="Convert_1974077" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="59" name="Constant_1974078" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="53266848" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="60" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="61" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="62" name="Constant_857538" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="53270944" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="63" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="138,x.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="64" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="53275040" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="65" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="53275044" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="66" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="53275040" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="67" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="53275044" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="68" name="__module.roberta.encoder.layer.0.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="69" name="__module.roberta.encoder.layer.0.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="70" name="__module.roberta.encoder.layer.0.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="142,x.3">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="71" name="Constant_843173" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="143">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="72" name="__module.roberta.encoder.layer.0.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="144">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="73" name="Constant_1974080" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="53275112" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="74" name="Convert_1974081" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="75" name="Constant_1974082" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="54323688" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="76" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="77" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="78" name="Constant_857539" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="54327784" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="79" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="147,x.5">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="80" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="54331880" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="81" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="54331884" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="82" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="54331880" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="83" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="54331884" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="84" name="__module.roberta.encoder.layer.0.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="85" name="__module.roberta.encoder.layer.0.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="86" name="__module.roberta.encoder.layer.0.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="151,x.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="87" name="Constant_843196" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="152">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="88" name="__module.roberta.encoder.layer.0.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="153">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="89" name="Constant_1974084" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="54331888" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="90" name="Convert_1974085" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="91" name="Constant_1974086" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="55380464" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="92" name="__module.roberta.encoder.layer.0.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="93" name="__module.roberta.encoder.layer.0.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="94" name="Constant_857540" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="55384560" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="95" name="__module.roberta.encoder.layer.0.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="156,x.9">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="96" name="__module.roberta.encoder.layer.0.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="97" name="__module.roberta.encoder.layer.0.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="160,x.11">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="98" name="Constant_843219" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="161">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="99" name="__module.roberta.encoder.layer.0.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="162">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="100" name="Constant_857542" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1, 1" offset="55388656" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="101" name="__module.roberta/aten::unsqueeze/Unsqueeze" type="Unsqueeze" version="opset1">
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="69">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="102" name="16" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="55388660" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" names="16" />
|
|
</output>
|
|
</layer>
|
|
<layer id="103" name="__module.roberta/aten::unsqueeze/Unsqueeze_1" type="Unsqueeze" version="opset1">
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="70,71">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="104" name="Constant_857974" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="51677564" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="105" name="Constant_857975" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="51677564" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" />
|
|
</output>
|
|
</layer>
|
|
<layer id="106" name="Gather_857976" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="2" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="I64" names="66">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="107" name="Constant_854998" type="Const" version="opset1">
|
|
<data element_type="i64" shape="1" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="108" name="Constant_858098" type="Const" version="opset1">
|
|
<data element_type="i64" shape="2" offset="55388668" size="16" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="109" name="Constant_858099" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="51677564" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" />
|
|
</output>
|
|
</layer>
|
|
<layer id="110" name="Gather_858100" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
<port id="2" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="111" name="__module.roberta/prim::ListConstruct/Concat_1" type="Concat" version="opset1">
|
|
<data axis="0" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="2" precision="I64">
|
|
<dim>2</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="I64" names="72">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="112" name="__module.roberta/aten::expand/Broadcast_1" type="Broadcast" version="opset3">
|
|
<data mode="bidirectional" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="I64" names="73">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="113" name="__module.roberta/aten::to/Convert" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I64">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="74">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="114" name="Constant_857541" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1, 1" offset="55388656" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="115" name="__module.roberta/aten::rsub/Multiply" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="116" name="__module.roberta/aten::rsub/Subtract" type="Subtract" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="75,inverted_mask">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="117" name="__module.roberta/aten::to/Convert_1" type="Convert" version="opset1">
|
|
<data destination_type="boolean" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="BOOL" names="76">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="118" name="__module.roberta/aten::masked_fill/ConvertLike" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="55388684" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="119" name="__module.roberta/aten::masked_fill/Select" type="Select" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="BOOL">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="FP32" names="77">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="120" name="__module.roberta.encoder.layer.0.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="163,attn_output.1">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="121" name="__module.roberta.encoder.layer.0.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="122" name="__module.roberta.encoder.layer.0.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="164,attn_output.3">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="123" name="Constant_857978" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="124" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="166">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="125" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="55388728" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="126" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="127" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="55392824" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="128" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="55392828" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="129" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="55392824" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="130" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="55392828" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="131" name="__module.roberta.encoder.layer.0.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="132" name="Constant_1974088" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="55392832" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="133" name="Convert_1974089" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="134" name="Constant_1974090" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="56441408" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="135" name="__module.roberta.encoder.layer.0.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="136" name="__module.roberta.encoder.layer.0.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="137" name="Constant_857543" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="56445504" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="138" name="__module.roberta.encoder.layer.0.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="171,input.3">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="139" name="__module.roberta.encoder.layer.0.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="173">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="140" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="141" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="142" name="Constant_857544" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="56449600" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="143" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="144" name="Constant_857545" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="56453696" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="145" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="177,input_tensor.1">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="146" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="56457792" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="147" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="148" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="56461888" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="149" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="56461892" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="150" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="56461888" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="151" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="56461892" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="152" name="__module.roberta.encoder.layer.0.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="153" name="Constant_1974092" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="56461896" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="154" name="Convert_1974093" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="155" name="Constant_1974094" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="60656200" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="156" name="__module.roberta.encoder.layer.0.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="157" name="__module.roberta.encoder.layer.0.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="158" name="Constant_857546" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="60672584" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="159" name="__module.roberta.encoder.layer.0.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="181">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="160" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="182">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="161" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="60688968" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="162" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="163" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="60705352" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="164" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="60705356" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="165" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="60705352" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="166" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="60705356" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="167" name="__module.roberta.encoder.layer.0.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="168" name="Constant_1974096" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="60705360" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="169" name="Convert_1974097" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="170" name="Constant_1974098" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="64899664" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="171" name="__module.roberta.encoder.layer.0.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="172" name="__module.roberta.encoder.layer.0.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="173" name="Constant_857547" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="64903760" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="174" name="__module.roberta.encoder.layer.0.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="187,input.5">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="175" name="__module.roberta.encoder.layer.0.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="189">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="176" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="177" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="178" name="Constant_857548" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="64907856" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="179" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="180" name="Constant_857549" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="64911952" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="181" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="193,hidden_states.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="182" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="64916048" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="183" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="184" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="64920144" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="185" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="64920148" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="186" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="64920144" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="187" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="64920148" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="188" name="__module.roberta.encoder.layer.0.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="189" name="Constant_1974100" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="64920152" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="190" name="Convert_1974101" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="191" name="Constant_1974102" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="65968728" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="192" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="193" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="194" name="Constant_857550" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="65972824" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="195" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="206,x.13">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="196" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="65976920" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="197" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="65976924" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="198" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="65976920" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="199" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="65976924" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="200" name="__module.roberta.encoder.layer.1.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="201" name="__module.roberta.encoder.layer.1.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="202" name="__module.roberta.encoder.layer.1.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="210,x.15">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="203" name="Constant_843396" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="211">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="204" name="__module.roberta.encoder.layer.1.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="212">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="205" name="Constant_1974104" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="65976928" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="206" name="Convert_1974105" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="207" name="Constant_1974106" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="67025504" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="208" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="209" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="210" name="Constant_857551" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="67029600" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="211" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="215,x.17">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="212" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="67033696" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="213" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="67033700" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="214" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="67033696" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="215" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="67033700" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="216" name="__module.roberta.encoder.layer.1.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="217" name="__module.roberta.encoder.layer.1.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="218" name="__module.roberta.encoder.layer.1.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="219,x.19">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="219" name="Constant_843419" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="220">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="220" name="__module.roberta.encoder.layer.1.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="221">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="221" name="Constant_1974108" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="67033704" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="222" name="Convert_1974109" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="223" name="Constant_1974110" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="68082280" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="224" name="__module.roberta.encoder.layer.1.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="225" name="__module.roberta.encoder.layer.1.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="226" name="Constant_857552" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="68086376" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="227" name="__module.roberta.encoder.layer.1.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="224,x.21">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="228" name="__module.roberta.encoder.layer.1.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="229" name="__module.roberta.encoder.layer.1.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="228,x.23">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="230" name="Constant_843442" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="229">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="231" name="__module.roberta.encoder.layer.1.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="230">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="232" name="__module.roberta.encoder.layer.1.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="231,attn_output.5">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="233" name="__module.roberta.encoder.layer.1.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="234" name="__module.roberta.encoder.layer.1.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="232,attn_output.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="235" name="Constant_857979" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="236" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="234">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="237" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="68090472" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="238" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="239" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="68094568" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="240" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="68094572" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="241" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="68094568" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="242" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="68094572" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="243" name="__module.roberta.encoder.layer.1.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="244" name="Constant_1974112" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="68094576" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="245" name="Convert_1974113" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="246" name="Constant_1974114" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="69143152" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="247" name="__module.roberta.encoder.layer.1.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="248" name="__module.roberta.encoder.layer.1.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="249" name="Constant_857553" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="69147248" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="250" name="__module.roberta.encoder.layer.1.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="239,input.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="251" name="__module.roberta.encoder.layer.1.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="241">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="252" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="253" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="254" name="Constant_857554" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="69151344" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="255" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="256" name="Constant_857555" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="69155440" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="257" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="245,input_tensor.3">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="258" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="69159536" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="259" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="260" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="69163632" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="261" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="69163636" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="262" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="69163632" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="263" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="69163636" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="264" name="__module.roberta.encoder.layer.1.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="265" name="Constant_1974116" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="69163640" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="266" name="Convert_1974117" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="267" name="Constant_1974118" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="73357944" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="268" name="__module.roberta.encoder.layer.1.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="269" name="__module.roberta.encoder.layer.1.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="270" name="Constant_857556" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="73374328" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="271" name="__module.roberta.encoder.layer.1.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="249">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="272" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="250">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="273" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="73390712" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="274" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="275" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="73407096" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="276" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="73407100" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="277" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="73407096" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="278" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="73407100" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="279" name="__module.roberta.encoder.layer.1.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="280" name="Constant_1974120" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="73407104" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="281" name="Convert_1974121" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="282" name="Constant_1974122" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="77601408" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="283" name="__module.roberta.encoder.layer.1.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="284" name="__module.roberta.encoder.layer.1.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="285" name="Constant_857557" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="77605504" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="286" name="__module.roberta.encoder.layer.1.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="255,input.9">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="287" name="__module.roberta.encoder.layer.1.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="257">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="288" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="289" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="290" name="Constant_857558" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="77609600" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="291" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="292" name="Constant_857559" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="77613696" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="293" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="261,hidden_states.13">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="294" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="77617792" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="295" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="296" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="77621888" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="297" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="77621892" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="298" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="77621888" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="299" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="77621892" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="300" name="__module.roberta.encoder.layer.1.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="301" name="Constant_1974124" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="77621896" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="302" name="Convert_1974125" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="303" name="Constant_1974126" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="78670472" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="304" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="305" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="306" name="Constant_857560" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="78674568" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="307" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="274,x.25">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="308" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="78678664" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="309" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="78678668" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="310" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="78678664" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="311" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="78678668" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="312" name="__module.roberta.encoder.layer.2.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="313" name="__module.roberta.encoder.layer.2.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="314" name="__module.roberta.encoder.layer.2.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="278,x.27">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="315" name="Constant_843619" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="279">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="316" name="__module.roberta.encoder.layer.2.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="280">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="317" name="Constant_1974128" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="78678672" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="318" name="Convert_1974129" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="319" name="Constant_1974130" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="79727248" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="320" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="321" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="322" name="Constant_857561" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="79731344" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="323" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="283,x.29">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="324" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="79735440" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="325" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="79735444" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="326" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="79735440" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="327" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="79735444" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="328" name="__module.roberta.encoder.layer.2.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="329" name="__module.roberta.encoder.layer.2.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="330" name="__module.roberta.encoder.layer.2.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="287,x.31">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="331" name="Constant_843642" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="288">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="332" name="__module.roberta.encoder.layer.2.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="289">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="333" name="Constant_1974132" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="79735448" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="334" name="Convert_1974133" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="335" name="Constant_1974134" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="80784024" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="336" name="__module.roberta.encoder.layer.2.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="337" name="__module.roberta.encoder.layer.2.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="338" name="Constant_857562" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="80788120" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="339" name="__module.roberta.encoder.layer.2.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="292,x.33">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="340" name="__module.roberta.encoder.layer.2.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="341" name="__module.roberta.encoder.layer.2.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="296,x.35">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="342" name="Constant_843665" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="297">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="343" name="__module.roberta.encoder.layer.2.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="298">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="344" name="__module.roberta.encoder.layer.2.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="299,attn_output.9">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="345" name="__module.roberta.encoder.layer.2.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="346" name="__module.roberta.encoder.layer.2.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="300,attn_output.11">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="347" name="Constant_857980" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="348" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="302">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="349" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="80792216" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="350" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="351" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="80796312" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="352" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="80796316" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="353" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="80796312" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="354" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="80796316" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="355" name="__module.roberta.encoder.layer.2.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="356" name="Constant_1974136" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="80796320" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="357" name="Convert_1974137" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="358" name="Constant_1974138" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="81844896" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="359" name="__module.roberta.encoder.layer.2.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="360" name="__module.roberta.encoder.layer.2.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="361" name="Constant_857563" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="81848992" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="362" name="__module.roberta.encoder.layer.2.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="307,input.11">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="363" name="__module.roberta.encoder.layer.2.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="309">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="364" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="365" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="366" name="Constant_857564" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="81853088" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="367" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="368" name="Constant_857565" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="81857184" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="369" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="313,input_tensor.5">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="370" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="81861280" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="371" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="372" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="81865376" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="373" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="81865380" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="374" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="81865376" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="375" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="81865380" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="376" name="__module.roberta.encoder.layer.2.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="377" name="Constant_1974140" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="81865384" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="378" name="Convert_1974141" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="379" name="Constant_1974142" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="86059688" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="380" name="__module.roberta.encoder.layer.2.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="381" name="__module.roberta.encoder.layer.2.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="382" name="Constant_857566" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="86076072" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="383" name="__module.roberta.encoder.layer.2.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="317">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="384" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="318">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="385" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="86092456" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="386" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="387" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="86108840" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="388" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="86108844" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="389" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="86108840" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="390" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="86108844" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="391" name="__module.roberta.encoder.layer.2.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="392" name="Constant_1974144" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="86108848" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="393" name="Convert_1974145" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="394" name="Constant_1974146" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="90303152" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="395" name="__module.roberta.encoder.layer.2.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="396" name="__module.roberta.encoder.layer.2.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="397" name="Constant_857567" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="90307248" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="398" name="__module.roberta.encoder.layer.2.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="323,input.13">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="399" name="__module.roberta.encoder.layer.2.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="325">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="400" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="401" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="402" name="Constant_857568" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="90311344" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="403" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="404" name="Constant_857569" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="90315440" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="405" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="329,hidden_states.19">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="406" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="90319536" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="407" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="408" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="90323632" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="409" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="90323636" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="410" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="90323632" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="411" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="90323636" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="412" name="__module.roberta.encoder.layer.2.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="413" name="Constant_1974148" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="90323640" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="414" name="Convert_1974149" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="415" name="Constant_1974150" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="91372216" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="416" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="417" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="418" name="Constant_857570" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="91376312" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="419" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="342,x.37">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="420" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="91380408" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="421" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="91380412" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="422" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="91380408" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="423" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="91380412" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="424" name="__module.roberta.encoder.layer.3.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="425" name="__module.roberta.encoder.layer.3.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="426" name="__module.roberta.encoder.layer.3.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="346,x.39">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="427" name="Constant_843842" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="347">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="428" name="__module.roberta.encoder.layer.3.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="348">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="429" name="Constant_1974152" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="91380416" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="430" name="Convert_1974153" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="431" name="Constant_1974154" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="92428992" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="432" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="433" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="434" name="Constant_857571" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="92433088" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="435" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="351,x.41">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="436" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="92437184" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="437" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="92437188" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="438" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="92437184" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="439" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="92437188" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="440" name="__module.roberta.encoder.layer.3.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="441" name="__module.roberta.encoder.layer.3.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="442" name="__module.roberta.encoder.layer.3.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="355,x.43">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="443" name="Constant_843865" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="356">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="444" name="__module.roberta.encoder.layer.3.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="357">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="445" name="Constant_1974156" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="92437192" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="446" name="Convert_1974157" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="447" name="Constant_1974158" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="93485768" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="448" name="__module.roberta.encoder.layer.3.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="449" name="__module.roberta.encoder.layer.3.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="450" name="Constant_857572" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="93489864" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="451" name="__module.roberta.encoder.layer.3.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="360,x.45">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="452" name="__module.roberta.encoder.layer.3.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="453" name="__module.roberta.encoder.layer.3.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="364,x.47">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="454" name="Constant_843888" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="365">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="455" name="__module.roberta.encoder.layer.3.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="366">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="456" name="__module.roberta.encoder.layer.3.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="367,attn_output.13">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="457" name="__module.roberta.encoder.layer.3.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="458" name="__module.roberta.encoder.layer.3.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="368,attn_output.15">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="459" name="Constant_857981" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="460" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="370">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="461" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="93493960" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="462" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="463" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="93498056" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="464" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="93498060" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="465" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="93498056" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="466" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="93498060" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="467" name="__module.roberta.encoder.layer.3.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="468" name="Constant_1974160" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="93498064" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="469" name="Convert_1974161" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="470" name="Constant_1974162" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="94546640" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="471" name="__module.roberta.encoder.layer.3.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="472" name="__module.roberta.encoder.layer.3.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="473" name="Constant_857573" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="94550736" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="474" name="__module.roberta.encoder.layer.3.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="375,input.15">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="475" name="__module.roberta.encoder.layer.3.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="377">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="476" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="477" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="478" name="Constant_857574" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="94554832" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="479" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="480" name="Constant_857575" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="94558928" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="481" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="381,input_tensor.7">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="482" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="94563024" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="483" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="484" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="94567120" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="485" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="94567124" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="486" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="94567120" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="487" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="94567124" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="488" name="__module.roberta.encoder.layer.3.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="489" name="Constant_1974164" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="94567128" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="490" name="Convert_1974165" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="491" name="Constant_1974166" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="98761432" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="492" name="__module.roberta.encoder.layer.3.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="493" name="__module.roberta.encoder.layer.3.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="494" name="Constant_857576" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="98777816" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="495" name="__module.roberta.encoder.layer.3.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="385">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="496" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="386">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="497" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="98794200" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="498" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="499" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="98810584" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="500" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="98810588" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="501" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="98810584" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="502" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="98810588" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="503" name="__module.roberta.encoder.layer.3.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="504" name="Constant_1974168" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="98810592" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="505" name="Convert_1974169" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="506" name="Constant_1974170" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="103004896" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="507" name="__module.roberta.encoder.layer.3.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="508" name="__module.roberta.encoder.layer.3.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="509" name="Constant_857577" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="103008992" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="510" name="__module.roberta.encoder.layer.3.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="391,input.17">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="511" name="__module.roberta.encoder.layer.3.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="393">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="512" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="513" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="514" name="Constant_857578" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="103013088" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="515" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="516" name="Constant_857579" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="103017184" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="517" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="397,hidden_states.25">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="518" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="103021280" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="519" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="520" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="103025376" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="521" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="103025380" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="522" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="103025376" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="523" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="103025380" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="524" name="__module.roberta.encoder.layer.3.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="525" name="Constant_1974172" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="103025384" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="526" name="Convert_1974173" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="527" name="Constant_1974174" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="104073960" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="528" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="529" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="530" name="Constant_857580" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="104078056" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="531" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="410,x.49">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="532" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="104082152" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="533" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="104082156" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="534" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="104082152" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="535" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="104082156" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="536" name="__module.roberta.encoder.layer.4.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="537" name="__module.roberta.encoder.layer.4.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="538" name="__module.roberta.encoder.layer.4.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="414,x.51">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="539" name="Constant_844065" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="415">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="540" name="__module.roberta.encoder.layer.4.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="416">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="541" name="Constant_1974176" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="104082160" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="542" name="Convert_1974177" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="543" name="Constant_1974178" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="105130736" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="544" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="545" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="546" name="Constant_857581" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="105134832" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="547" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="419,x.53">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="548" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="105138928" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="549" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="105138932" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="550" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="105138928" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="551" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="105138932" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="552" name="__module.roberta.encoder.layer.4.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="553" name="__module.roberta.encoder.layer.4.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="554" name="__module.roberta.encoder.layer.4.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="423,x.55">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="555" name="Constant_844088" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="424">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="556" name="__module.roberta.encoder.layer.4.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="425">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="557" name="Constant_1974180" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="105138936" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="558" name="Convert_1974181" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="559" name="Constant_1974182" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="106187512" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="560" name="__module.roberta.encoder.layer.4.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="561" name="__module.roberta.encoder.layer.4.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="562" name="Constant_857582" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="106191608" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="563" name="__module.roberta.encoder.layer.4.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="428,x.57">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="564" name="__module.roberta.encoder.layer.4.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="565" name="__module.roberta.encoder.layer.4.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="432,x.59">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="566" name="Constant_844111" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="433">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="567" name="__module.roberta.encoder.layer.4.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="434">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="568" name="__module.roberta.encoder.layer.4.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="435,attn_output.17">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="569" name="__module.roberta.encoder.layer.4.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="570" name="__module.roberta.encoder.layer.4.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="436,attn_output.19">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="571" name="Constant_857982" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="572" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="438">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="573" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="106195704" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="574" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="575" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="106199800" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="576" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="106199804" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="577" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="106199800" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="578" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="106199804" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="579" name="__module.roberta.encoder.layer.4.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="580" name="Constant_1974184" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="106199808" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="581" name="Convert_1974185" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="582" name="Constant_1974186" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="107248384" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="583" name="__module.roberta.encoder.layer.4.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="584" name="__module.roberta.encoder.layer.4.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="585" name="Constant_857583" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="107252480" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="586" name="__module.roberta.encoder.layer.4.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="443,input.19">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="587" name="__module.roberta.encoder.layer.4.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="445">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="588" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="589" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="590" name="Constant_857584" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="107256576" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="591" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="592" name="Constant_857585" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="107260672" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="593" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="449,input_tensor.9">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="594" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="107264768" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="595" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="596" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="107268864" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="597" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="107268868" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="598" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="107268864" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="599" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="107268868" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="600" name="__module.roberta.encoder.layer.4.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="601" name="Constant_1974188" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="107268872" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="602" name="Convert_1974189" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="603" name="Constant_1974190" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="111463176" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="604" name="__module.roberta.encoder.layer.4.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="605" name="__module.roberta.encoder.layer.4.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="606" name="Constant_857586" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="111479560" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="607" name="__module.roberta.encoder.layer.4.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="453">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="608" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="454">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="609" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="111495944" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="610" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="611" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="111512328" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="612" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="111512332" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="613" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="111512328" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="614" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="111512332" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="615" name="__module.roberta.encoder.layer.4.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="616" name="Constant_1974192" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="111512336" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="617" name="Convert_1974193" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="618" name="Constant_1974194" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="115706640" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="619" name="__module.roberta.encoder.layer.4.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="620" name="__module.roberta.encoder.layer.4.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="621" name="Constant_857587" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="115710736" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="622" name="__module.roberta.encoder.layer.4.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="459,input.21">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="623" name="__module.roberta.encoder.layer.4.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="461">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="624" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="625" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="626" name="Constant_857588" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="115714832" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="627" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="628" name="Constant_857589" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="115718928" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="629" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="465,hidden_states.31">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="630" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="115723024" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="631" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="632" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="115727120" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="633" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="115727124" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="634" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="115727120" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="635" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="115727124" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="636" name="__module.roberta.encoder.layer.4.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="637" name="Constant_1974196" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="115727128" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="638" name="Convert_1974197" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="639" name="Constant_1974198" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="116775704" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="640" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="641" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="642" name="Constant_857590" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="116779800" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="643" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="478,x.61">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="644" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="116783896" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="645" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="116783900" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="646" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="116783896" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="647" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="116783900" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="648" name="__module.roberta.encoder.layer.5.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="649" name="__module.roberta.encoder.layer.5.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="650" name="__module.roberta.encoder.layer.5.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="482,x.63">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="651" name="Constant_844288" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="483">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="652" name="__module.roberta.encoder.layer.5.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="484">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="653" name="Constant_1974200" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="116783904" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="654" name="Convert_1974201" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="655" name="Constant_1974202" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="117832480" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="656" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="657" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="658" name="Constant_857591" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="117836576" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="659" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="487,x.65">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="660" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="117840672" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="661" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="117840676" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="662" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="117840672" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="663" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="117840676" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="664" name="__module.roberta.encoder.layer.5.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="665" name="__module.roberta.encoder.layer.5.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="666" name="__module.roberta.encoder.layer.5.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="491,x.67">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="667" name="Constant_844311" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="492">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="668" name="__module.roberta.encoder.layer.5.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="493">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="669" name="Constant_1974204" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="117840680" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="670" name="Convert_1974205" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="671" name="Constant_1974206" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="118889256" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="672" name="__module.roberta.encoder.layer.5.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="673" name="__module.roberta.encoder.layer.5.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="674" name="Constant_857592" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="118893352" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="675" name="__module.roberta.encoder.layer.5.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="496,x.69">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="676" name="__module.roberta.encoder.layer.5.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="677" name="__module.roberta.encoder.layer.5.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="500,x.71">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="678" name="Constant_844334" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="501">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="679" name="__module.roberta.encoder.layer.5.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="502">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="680" name="__module.roberta.encoder.layer.5.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="503,attn_output.21">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="681" name="__module.roberta.encoder.layer.5.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="682" name="__module.roberta.encoder.layer.5.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="504,attn_output.23">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="683" name="Constant_857983" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="684" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="506">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="685" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="118897448" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="686" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="687" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="118901544" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="688" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="118901548" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="689" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="118901544" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="690" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="118901548" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="691" name="__module.roberta.encoder.layer.5.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="692" name="Constant_1974208" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="118901552" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="693" name="Convert_1974209" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="694" name="Constant_1974210" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="119950128" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="695" name="__module.roberta.encoder.layer.5.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="696" name="__module.roberta.encoder.layer.5.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="697" name="Constant_857593" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="119954224" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="698" name="__module.roberta.encoder.layer.5.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="511,input.23">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="699" name="__module.roberta.encoder.layer.5.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="513">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="700" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="701" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="702" name="Constant_857594" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="119958320" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="703" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="704" name="Constant_857595" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="119962416" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="705" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="517,input_tensor.11">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="706" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="119966512" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="707" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="708" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="119970608" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="709" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="119970612" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="710" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="119970608" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="711" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="119970612" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="712" name="__module.roberta.encoder.layer.5.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="713" name="Constant_1974212" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="119970616" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="714" name="Convert_1974213" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="715" name="Constant_1974214" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="124164920" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="716" name="__module.roberta.encoder.layer.5.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="717" name="__module.roberta.encoder.layer.5.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="718" name="Constant_857596" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="124181304" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="719" name="__module.roberta.encoder.layer.5.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="521">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="720" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="522">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="721" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="124197688" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="722" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="723" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="124214072" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="724" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="124214076" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="725" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="124214072" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="726" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="124214076" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="727" name="__module.roberta.encoder.layer.5.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="728" name="Constant_1974216" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="124214080" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="729" name="Convert_1974217" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="730" name="Constant_1974218" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="128408384" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="731" name="__module.roberta.encoder.layer.5.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="732" name="__module.roberta.encoder.layer.5.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="733" name="Constant_857597" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="128412480" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="734" name="__module.roberta.encoder.layer.5.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="527,input.25">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="735" name="__module.roberta.encoder.layer.5.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="529">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="736" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="737" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="738" name="Constant_857598" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="128416576" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="739" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="740" name="Constant_857599" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="128420672" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="741" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="533,hidden_states.37">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="742" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="128424768" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="743" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="744" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="128428864" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="745" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="128428868" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="746" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="128428864" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="747" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="128428868" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="748" name="__module.roberta.encoder.layer.5.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="749" name="Constant_1974220" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="128428872" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="750" name="Convert_1974221" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="751" name="Constant_1974222" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="129477448" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="752" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="753" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="754" name="Constant_857600" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="129481544" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="755" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="546,x.73">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="756" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="129485640" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="757" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="129485644" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="758" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="129485640" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="759" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="129485644" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="760" name="__module.roberta.encoder.layer.6.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="761" name="__module.roberta.encoder.layer.6.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="762" name="__module.roberta.encoder.layer.6.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="550,x.75">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="763" name="Constant_844511" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="551">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="764" name="__module.roberta.encoder.layer.6.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="552">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="765" name="Constant_1974224" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="129485648" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="766" name="Convert_1974225" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="767" name="Constant_1974226" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="130534224" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="768" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="769" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="770" name="Constant_857601" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="130538320" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="771" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="555,x.77">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="772" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="130542416" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="773" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="130542420" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="774" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="130542416" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="775" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="130542420" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="776" name="__module.roberta.encoder.layer.6.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="777" name="__module.roberta.encoder.layer.6.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="778" name="__module.roberta.encoder.layer.6.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="559,x.79">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="779" name="Constant_844534" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="560">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="780" name="__module.roberta.encoder.layer.6.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="561">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="781" name="Constant_1974228" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="130542424" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="782" name="Convert_1974229" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="783" name="Constant_1974230" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="131591000" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="784" name="__module.roberta.encoder.layer.6.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="785" name="__module.roberta.encoder.layer.6.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="786" name="Constant_857602" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="131595096" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="787" name="__module.roberta.encoder.layer.6.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="564,x.81">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="788" name="__module.roberta.encoder.layer.6.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="789" name="__module.roberta.encoder.layer.6.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="568,x.83">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="790" name="Constant_844557" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="569">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="791" name="__module.roberta.encoder.layer.6.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="570">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="792" name="__module.roberta.encoder.layer.6.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="571,attn_output.25">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="793" name="__module.roberta.encoder.layer.6.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="794" name="__module.roberta.encoder.layer.6.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="572,attn_output.27">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="795" name="Constant_857984" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="796" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="574">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="797" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="131599192" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="798" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="799" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="131603288" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="800" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="131603292" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="801" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="131603288" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="802" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="131603292" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="803" name="__module.roberta.encoder.layer.6.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="804" name="Constant_1974232" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="131603296" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="805" name="Convert_1974233" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="806" name="Constant_1974234" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="132651872" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="807" name="__module.roberta.encoder.layer.6.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="808" name="__module.roberta.encoder.layer.6.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="809" name="Constant_857603" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="132655968" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="810" name="__module.roberta.encoder.layer.6.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="579,input.27">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="811" name="__module.roberta.encoder.layer.6.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="581">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="812" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="813" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="814" name="Constant_857604" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="132660064" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="815" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="816" name="Constant_857605" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="132664160" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="817" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="585,input_tensor.13">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="818" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="132668256" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="819" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="820" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="132672352" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="821" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="132672356" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="822" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="132672352" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="823" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="132672356" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="824" name="__module.roberta.encoder.layer.6.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="825" name="Constant_1974236" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="132672360" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="826" name="Convert_1974237" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="827" name="Constant_1974238" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="136866664" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="828" name="__module.roberta.encoder.layer.6.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="829" name="__module.roberta.encoder.layer.6.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="830" name="Constant_857606" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="136883048" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="831" name="__module.roberta.encoder.layer.6.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="589">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="832" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="590">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="833" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="136899432" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="834" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="835" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="136915816" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="836" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="136915820" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="837" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="136915816" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="838" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="136915820" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="839" name="__module.roberta.encoder.layer.6.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="840" name="Constant_1974240" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="136915824" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="841" name="Convert_1974241" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="842" name="Constant_1974242" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="141110128" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="843" name="__module.roberta.encoder.layer.6.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="844" name="__module.roberta.encoder.layer.6.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="845" name="Constant_857607" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="141114224" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="846" name="__module.roberta.encoder.layer.6.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="595,input.29">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="847" name="__module.roberta.encoder.layer.6.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="597">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="848" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="849" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="850" name="Constant_857608" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="141118320" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="851" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="852" name="Constant_857609" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="141122416" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="853" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="601,hidden_states.43">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="854" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="141126512" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="855" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="856" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="141130608" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="857" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="141130612" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="858" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="141130608" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="859" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="141130612" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="860" name="__module.roberta.encoder.layer.6.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="861" name="Constant_1974244" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="141130616" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="862" name="Convert_1974245" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="863" name="Constant_1974246" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="142179192" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="864" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="865" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="866" name="Constant_857610" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="142183288" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="867" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="614,x.85">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="868" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="142187384" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="869" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="142187388" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="870" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="142187384" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="871" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="142187388" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="872" name="__module.roberta.encoder.layer.7.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="873" name="__module.roberta.encoder.layer.7.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="874" name="__module.roberta.encoder.layer.7.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="618,x.87">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="875" name="Constant_844734" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="619">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="876" name="__module.roberta.encoder.layer.7.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="620">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="877" name="Constant_1974248" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="142187392" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="878" name="Convert_1974249" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="879" name="Constant_1974250" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="143235968" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="880" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="881" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="882" name="Constant_857611" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="143240064" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="883" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="623,x.89">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="884" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="143244160" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="885" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="143244164" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="886" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="143244160" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="887" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="143244164" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="888" name="__module.roberta.encoder.layer.7.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="889" name="__module.roberta.encoder.layer.7.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="890" name="__module.roberta.encoder.layer.7.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="627,x.91">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="891" name="Constant_844757" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="628">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="892" name="__module.roberta.encoder.layer.7.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="629">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="893" name="Constant_1974252" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="143244168" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="894" name="Convert_1974253" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="895" name="Constant_1974254" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="144292744" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="896" name="__module.roberta.encoder.layer.7.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="897" name="__module.roberta.encoder.layer.7.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="898" name="Constant_857612" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="144296840" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="899" name="__module.roberta.encoder.layer.7.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="632,x.93">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="900" name="__module.roberta.encoder.layer.7.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="901" name="__module.roberta.encoder.layer.7.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="636,x.95">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="902" name="Constant_844780" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="637">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="903" name="__module.roberta.encoder.layer.7.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="638">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="904" name="__module.roberta.encoder.layer.7.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="639,attn_output.29">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="905" name="__module.roberta.encoder.layer.7.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="906" name="__module.roberta.encoder.layer.7.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="640,attn_output.31">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="907" name="Constant_857985" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="908" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="642">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="909" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="144300936" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="910" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="911" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="144305032" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="912" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="144305036" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="913" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="144305032" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="914" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="144305036" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="915" name="__module.roberta.encoder.layer.7.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="916" name="Constant_1974256" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="144305040" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="917" name="Convert_1974257" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="918" name="Constant_1974258" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="145353616" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="919" name="__module.roberta.encoder.layer.7.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="920" name="__module.roberta.encoder.layer.7.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="921" name="Constant_857613" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="145357712" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="922" name="__module.roberta.encoder.layer.7.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="647,input.31">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="923" name="__module.roberta.encoder.layer.7.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="649">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="924" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="925" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="926" name="Constant_857614" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="145361808" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="927" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="928" name="Constant_857615" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="145365904" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="929" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="653,input_tensor.15">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="930" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="145370000" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="931" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="932" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="145374096" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="933" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="145374100" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="934" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="145374096" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="935" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="145374100" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="936" name="__module.roberta.encoder.layer.7.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="937" name="Constant_1974260" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="145374104" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="938" name="Convert_1974261" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="939" name="Constant_1974262" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="149568408" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="940" name="__module.roberta.encoder.layer.7.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="941" name="__module.roberta.encoder.layer.7.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="942" name="Constant_857616" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="149584792" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="943" name="__module.roberta.encoder.layer.7.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="657">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="944" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="658">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="945" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="149601176" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="946" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="947" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="149617560" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="948" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="149617564" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="949" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="149617560" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="950" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="149617564" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="951" name="__module.roberta.encoder.layer.7.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="952" name="Constant_1974264" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="149617568" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="953" name="Convert_1974265" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="954" name="Constant_1974266" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="153811872" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="955" name="__module.roberta.encoder.layer.7.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="956" name="__module.roberta.encoder.layer.7.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="957" name="Constant_857617" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="153815968" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="958" name="__module.roberta.encoder.layer.7.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="663,input.33">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="959" name="__module.roberta.encoder.layer.7.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="665">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="960" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="961" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="962" name="Constant_857618" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="153820064" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="963" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="964" name="Constant_857619" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="153824160" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="965" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="669,hidden_states.49">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="966" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="153828256" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="967" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="968" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="153832352" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="969" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="153832356" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="970" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="153832352" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="971" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="153832356" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="972" name="__module.roberta.encoder.layer.7.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="973" name="Constant_1974268" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="153832360" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="974" name="Convert_1974269" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="975" name="Constant_1974270" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="154880936" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="976" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="977" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="978" name="Constant_857620" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="154885032" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="979" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="682,x.97">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="980" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="154889128" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="981" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="154889132" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="982" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="154889128" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="983" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="154889132" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="984" name="__module.roberta.encoder.layer.8.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="985" name="__module.roberta.encoder.layer.8.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="986" name="__module.roberta.encoder.layer.8.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="686,x.99">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="987" name="Constant_844957" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="687">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="988" name="__module.roberta.encoder.layer.8.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="688">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="989" name="Constant_1974272" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="154889136" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="990" name="Convert_1974273" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="991" name="Constant_1974274" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="155937712" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="992" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="993" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="994" name="Constant_857621" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="155941808" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="995" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="691,x.101">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="996" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="155945904" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="997" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="155945908" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="998" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="155945904" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="999" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="155945908" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1000" name="__module.roberta.encoder.layer.8.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1001" name="__module.roberta.encoder.layer.8.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1002" name="__module.roberta.encoder.layer.8.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="695,x.103">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1003" name="Constant_844980" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="696">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1004" name="__module.roberta.encoder.layer.8.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="697">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1005" name="Constant_1974276" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="155945912" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1006" name="Convert_1974277" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1007" name="Constant_1974278" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="156994488" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1008" name="__module.roberta.encoder.layer.8.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1009" name="__module.roberta.encoder.layer.8.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1010" name="Constant_857622" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="156998584" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1011" name="__module.roberta.encoder.layer.8.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="700,x.105">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1012" name="__module.roberta.encoder.layer.8.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1013" name="__module.roberta.encoder.layer.8.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="704,x.107">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1014" name="Constant_845003" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="705">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1015" name="__module.roberta.encoder.layer.8.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="706">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1016" name="__module.roberta.encoder.layer.8.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="707,attn_output.33">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1017" name="__module.roberta.encoder.layer.8.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1018" name="__module.roberta.encoder.layer.8.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="708,attn_output.35">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1019" name="Constant_857986" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1020" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="710">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1021" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="157002680" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1022" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1023" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="157006776" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1024" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="157006780" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1025" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="157006776" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1026" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="157006780" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1027" name="__module.roberta.encoder.layer.8.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1028" name="Constant_1974280" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="157006784" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1029" name="Convert_1974281" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1030" name="Constant_1974282" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="158055360" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1031" name="__module.roberta.encoder.layer.8.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1032" name="__module.roberta.encoder.layer.8.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1033" name="Constant_857623" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="158059456" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1034" name="__module.roberta.encoder.layer.8.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="715,input.35">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1035" name="__module.roberta.encoder.layer.8.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="717">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1036" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1037" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1038" name="Constant_857624" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="158063552" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1039" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1040" name="Constant_857625" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="158067648" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1041" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="721,input_tensor.17">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1042" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="158071744" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1043" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1044" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="158075840" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1045" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="158075844" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1046" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="158075840" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1047" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="158075844" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1048" name="__module.roberta.encoder.layer.8.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1049" name="Constant_1974284" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="158075848" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1050" name="Convert_1974285" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1051" name="Constant_1974286" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="162270152" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1052" name="__module.roberta.encoder.layer.8.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1053" name="__module.roberta.encoder.layer.8.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1054" name="Constant_857626" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="162286536" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1055" name="__module.roberta.encoder.layer.8.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="725">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1056" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="726">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1057" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="162302920" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1058" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1059" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="162319304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1060" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="162319308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1061" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="162319304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1062" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="162319308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1063" name="__module.roberta.encoder.layer.8.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1064" name="Constant_1974288" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="162319312" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1065" name="Convert_1974289" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1066" name="Constant_1974290" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="166513616" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1067" name="__module.roberta.encoder.layer.8.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1068" name="__module.roberta.encoder.layer.8.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1069" name="Constant_857627" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="166517712" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1070" name="__module.roberta.encoder.layer.8.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="731,input.37">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1071" name="__module.roberta.encoder.layer.8.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="733">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1072" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1073" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1074" name="Constant_857628" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="166521808" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1075" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1076" name="Constant_857629" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="166525904" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1077" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="737,hidden_states.55">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1078" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="166530000" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1079" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1080" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="166534096" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1081" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="166534100" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1082" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="166534096" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1083" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="166534100" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1084" name="__module.roberta.encoder.layer.8.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1085" name="Constant_1974292" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="166534104" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1086" name="Convert_1974293" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1087" name="Constant_1974294" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="167582680" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1088" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1089" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1090" name="Constant_857630" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="167586776" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1091" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="750,x.109">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1092" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="167590872" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1093" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="167590876" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1094" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="167590872" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1095" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="167590876" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1096" name="__module.roberta.encoder.layer.9.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1097" name="__module.roberta.encoder.layer.9.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1098" name="__module.roberta.encoder.layer.9.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="754,x.111">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1099" name="Constant_845180" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="755">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1100" name="__module.roberta.encoder.layer.9.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="756">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1101" name="Constant_1974296" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="167590880" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1102" name="Convert_1974297" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1103" name="Constant_1974298" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="168639456" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1104" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1105" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1106" name="Constant_857631" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="168643552" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1107" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="759,x.113">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1108" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="168647648" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1109" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="168647652" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1110" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="168647648" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1111" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="168647652" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1112" name="__module.roberta.encoder.layer.9.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1113" name="__module.roberta.encoder.layer.9.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1114" name="__module.roberta.encoder.layer.9.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="763,x.115">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1115" name="Constant_845203" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="764">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1116" name="__module.roberta.encoder.layer.9.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="765">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1117" name="Constant_1974300" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="168647656" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1118" name="Convert_1974301" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1119" name="Constant_1974302" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="169696232" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1120" name="__module.roberta.encoder.layer.9.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1121" name="__module.roberta.encoder.layer.9.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1122" name="Constant_857632" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="169700328" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1123" name="__module.roberta.encoder.layer.9.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="768,x.117">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1124" name="__module.roberta.encoder.layer.9.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1125" name="__module.roberta.encoder.layer.9.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="772,x.119">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1126" name="Constant_845226" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="773">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1127" name="__module.roberta.encoder.layer.9.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="774">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1128" name="__module.roberta.encoder.layer.9.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="775,attn_output.37">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1129" name="__module.roberta.encoder.layer.9.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1130" name="__module.roberta.encoder.layer.9.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="776,attn_output.39">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1131" name="Constant_857987" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1132" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="778">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1133" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="169704424" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1134" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1135" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="169708520" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1136" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="169708524" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1137" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="169708520" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1138" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="169708524" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1139" name="__module.roberta.encoder.layer.9.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1140" name="Constant_1974304" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="169708528" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1141" name="Convert_1974305" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1142" name="Constant_1974306" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="170757104" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1143" name="__module.roberta.encoder.layer.9.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1144" name="__module.roberta.encoder.layer.9.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1145" name="Constant_857633" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="170761200" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1146" name="__module.roberta.encoder.layer.9.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="783,input.39">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1147" name="__module.roberta.encoder.layer.9.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="785">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1148" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1149" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1150" name="Constant_857634" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="170765296" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1151" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1152" name="Constant_857635" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="170769392" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1153" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="789,input_tensor.19">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1154" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="170773488" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1155" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1156" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="170777584" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1157" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="170777588" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1158" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="170777584" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1159" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="170777588" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1160" name="__module.roberta.encoder.layer.9.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1161" name="Constant_1974308" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="170777592" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1162" name="Convert_1974309" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1163" name="Constant_1974310" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="174971896" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1164" name="__module.roberta.encoder.layer.9.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1165" name="__module.roberta.encoder.layer.9.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1166" name="Constant_857636" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="174988280" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1167" name="__module.roberta.encoder.layer.9.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="793">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1168" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="794">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1169" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="175004664" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1170" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1171" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="175021048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1172" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="175021052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1173" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="175021048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1174" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="175021052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1175" name="__module.roberta.encoder.layer.9.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1176" name="Constant_1974312" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="175021056" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1177" name="Convert_1974313" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1178" name="Constant_1974314" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="179215360" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1179" name="__module.roberta.encoder.layer.9.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1180" name="__module.roberta.encoder.layer.9.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1181" name="Constant_857637" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="179219456" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1182" name="__module.roberta.encoder.layer.9.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="799,input.41">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1183" name="__module.roberta.encoder.layer.9.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="801">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1184" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1185" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1186" name="Constant_857638" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="179223552" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1187" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1188" name="Constant_857639" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="179227648" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1189" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="805,hidden_states.61">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1190" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="179231744" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1191" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1192" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="179235840" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1193" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="179235844" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1194" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="179235840" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1195" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="179235844" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1196" name="__module.roberta.encoder.layer.9.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1197" name="Constant_1974316" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="179235848" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1198" name="Convert_1974317" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1199" name="Constant_1974318" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="180284424" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1200" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1201" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1202" name="Constant_857640" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="180288520" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1203" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="818,x.121">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1204" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="180292616" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1205" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="180292620" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1206" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="180292616" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1207" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="180292620" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1208" name="__module.roberta.encoder.layer.10.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1209" name="__module.roberta.encoder.layer.10.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1210" name="__module.roberta.encoder.layer.10.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="822,x.123">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1211" name="Constant_845403" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="823">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1212" name="__module.roberta.encoder.layer.10.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="824">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1213" name="Constant_1974320" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="180292624" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1214" name="Convert_1974321" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1215" name="Constant_1974322" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="181341200" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1216" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1217" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1218" name="Constant_857641" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="181345296" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1219" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="827,x.125">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1220" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="181349392" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1221" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="181349396" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1222" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="181349392" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1223" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="181349396" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1224" name="__module.roberta.encoder.layer.10.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1225" name="__module.roberta.encoder.layer.10.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1226" name="__module.roberta.encoder.layer.10.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="831,x.127">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1227" name="Constant_845426" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="832">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1228" name="__module.roberta.encoder.layer.10.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="833">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1229" name="Constant_1974324" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="181349400" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1230" name="Convert_1974325" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1231" name="Constant_1974326" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="182397976" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1232" name="__module.roberta.encoder.layer.10.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1233" name="__module.roberta.encoder.layer.10.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1234" name="Constant_857642" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="182402072" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1235" name="__module.roberta.encoder.layer.10.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="836,x.129">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1236" name="__module.roberta.encoder.layer.10.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1237" name="__module.roberta.encoder.layer.10.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="840,x.131">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1238" name="Constant_845449" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="841">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1239" name="__module.roberta.encoder.layer.10.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="842">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1240" name="__module.roberta.encoder.layer.10.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="843,attn_output.41">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1241" name="__module.roberta.encoder.layer.10.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1242" name="__module.roberta.encoder.layer.10.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="844,attn_output.43">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1243" name="Constant_857988" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1244" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="846">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1245" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="182406168" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1246" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1247" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="182410264" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1248" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="182410268" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1249" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="182410264" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1250" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="182410268" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1251" name="__module.roberta.encoder.layer.10.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1252" name="Constant_1974328" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="182410272" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1253" name="Convert_1974329" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1254" name="Constant_1974330" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="183458848" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1255" name="__module.roberta.encoder.layer.10.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1256" name="__module.roberta.encoder.layer.10.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1257" name="Constant_857643" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="183462944" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1258" name="__module.roberta.encoder.layer.10.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="851,input.43">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1259" name="__module.roberta.encoder.layer.10.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="853">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1260" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1261" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1262" name="Constant_857644" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="183467040" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1263" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1264" name="Constant_857645" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="183471136" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1265" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="857,input_tensor.21">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1266" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="183475232" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1267" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1268" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="183479328" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1269" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="183479332" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1270" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="183479328" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1271" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="183479332" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1272" name="__module.roberta.encoder.layer.10.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1273" name="Constant_1974332" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="183479336" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1274" name="Convert_1974333" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1275" name="Constant_1974334" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="187673640" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1276" name="__module.roberta.encoder.layer.10.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1277" name="__module.roberta.encoder.layer.10.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1278" name="Constant_857646" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="187690024" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1279" name="__module.roberta.encoder.layer.10.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="861">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1280" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="862">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1281" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="187706408" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1282" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1283" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="187722792" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1284" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="187722796" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1285" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="187722792" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1286" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="187722796" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1287" name="__module.roberta.encoder.layer.10.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1288" name="Constant_1974336" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="187722800" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1289" name="Convert_1974337" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1290" name="Constant_1974338" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="191917104" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1291" name="__module.roberta.encoder.layer.10.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1292" name="__module.roberta.encoder.layer.10.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1293" name="Constant_857647" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="191921200" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1294" name="__module.roberta.encoder.layer.10.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="867,input.45">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1295" name="__module.roberta.encoder.layer.10.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="869">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1296" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1297" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1298" name="Constant_857648" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="191925296" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1299" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1300" name="Constant_857649" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="191929392" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1301" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="873,hidden_states.67">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1302" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="191933488" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1303" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1304" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="191937584" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1305" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="191937588" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1306" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="191937584" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1307" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="191937588" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1308" name="__module.roberta.encoder.layer.10.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1309" name="Constant_1974340" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="191937592" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1310" name="Convert_1974341" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1311" name="Constant_1974342" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="192986168" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1312" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1313" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1314" name="Constant_857650" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="192990264" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1315" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="886,x.133">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1316" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="192994360" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1317" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="192994364" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1318" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="192994360" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1319" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="192994364" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1320" name="__module.roberta.encoder.layer.11.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1321" name="__module.roberta.encoder.layer.11.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1322" name="__module.roberta.encoder.layer.11.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="890,x.135">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1323" name="Constant_845626" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="891">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1324" name="__module.roberta.encoder.layer.11.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="892">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1325" name="Constant_1974344" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="192994368" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1326" name="Convert_1974345" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1327" name="Constant_1974346" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="194042944" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1328" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1329" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1330" name="Constant_857651" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="194047040" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1331" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="895,x.137">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1332" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="194051136" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1333" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="194051140" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1334" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="194051136" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1335" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="194051140" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1336" name="__module.roberta.encoder.layer.11.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1337" name="__module.roberta.encoder.layer.11.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1338" name="__module.roberta.encoder.layer.11.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="899,x.139">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1339" name="Constant_845649" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="900">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1340" name="__module.roberta.encoder.layer.11.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="901">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1341" name="Constant_1974348" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="194051144" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1342" name="Convert_1974349" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1343" name="Constant_1974350" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="195099720" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1344" name="__module.roberta.encoder.layer.11.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1345" name="__module.roberta.encoder.layer.11.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1346" name="Constant_857652" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="195103816" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1347" name="__module.roberta.encoder.layer.11.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="904,x.141">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1348" name="__module.roberta.encoder.layer.11.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1349" name="__module.roberta.encoder.layer.11.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="908,x.143">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1350" name="Constant_845672" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="909">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1351" name="__module.roberta.encoder.layer.11.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="910">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1352" name="__module.roberta.encoder.layer.11.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="911,attn_output.45">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1353" name="__module.roberta.encoder.layer.11.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1354" name="__module.roberta.encoder.layer.11.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="912,attn_output.47">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1355" name="Constant_857989" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1356" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="914">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1357" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="195107912" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1358" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1359" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="195112008" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1360" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="195112012" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1361" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="195112008" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1362" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="195112012" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1363" name="__module.roberta.encoder.layer.11.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1364" name="Constant_1974352" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="195112016" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1365" name="Convert_1974353" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1366" name="Constant_1974354" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="196160592" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1367" name="__module.roberta.encoder.layer.11.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1368" name="__module.roberta.encoder.layer.11.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1369" name="Constant_857653" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="196164688" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1370" name="__module.roberta.encoder.layer.11.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="919,input.47">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1371" name="__module.roberta.encoder.layer.11.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="921">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1372" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1373" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1374" name="Constant_857654" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="196168784" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1375" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1376" name="Constant_857655" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="196172880" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1377" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="925,input_tensor.23">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1378" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="196176976" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1379" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1380" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="196181072" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1381" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="196181076" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1382" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="196181072" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1383" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="196181076" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1384" name="__module.roberta.encoder.layer.11.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1385" name="Constant_1974356" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="196181080" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1386" name="Convert_1974357" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1387" name="Constant_1974358" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="200375384" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1388" name="__module.roberta.encoder.layer.11.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1389" name="__module.roberta.encoder.layer.11.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1390" name="Constant_857656" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="200391768" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1391" name="__module.roberta.encoder.layer.11.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="929">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1392" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="930">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1393" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="200408152" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1394" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1395" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="200424536" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1396" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="200424540" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1397" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="200424536" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1398" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="200424540" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1399" name="__module.roberta.encoder.layer.11.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1400" name="Constant_1974360" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="200424544" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1401" name="Convert_1974361" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1402" name="Constant_1974362" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="204618848" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1403" name="__module.roberta.encoder.layer.11.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1404" name="__module.roberta.encoder.layer.11.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1405" name="Constant_857657" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="204622944" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1406" name="__module.roberta.encoder.layer.11.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="935,input.49">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1407" name="__module.roberta.encoder.layer.11.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="937">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1408" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1409" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1410" name="Constant_857658" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="204627040" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1411" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1412" name="Constant_857659" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="204631136" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1413" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="941,hidden_states.73">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1414" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="204635232" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1415" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1416" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="204639328" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1417" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="204639332" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1418" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="204639328" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1419" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="204639332" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1420" name="__module.roberta.encoder.layer.11.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1421" name="Constant_1974364" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="204639336" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1422" name="Convert_1974365" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1423" name="Constant_1974366" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="205687912" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1424" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1425" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1426" name="Constant_857660" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="205692008" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1427" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="954,x.145">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1428" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="205696104" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1429" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="205696108" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1430" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="205696104" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1431" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="205696108" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1432" name="__module.roberta.encoder.layer.12.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1433" name="__module.roberta.encoder.layer.12.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1434" name="__module.roberta.encoder.layer.12.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="958,x.147">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1435" name="Constant_845849" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="959">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1436" name="__module.roberta.encoder.layer.12.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="960">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1437" name="Constant_1974368" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="205696112" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1438" name="Convert_1974369" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1439" name="Constant_1974370" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="206744688" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1440" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1441" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1442" name="Constant_857661" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="206748784" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1443" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="963,x.149">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1444" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="206752880" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1445" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="206752884" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1446" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="206752880" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1447" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="206752884" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1448" name="__module.roberta.encoder.layer.12.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1449" name="__module.roberta.encoder.layer.12.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1450" name="__module.roberta.encoder.layer.12.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="967,x.151">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1451" name="Constant_845872" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="968">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1452" name="__module.roberta.encoder.layer.12.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="969">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1453" name="Constant_1974372" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="206752888" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1454" name="Convert_1974373" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1455" name="Constant_1974374" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="207801464" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1456" name="__module.roberta.encoder.layer.12.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1457" name="__module.roberta.encoder.layer.12.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1458" name="Constant_857662" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="207805560" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1459" name="__module.roberta.encoder.layer.12.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="972,x.153">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1460" name="__module.roberta.encoder.layer.12.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1461" name="__module.roberta.encoder.layer.12.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="976,x.155">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1462" name="Constant_845895" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="977">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1463" name="__module.roberta.encoder.layer.12.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="978">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1464" name="__module.roberta.encoder.layer.12.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="979,attn_output.49">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1465" name="__module.roberta.encoder.layer.12.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1466" name="__module.roberta.encoder.layer.12.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="980,attn_output.51">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1467" name="Constant_857990" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1468" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="982">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1469" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="207809656" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1470" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1471" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="207813752" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1472" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="207813756" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1473" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="207813752" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1474" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="207813756" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1475" name="__module.roberta.encoder.layer.12.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1476" name="Constant_1974376" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="207813760" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1477" name="Convert_1974377" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1478" name="Constant_1974378" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="208862336" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1479" name="__module.roberta.encoder.layer.12.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1480" name="__module.roberta.encoder.layer.12.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1481" name="Constant_857663" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="208866432" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1482" name="__module.roberta.encoder.layer.12.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="987,input.51">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1483" name="__module.roberta.encoder.layer.12.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="989">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1484" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1485" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1486" name="Constant_857664" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="208870528" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1487" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1488" name="Constant_857665" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="208874624" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1489" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="993,input_tensor.25">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1490" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="208878720" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1491" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1492" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="208882816" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1493" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="208882820" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1494" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="208882816" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1495" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="208882820" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1496" name="__module.roberta.encoder.layer.12.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1497" name="Constant_1974380" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="208882824" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1498" name="Convert_1974381" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1499" name="Constant_1974382" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="213077128" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1500" name="__module.roberta.encoder.layer.12.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1501" name="__module.roberta.encoder.layer.12.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1502" name="Constant_857666" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="213093512" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1503" name="__module.roberta.encoder.layer.12.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="997">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1504" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="998">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1505" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="213109896" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1506" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1507" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="213126280" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1508" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="213126284" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1509" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="213126280" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1510" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="213126284" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1511" name="__module.roberta.encoder.layer.12.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1512" name="Constant_1974384" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="213126288" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1513" name="Convert_1974385" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1514" name="Constant_1974386" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="217320592" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1515" name="__module.roberta.encoder.layer.12.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1516" name="__module.roberta.encoder.layer.12.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1517" name="Constant_857667" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="217324688" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1518" name="__module.roberta.encoder.layer.12.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1003,input.53">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1519" name="__module.roberta.encoder.layer.12.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1005">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1520" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1521" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1522" name="Constant_857668" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="217328784" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1523" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1524" name="Constant_857669" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="217332880" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1525" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1009,hidden_states.79">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1526" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="217336976" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1527" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1528" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="217341072" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1529" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="217341076" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1530" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="217341072" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1531" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="217341076" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1532" name="__module.roberta.encoder.layer.12.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1533" name="Constant_1974388" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="217341080" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1534" name="Convert_1974389" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1535" name="Constant_1974390" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="218389656" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1536" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1537" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1538" name="Constant_857670" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="218393752" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1539" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1022,x.157">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1540" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="218397848" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1541" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="218397852" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1542" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="218397848" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1543" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="218397852" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1544" name="__module.roberta.encoder.layer.13.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1545" name="__module.roberta.encoder.layer.13.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1546" name="__module.roberta.encoder.layer.13.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1026,x.159">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1547" name="Constant_846072" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1027">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1548" name="__module.roberta.encoder.layer.13.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1028">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1549" name="Constant_1974392" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="218397856" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1550" name="Convert_1974393" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1551" name="Constant_1974394" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="219446432" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1552" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1553" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1554" name="Constant_857671" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="219450528" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1555" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1031,x.161">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1556" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="219454624" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1557" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="219454628" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1558" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="219454624" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1559" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="219454628" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1560" name="__module.roberta.encoder.layer.13.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1561" name="__module.roberta.encoder.layer.13.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1562" name="__module.roberta.encoder.layer.13.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1035,x.163">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1563" name="Constant_846095" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1036">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1564" name="__module.roberta.encoder.layer.13.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1037">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1565" name="Constant_1974396" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="219454632" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1566" name="Convert_1974397" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1567" name="Constant_1974398" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="220503208" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1568" name="__module.roberta.encoder.layer.13.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1569" name="__module.roberta.encoder.layer.13.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1570" name="Constant_857672" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="220507304" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1571" name="__module.roberta.encoder.layer.13.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1040,x.165">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1572" name="__module.roberta.encoder.layer.13.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1573" name="__module.roberta.encoder.layer.13.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1044,x.167">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1574" name="Constant_846118" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1045">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1575" name="__module.roberta.encoder.layer.13.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1046">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1576" name="__module.roberta.encoder.layer.13.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1047,attn_output.53">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1577" name="__module.roberta.encoder.layer.13.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1578" name="__module.roberta.encoder.layer.13.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1048,attn_output.55">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1579" name="Constant_857991" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1580" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1050">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1581" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="220511400" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1582" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1583" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="220515496" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1584" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="220515500" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1585" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="220515496" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1586" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="220515500" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1587" name="__module.roberta.encoder.layer.13.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1588" name="Constant_1974400" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="220515504" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1589" name="Convert_1974401" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1590" name="Constant_1974402" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="221564080" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1591" name="__module.roberta.encoder.layer.13.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1592" name="__module.roberta.encoder.layer.13.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1593" name="Constant_857673" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="221568176" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1594" name="__module.roberta.encoder.layer.13.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1055,input.55">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1595" name="__module.roberta.encoder.layer.13.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1057">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1596" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1597" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1598" name="Constant_857674" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="221572272" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1599" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1600" name="Constant_857675" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="221576368" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1601" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1061,input_tensor.27">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1602" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="221580464" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1603" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1604" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="221584560" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1605" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="221584564" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1606" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="221584560" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1607" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="221584564" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1608" name="__module.roberta.encoder.layer.13.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1609" name="Constant_1974404" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="221584568" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1610" name="Convert_1974405" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1611" name="Constant_1974406" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="225778872" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1612" name="__module.roberta.encoder.layer.13.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1613" name="__module.roberta.encoder.layer.13.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1614" name="Constant_857676" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="225795256" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1615" name="__module.roberta.encoder.layer.13.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1065">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1616" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1066">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1617" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="225811640" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1618" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1619" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="225828024" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1620" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="225828028" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1621" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="225828024" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1622" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="225828028" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1623" name="__module.roberta.encoder.layer.13.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1624" name="Constant_1974408" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="225828032" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1625" name="Convert_1974409" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1626" name="Constant_1974410" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="230022336" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1627" name="__module.roberta.encoder.layer.13.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1628" name="__module.roberta.encoder.layer.13.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1629" name="Constant_857677" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="230026432" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1630" name="__module.roberta.encoder.layer.13.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1071,input.57">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1631" name="__module.roberta.encoder.layer.13.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1073">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1632" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1633" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1634" name="Constant_857678" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="230030528" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1635" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1636" name="Constant_857679" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="230034624" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1637" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1077,hidden_states.85">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1638" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="230038720" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1639" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1640" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="230042816" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1641" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="230042820" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1642" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="230042816" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1643" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="230042820" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1644" name="__module.roberta.encoder.layer.13.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1645" name="Constant_1974412" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="230042824" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1646" name="Convert_1974413" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1647" name="Constant_1974414" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="231091400" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1648" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1649" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1650" name="Constant_857680" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="231095496" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1651" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1090,x.169">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1652" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="231099592" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1653" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="231099596" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1654" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="231099592" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1655" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="231099596" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1656" name="__module.roberta.encoder.layer.14.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1657" name="__module.roberta.encoder.layer.14.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1658" name="__module.roberta.encoder.layer.14.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1094,x.171">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1659" name="Constant_846295" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1095">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1660" name="__module.roberta.encoder.layer.14.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1096">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1661" name="Constant_1974416" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="231099600" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1662" name="Convert_1974417" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1663" name="Constant_1974418" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="232148176" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1664" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1665" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1666" name="Constant_857681" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="232152272" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1667" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1099,x.173">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1668" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="232156368" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1669" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="232156372" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1670" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="232156368" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1671" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="232156372" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1672" name="__module.roberta.encoder.layer.14.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1673" name="__module.roberta.encoder.layer.14.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1674" name="__module.roberta.encoder.layer.14.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1103,x.175">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1675" name="Constant_846318" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1104">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1676" name="__module.roberta.encoder.layer.14.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1105">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1677" name="Constant_1974420" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="232156376" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1678" name="Convert_1974421" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1679" name="Constant_1974422" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="233204952" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1680" name="__module.roberta.encoder.layer.14.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1681" name="__module.roberta.encoder.layer.14.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1682" name="Constant_857682" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="233209048" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1683" name="__module.roberta.encoder.layer.14.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1108,x.177">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1684" name="__module.roberta.encoder.layer.14.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1685" name="__module.roberta.encoder.layer.14.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1112,x.179">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1686" name="Constant_846341" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1113">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1687" name="__module.roberta.encoder.layer.14.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1114">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1688" name="__module.roberta.encoder.layer.14.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1115,attn_output.57">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1689" name="__module.roberta.encoder.layer.14.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1690" name="__module.roberta.encoder.layer.14.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1116,attn_output.59">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1691" name="Constant_857992" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1692" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1118">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1693" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="233213144" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1694" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1695" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="233217240" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1696" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="233217244" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1697" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="233217240" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1698" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="233217244" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1699" name="__module.roberta.encoder.layer.14.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1700" name="Constant_1974424" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="233217248" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1701" name="Convert_1974425" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1702" name="Constant_1974426" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="234265824" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1703" name="__module.roberta.encoder.layer.14.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1704" name="__module.roberta.encoder.layer.14.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1705" name="Constant_857683" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="234269920" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1706" name="__module.roberta.encoder.layer.14.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1123,input.59">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1707" name="__module.roberta.encoder.layer.14.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1125">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1708" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1709" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1710" name="Constant_857684" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="234274016" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1711" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1712" name="Constant_857685" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="234278112" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1713" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1129,input_tensor.29">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1714" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="234282208" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1715" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1716" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="234286304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1717" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="234286308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1718" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="234286304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1719" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="234286308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1720" name="__module.roberta.encoder.layer.14.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1721" name="Constant_1974428" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="234286312" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1722" name="Convert_1974429" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1723" name="Constant_1974430" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="238480616" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1724" name="__module.roberta.encoder.layer.14.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1725" name="__module.roberta.encoder.layer.14.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1726" name="Constant_857686" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="238497000" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1727" name="__module.roberta.encoder.layer.14.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1133">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1728" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1134">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1729" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="238513384" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1730" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1731" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="238529768" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1732" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="238529772" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1733" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="238529768" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1734" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="238529772" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1735" name="__module.roberta.encoder.layer.14.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1736" name="Constant_1974432" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="238529776" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1737" name="Convert_1974433" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1738" name="Constant_1974434" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="242724080" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1739" name="__module.roberta.encoder.layer.14.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1740" name="__module.roberta.encoder.layer.14.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1741" name="Constant_857687" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="242728176" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1742" name="__module.roberta.encoder.layer.14.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1139,input.61">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1743" name="__module.roberta.encoder.layer.14.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1141">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1744" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1745" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1746" name="Constant_857688" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="242732272" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1747" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1748" name="Constant_857689" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="242736368" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1749" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1145,hidden_states.91">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1750" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="242740464" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1751" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1752" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="242744560" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1753" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="242744564" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1754" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="242744560" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1755" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="242744564" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1756" name="__module.roberta.encoder.layer.14.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1757" name="Constant_1974436" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="242744568" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1758" name="Convert_1974437" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1759" name="Constant_1974438" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="243793144" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1760" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1761" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1762" name="Constant_857690" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="243797240" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1763" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1158,x.181">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1764" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="243801336" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1765" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="243801340" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1766" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="243801336" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1767" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="243801340" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1768" name="__module.roberta.encoder.layer.15.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1769" name="__module.roberta.encoder.layer.15.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1770" name="__module.roberta.encoder.layer.15.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1162,x.183">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1771" name="Constant_846518" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1163">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1772" name="__module.roberta.encoder.layer.15.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1164">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1773" name="Constant_1974440" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="243801344" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1774" name="Convert_1974441" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1775" name="Constant_1974442" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="244849920" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1776" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1777" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1778" name="Constant_857691" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="244854016" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1779" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1167,x.185">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1780" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="244858112" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1781" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="244858116" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1782" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="244858112" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1783" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="244858116" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1784" name="__module.roberta.encoder.layer.15.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1785" name="__module.roberta.encoder.layer.15.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1786" name="__module.roberta.encoder.layer.15.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1171,x.187">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1787" name="Constant_846541" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1172">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1788" name="__module.roberta.encoder.layer.15.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1173">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1789" name="Constant_1974444" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="244858120" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1790" name="Convert_1974445" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1791" name="Constant_1974446" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="245906696" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1792" name="__module.roberta.encoder.layer.15.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1793" name="__module.roberta.encoder.layer.15.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1794" name="Constant_857692" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="245910792" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1795" name="__module.roberta.encoder.layer.15.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1176,x.189">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1796" name="__module.roberta.encoder.layer.15.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1797" name="__module.roberta.encoder.layer.15.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1180,x.191">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1798" name="Constant_846564" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1181">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1799" name="__module.roberta.encoder.layer.15.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1182">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1800" name="__module.roberta.encoder.layer.15.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1183,attn_output.61">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1801" name="__module.roberta.encoder.layer.15.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1802" name="__module.roberta.encoder.layer.15.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1184,attn_output.63">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1803" name="Constant_857993" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1804" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1186">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1805" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="245914888" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1806" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1807" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="245918984" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1808" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="245918988" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1809" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="245918984" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1810" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="245918988" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1811" name="__module.roberta.encoder.layer.15.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1812" name="Constant_1974448" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="245918992" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1813" name="Convert_1974449" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1814" name="Constant_1974450" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="246967568" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1815" name="__module.roberta.encoder.layer.15.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1816" name="__module.roberta.encoder.layer.15.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1817" name="Constant_857693" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="246971664" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1818" name="__module.roberta.encoder.layer.15.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1191,input.63">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1819" name="__module.roberta.encoder.layer.15.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1193">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1820" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1821" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1822" name="Constant_857694" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="246975760" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1823" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1824" name="Constant_857695" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="246979856" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1825" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1197,input_tensor.31">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1826" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="246983952" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1827" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1828" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="246988048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1829" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="246988052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1830" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="246988048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1831" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="246988052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1832" name="__module.roberta.encoder.layer.15.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1833" name="Constant_1974452" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="246988056" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1834" name="Convert_1974453" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1835" name="Constant_1974454" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="251182360" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1836" name="__module.roberta.encoder.layer.15.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1837" name="__module.roberta.encoder.layer.15.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1838" name="Constant_857696" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="251198744" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1839" name="__module.roberta.encoder.layer.15.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1201">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1840" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1202">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1841" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="251215128" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1842" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1843" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="251231512" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1844" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="251231516" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1845" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="251231512" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1846" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="251231516" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1847" name="__module.roberta.encoder.layer.15.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1848" name="Constant_1974456" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="251231520" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1849" name="Convert_1974457" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1850" name="Constant_1974458" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="255425824" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1851" name="__module.roberta.encoder.layer.15.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1852" name="__module.roberta.encoder.layer.15.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1853" name="Constant_857697" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="255429920" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1854" name="__module.roberta.encoder.layer.15.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1207,input.65">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1855" name="__module.roberta.encoder.layer.15.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1209">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1856" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1857" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1858" name="Constant_857698" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="255434016" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1859" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1860" name="Constant_857699" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="255438112" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1861" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1213,hidden_states.97">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1862" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="255442208" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1863" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1864" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="255446304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1865" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="255446308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1866" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="255446304" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1867" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="255446308" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1868" name="__module.roberta.encoder.layer.15.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1869" name="Constant_1974460" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="255446312" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1870" name="Convert_1974461" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1871" name="Constant_1974462" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="256494888" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1872" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1873" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1874" name="Constant_857700" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="256498984" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1875" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1226,x.193">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1876" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="256503080" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1877" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="256503084" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1878" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="256503080" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1879" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="256503084" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1880" name="__module.roberta.encoder.layer.16.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1881" name="__module.roberta.encoder.layer.16.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1882" name="__module.roberta.encoder.layer.16.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1230,x.195">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1883" name="Constant_846741" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1231">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1884" name="__module.roberta.encoder.layer.16.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1232">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1885" name="Constant_1974464" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="256503088" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1886" name="Convert_1974465" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1887" name="Constant_1974466" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="257551664" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1888" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1889" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1890" name="Constant_857701" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="257555760" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1891" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1235,x.197">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1892" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="257559856" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1893" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="257559860" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1894" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="257559856" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1895" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="257559860" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1896" name="__module.roberta.encoder.layer.16.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1897" name="__module.roberta.encoder.layer.16.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1898" name="__module.roberta.encoder.layer.16.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1239,x.199">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1899" name="Constant_846764" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1240">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1900" name="__module.roberta.encoder.layer.16.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1241">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1901" name="Constant_1974468" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="257559864" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1902" name="Convert_1974469" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1903" name="Constant_1974470" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="258608440" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1904" name="__module.roberta.encoder.layer.16.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1905" name="__module.roberta.encoder.layer.16.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1906" name="Constant_857702" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="258612536" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1907" name="__module.roberta.encoder.layer.16.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1244,x.201">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1908" name="__module.roberta.encoder.layer.16.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1909" name="__module.roberta.encoder.layer.16.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1248,x.203">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1910" name="Constant_846787" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1249">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1911" name="__module.roberta.encoder.layer.16.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1250">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1912" name="__module.roberta.encoder.layer.16.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1251,attn_output.65">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1913" name="__module.roberta.encoder.layer.16.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1914" name="__module.roberta.encoder.layer.16.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1252,attn_output.67">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1915" name="Constant_857994" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1916" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1254">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1917" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="258616632" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1918" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1919" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="258620728" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1920" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="258620732" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1921" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="258620728" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1922" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="258620732" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1923" name="__module.roberta.encoder.layer.16.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1924" name="Constant_1974472" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="258620736" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1925" name="Convert_1974473" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1926" name="Constant_1974474" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="259669312" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1927" name="__module.roberta.encoder.layer.16.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1928" name="__module.roberta.encoder.layer.16.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1929" name="Constant_857703" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="259673408" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1930" name="__module.roberta.encoder.layer.16.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1259,input.67">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1931" name="__module.roberta.encoder.layer.16.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1261">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1932" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1933" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1934" name="Constant_857704" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="259677504" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1935" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1936" name="Constant_857705" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="259681600" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1937" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1265,input_tensor.33">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1938" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="259685696" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1939" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1940" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="259689792" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1941" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="259689796" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1942" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="259689792" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1943" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="259689796" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1944" name="__module.roberta.encoder.layer.16.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1945" name="Constant_1974476" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="259689800" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1946" name="Convert_1974477" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1947" name="Constant_1974478" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="263884104" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1948" name="__module.roberta.encoder.layer.16.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1949" name="__module.roberta.encoder.layer.16.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1950" name="Constant_857706" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="263900488" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1951" name="__module.roberta.encoder.layer.16.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1269">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1952" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1270">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1953" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="263916872" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1954" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1955" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="263933256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1956" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="263933260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1957" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="263933256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1958" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="263933260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1959" name="__module.roberta.encoder.layer.16.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1960" name="Constant_1974480" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="263933264" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1961" name="Convert_1974481" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1962" name="Constant_1974482" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="268127568" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1963" name="__module.roberta.encoder.layer.16.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1964" name="__module.roberta.encoder.layer.16.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1965" name="Constant_857707" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="268131664" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1966" name="__module.roberta.encoder.layer.16.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1275,input.69">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1967" name="__module.roberta.encoder.layer.16.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1277">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1968" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1969" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1970" name="Constant_857708" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="268135760" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1971" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1972" name="Constant_857709" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="268139856" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1973" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1281,hidden_states.103">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1974" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="268143952" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1975" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1976" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="268148048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1977" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="268148052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1978" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="268148048" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1979" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="268148052" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1980" name="__module.roberta.encoder.layer.16.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1981" name="Constant_1974484" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="268148056" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1982" name="Convert_1974485" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1983" name="Constant_1974486" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="269196632" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1984" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1985" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1986" name="Constant_857710" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="269200728" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1987" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1294,x.205">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1988" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="269204824" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1989" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="269204828" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1990" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="269204824" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1991" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="269204828" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="1992" name="__module.roberta.encoder.layer.17.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1993" name="__module.roberta.encoder.layer.17.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1994" name="__module.roberta.encoder.layer.17.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1298,x.207">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1995" name="Constant_846964" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1299">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1996" name="__module.roberta.encoder.layer.17.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1300">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1997" name="Constant_1974488" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="269204832" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1998" name="Convert_1974489" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="1999" name="Constant_1974490" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="270253408" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2000" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2001" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2002" name="Constant_857711" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="270257504" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2003" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1303,x.209">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2004" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="270261600" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2005" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="270261604" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2006" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="270261600" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2007" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="270261604" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2008" name="__module.roberta.encoder.layer.17.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2009" name="__module.roberta.encoder.layer.17.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2010" name="__module.roberta.encoder.layer.17.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1307,x.211">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2011" name="Constant_846987" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1308">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2012" name="__module.roberta.encoder.layer.17.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1309">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2013" name="Constant_1974492" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="270261608" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2014" name="Convert_1974493" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2015" name="Constant_1974494" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="271310184" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2016" name="__module.roberta.encoder.layer.17.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2017" name="__module.roberta.encoder.layer.17.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2018" name="Constant_857712" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="271314280" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2019" name="__module.roberta.encoder.layer.17.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1312,x.213">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2020" name="__module.roberta.encoder.layer.17.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2021" name="__module.roberta.encoder.layer.17.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1316,x.215">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2022" name="Constant_847010" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1317">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2023" name="__module.roberta.encoder.layer.17.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1318">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2024" name="__module.roberta.encoder.layer.17.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1319,attn_output.69">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2025" name="__module.roberta.encoder.layer.17.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2026" name="__module.roberta.encoder.layer.17.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1320,attn_output.71">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2027" name="Constant_857995" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2028" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1322">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2029" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="271318376" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2030" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2031" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="271322472" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2032" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="271322476" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2033" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="271322472" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2034" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="271322476" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2035" name="__module.roberta.encoder.layer.17.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2036" name="Constant_1974496" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="271322480" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2037" name="Convert_1974497" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2038" name="Constant_1974498" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="272371056" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2039" name="__module.roberta.encoder.layer.17.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2040" name="__module.roberta.encoder.layer.17.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2041" name="Constant_857713" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="272375152" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2042" name="__module.roberta.encoder.layer.17.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1327,input.71">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2043" name="__module.roberta.encoder.layer.17.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1329">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2044" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2045" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2046" name="Constant_857714" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="272379248" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2047" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2048" name="Constant_857715" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="272383344" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2049" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1333,input_tensor.35">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2050" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="272387440" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2051" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2052" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="272391536" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2053" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="272391540" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2054" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="272391536" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2055" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="272391540" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2056" name="__module.roberta.encoder.layer.17.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2057" name="Constant_1974500" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="272391544" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2058" name="Convert_1974501" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2059" name="Constant_1974502" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="276585848" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2060" name="__module.roberta.encoder.layer.17.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2061" name="__module.roberta.encoder.layer.17.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2062" name="Constant_857716" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="276602232" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2063" name="__module.roberta.encoder.layer.17.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1337">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2064" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1338">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2065" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="276618616" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2066" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2067" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="276635000" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2068" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="276635004" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2069" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="276635000" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2070" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="276635004" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2071" name="__module.roberta.encoder.layer.17.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2072" name="Constant_1974504" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="276635008" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2073" name="Convert_1974505" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2074" name="Constant_1974506" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="280829312" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2075" name="__module.roberta.encoder.layer.17.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2076" name="__module.roberta.encoder.layer.17.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2077" name="Constant_857717" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="280833408" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2078" name="__module.roberta.encoder.layer.17.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1343,input.73">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2079" name="__module.roberta.encoder.layer.17.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1345">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2080" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2081" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2082" name="Constant_857718" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="280837504" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2083" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2084" name="Constant_857719" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="280841600" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2085" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1349,hidden_states.109">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2086" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="280845696" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2087" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2088" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="280849792" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2089" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="280849796" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2090" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="280849792" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2091" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="280849796" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2092" name="__module.roberta.encoder.layer.17.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2093" name="Constant_1974508" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="280849800" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2094" name="Convert_1974509" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2095" name="Constant_1974510" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="281898376" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2096" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2097" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2098" name="Constant_857720" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="281902472" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2099" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1362,x.217">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2100" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="281906568" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2101" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="281906572" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2102" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="281906568" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2103" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="281906572" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2104" name="__module.roberta.encoder.layer.18.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2105" name="__module.roberta.encoder.layer.18.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2106" name="__module.roberta.encoder.layer.18.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1366,x.219">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2107" name="Constant_847187" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1367">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2108" name="__module.roberta.encoder.layer.18.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1368">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2109" name="Constant_1974512" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="281906576" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2110" name="Convert_1974513" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2111" name="Constant_1974514" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="282955152" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2112" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2113" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2114" name="Constant_857721" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="282959248" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2115" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1371,x.221">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2116" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="282963344" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2117" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="282963348" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2118" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="282963344" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2119" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="282963348" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2120" name="__module.roberta.encoder.layer.18.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2121" name="__module.roberta.encoder.layer.18.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2122" name="__module.roberta.encoder.layer.18.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1375,x.223">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2123" name="Constant_847210" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1376">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2124" name="__module.roberta.encoder.layer.18.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1377">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2125" name="Constant_1974516" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="282963352" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2126" name="Convert_1974517" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2127" name="Constant_1974518" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="284011928" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2128" name="__module.roberta.encoder.layer.18.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2129" name="__module.roberta.encoder.layer.18.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2130" name="Constant_857722" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="284016024" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2131" name="__module.roberta.encoder.layer.18.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1380,x.225">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2132" name="__module.roberta.encoder.layer.18.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2133" name="__module.roberta.encoder.layer.18.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1384,x.227">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2134" name="Constant_847233" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1385">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2135" name="__module.roberta.encoder.layer.18.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1386">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2136" name="__module.roberta.encoder.layer.18.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1387,attn_output.73">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2137" name="__module.roberta.encoder.layer.18.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2138" name="__module.roberta.encoder.layer.18.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1388,attn_output.75">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2139" name="Constant_857996" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2140" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1390">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2141" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="284020120" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2142" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2143" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="284024216" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2144" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="284024220" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2145" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="284024216" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2146" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="284024220" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2147" name="__module.roberta.encoder.layer.18.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2148" name="Constant_1974520" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="284024224" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2149" name="Convert_1974521" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2150" name="Constant_1974522" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="285072800" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2151" name="__module.roberta.encoder.layer.18.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2152" name="__module.roberta.encoder.layer.18.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2153" name="Constant_857723" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="285076896" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2154" name="__module.roberta.encoder.layer.18.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1395,input.75">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2155" name="__module.roberta.encoder.layer.18.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1397">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2156" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2157" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2158" name="Constant_857724" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="285080992" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2159" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2160" name="Constant_857725" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="285085088" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2161" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1401,input_tensor.37">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2162" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="285089184" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2163" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2164" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="285093280" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2165" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="285093284" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2166" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="285093280" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2167" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="285093284" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2168" name="__module.roberta.encoder.layer.18.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2169" name="Constant_1974524" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="285093288" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2170" name="Convert_1974525" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2171" name="Constant_1974526" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="289287592" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2172" name="__module.roberta.encoder.layer.18.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2173" name="__module.roberta.encoder.layer.18.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2174" name="Constant_857726" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="289303976" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2175" name="__module.roberta.encoder.layer.18.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1405">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2176" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1406">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2177" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="289320360" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2178" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2179" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="289336744" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2180" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="289336748" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2181" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="289336744" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2182" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="289336748" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2183" name="__module.roberta.encoder.layer.18.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2184" name="Constant_1974528" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="289336752" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2185" name="Convert_1974529" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2186" name="Constant_1974530" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="293531056" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2187" name="__module.roberta.encoder.layer.18.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2188" name="__module.roberta.encoder.layer.18.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2189" name="Constant_857727" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="293535152" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2190" name="__module.roberta.encoder.layer.18.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1411,input.77">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2191" name="__module.roberta.encoder.layer.18.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1413">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2192" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2193" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2194" name="Constant_857728" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="293539248" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2195" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2196" name="Constant_857729" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="293543344" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2197" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1417,hidden_states.115">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2198" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="293547440" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2199" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2200" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="293551536" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2201" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="293551540" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2202" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="293551536" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2203" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="293551540" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2204" name="__module.roberta.encoder.layer.18.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2205" name="Constant_1974532" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="293551544" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2206" name="Convert_1974533" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2207" name="Constant_1974534" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="294600120" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2208" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2209" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2210" name="Constant_857730" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="294604216" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2211" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1430,x.229">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2212" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="294608312" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2213" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="294608316" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2214" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="294608312" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2215" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="294608316" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2216" name="__module.roberta.encoder.layer.19.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2217" name="__module.roberta.encoder.layer.19.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2218" name="__module.roberta.encoder.layer.19.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1434,x.231">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2219" name="Constant_847410" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1435">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2220" name="__module.roberta.encoder.layer.19.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1436">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2221" name="Constant_1974536" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="294608320" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2222" name="Convert_1974537" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2223" name="Constant_1974538" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="295656896" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2224" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2225" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2226" name="Constant_857731" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="295660992" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2227" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1439,x.233">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2228" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="295665088" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2229" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="295665092" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2230" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="295665088" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2231" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="295665092" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2232" name="__module.roberta.encoder.layer.19.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2233" name="__module.roberta.encoder.layer.19.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2234" name="__module.roberta.encoder.layer.19.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1443,x.235">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2235" name="Constant_847433" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1444">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2236" name="__module.roberta.encoder.layer.19.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1445">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2237" name="Constant_1974540" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="295665096" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2238" name="Convert_1974541" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2239" name="Constant_1974542" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="296713672" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2240" name="__module.roberta.encoder.layer.19.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2241" name="__module.roberta.encoder.layer.19.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2242" name="Constant_857732" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="296717768" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2243" name="__module.roberta.encoder.layer.19.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1448,x.237">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2244" name="__module.roberta.encoder.layer.19.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2245" name="__module.roberta.encoder.layer.19.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1452,x.239">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2246" name="Constant_847456" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1453">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2247" name="__module.roberta.encoder.layer.19.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1454">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2248" name="__module.roberta.encoder.layer.19.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1455,attn_output.77">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2249" name="__module.roberta.encoder.layer.19.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2250" name="__module.roberta.encoder.layer.19.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1456,attn_output.79">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2251" name="Constant_857997" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2252" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1458">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2253" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="296721864" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2254" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2255" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="296725960" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2256" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="296725964" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2257" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="296725960" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2258" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="296725964" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2259" name="__module.roberta.encoder.layer.19.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2260" name="Constant_1974544" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="296725968" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2261" name="Convert_1974545" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2262" name="Constant_1974546" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="297774544" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2263" name="__module.roberta.encoder.layer.19.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2264" name="__module.roberta.encoder.layer.19.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2265" name="Constant_857733" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="297778640" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2266" name="__module.roberta.encoder.layer.19.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1463,input.79">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2267" name="__module.roberta.encoder.layer.19.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1465">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2268" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2269" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2270" name="Constant_857734" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="297782736" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2271" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2272" name="Constant_857735" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="297786832" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2273" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1469,input_tensor.39">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2274" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="297790928" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2275" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2276" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="297795024" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2277" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="297795028" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2278" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="297795024" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2279" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="297795028" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2280" name="__module.roberta.encoder.layer.19.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2281" name="Constant_1974548" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="297795032" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2282" name="Convert_1974549" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2283" name="Constant_1974550" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="301989336" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2284" name="__module.roberta.encoder.layer.19.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2285" name="__module.roberta.encoder.layer.19.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2286" name="Constant_857736" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="302005720" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2287" name="__module.roberta.encoder.layer.19.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1473">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2288" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1474">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2289" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="302022104" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2290" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2291" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="302038488" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2292" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="302038492" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2293" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="302038488" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2294" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="302038492" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2295" name="__module.roberta.encoder.layer.19.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2296" name="Constant_1974552" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="302038496" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2297" name="Convert_1974553" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2298" name="Constant_1974554" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="306232800" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2299" name="__module.roberta.encoder.layer.19.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2300" name="__module.roberta.encoder.layer.19.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2301" name="Constant_857737" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="306236896" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2302" name="__module.roberta.encoder.layer.19.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1479,input.81">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2303" name="__module.roberta.encoder.layer.19.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1481">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2304" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2305" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2306" name="Constant_857738" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="306240992" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2307" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2308" name="Constant_857739" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="306245088" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2309" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1485,hidden_states.121">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2310" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="306249184" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2311" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2312" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="306253280" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2313" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="306253284" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2314" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="306253280" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2315" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="306253284" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2316" name="__module.roberta.encoder.layer.19.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2317" name="Constant_1974556" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="306253288" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2318" name="Convert_1974557" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2319" name="Constant_1974558" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="307301864" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2320" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2321" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2322" name="Constant_857740" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="307305960" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2323" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1498,x.241">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2324" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="307310056" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2325" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="307310060" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2326" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="307310056" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2327" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="307310060" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2328" name="__module.roberta.encoder.layer.20.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2329" name="__module.roberta.encoder.layer.20.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2330" name="__module.roberta.encoder.layer.20.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1502,x.243">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2331" name="Constant_847633" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1503">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2332" name="__module.roberta.encoder.layer.20.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1504">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2333" name="Constant_1974560" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="307310064" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2334" name="Convert_1974561" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2335" name="Constant_1974562" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="308358640" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2336" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2337" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2338" name="Constant_857741" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="308362736" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2339" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1507,x.245">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2340" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="308366832" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2341" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="308366836" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2342" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="308366832" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2343" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="308366836" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2344" name="__module.roberta.encoder.layer.20.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2345" name="__module.roberta.encoder.layer.20.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2346" name="__module.roberta.encoder.layer.20.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1511,x.247">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2347" name="Constant_847656" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1512">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2348" name="__module.roberta.encoder.layer.20.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1513">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2349" name="Constant_1974564" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="308366840" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2350" name="Convert_1974565" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2351" name="Constant_1974566" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="309415416" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2352" name="__module.roberta.encoder.layer.20.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2353" name="__module.roberta.encoder.layer.20.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2354" name="Constant_857742" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="309419512" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2355" name="__module.roberta.encoder.layer.20.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1516,x.249">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2356" name="__module.roberta.encoder.layer.20.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2357" name="__module.roberta.encoder.layer.20.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1520,x.251">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2358" name="Constant_847679" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1521">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2359" name="__module.roberta.encoder.layer.20.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1522">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2360" name="__module.roberta.encoder.layer.20.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1523,attn_output.81">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2361" name="__module.roberta.encoder.layer.20.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2362" name="__module.roberta.encoder.layer.20.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1524,attn_output.83">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2363" name="Constant_857998" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2364" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1526">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2365" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="309423608" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2366" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2367" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="309427704" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2368" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="309427708" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2369" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="309427704" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2370" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="309427708" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2371" name="__module.roberta.encoder.layer.20.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2372" name="Constant_1974568" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="309427712" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2373" name="Convert_1974569" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2374" name="Constant_1974570" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="310476288" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2375" name="__module.roberta.encoder.layer.20.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2376" name="__module.roberta.encoder.layer.20.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2377" name="Constant_857743" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="310480384" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2378" name="__module.roberta.encoder.layer.20.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1531,input.83">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2379" name="__module.roberta.encoder.layer.20.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1533">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2380" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2381" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2382" name="Constant_857744" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="310484480" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2383" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2384" name="Constant_857745" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="310488576" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2385" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1537,input_tensor.41">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2386" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="310492672" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2387" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2388" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="310496768" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2389" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="310496772" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2390" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="310496768" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2391" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="310496772" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2392" name="__module.roberta.encoder.layer.20.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2393" name="Constant_1974572" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="310496776" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2394" name="Convert_1974573" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2395" name="Constant_1974574" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="314691080" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2396" name="__module.roberta.encoder.layer.20.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2397" name="__module.roberta.encoder.layer.20.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2398" name="Constant_857746" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="314707464" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2399" name="__module.roberta.encoder.layer.20.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1541">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2400" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1542">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2401" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="314723848" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2402" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2403" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="314740232" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2404" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="314740236" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2405" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="314740232" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2406" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="314740236" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2407" name="__module.roberta.encoder.layer.20.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2408" name="Constant_1974576" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="314740240" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2409" name="Convert_1974577" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2410" name="Constant_1974578" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="318934544" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2411" name="__module.roberta.encoder.layer.20.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2412" name="__module.roberta.encoder.layer.20.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2413" name="Constant_857747" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="318938640" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2414" name="__module.roberta.encoder.layer.20.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1547,input.85">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2415" name="__module.roberta.encoder.layer.20.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1549">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2416" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2417" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2418" name="Constant_857748" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="318942736" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2419" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2420" name="Constant_857749" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="318946832" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2421" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1553,hidden_states.127">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2422" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="318950928" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2423" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2424" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="318955024" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2425" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="318955028" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2426" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="318955024" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2427" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="318955028" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2428" name="__module.roberta.encoder.layer.20.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2429" name="Constant_1974580" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="318955032" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2430" name="Convert_1974581" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2431" name="Constant_1974582" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="320003608" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2432" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2433" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2434" name="Constant_857750" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="320007704" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2435" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1566,x.253">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2436" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="320011800" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2437" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="320011804" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2438" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="320011800" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2439" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="320011804" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2440" name="__module.roberta.encoder.layer.21.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2441" name="__module.roberta.encoder.layer.21.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2442" name="__module.roberta.encoder.layer.21.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1570,x.255">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2443" name="Constant_847856" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1571">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2444" name="__module.roberta.encoder.layer.21.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1572">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2445" name="Constant_1974584" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="320011808" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2446" name="Convert_1974585" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2447" name="Constant_1974586" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="321060384" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2448" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2449" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2450" name="Constant_857751" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="321064480" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2451" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1575,x.257">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2452" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="321068576" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2453" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="321068580" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2454" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="321068576" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2455" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="321068580" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2456" name="__module.roberta.encoder.layer.21.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2457" name="__module.roberta.encoder.layer.21.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2458" name="__module.roberta.encoder.layer.21.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1579,x.259">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2459" name="Constant_847879" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1580">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2460" name="__module.roberta.encoder.layer.21.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1581">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2461" name="Constant_1974588" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="321068584" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2462" name="Convert_1974589" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2463" name="Constant_1974590" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="322117160" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2464" name="__module.roberta.encoder.layer.21.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2465" name="__module.roberta.encoder.layer.21.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2466" name="Constant_857752" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="322121256" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2467" name="__module.roberta.encoder.layer.21.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1584,x.261">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2468" name="__module.roberta.encoder.layer.21.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2469" name="__module.roberta.encoder.layer.21.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1588,x.263">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2470" name="Constant_847902" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1589">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2471" name="__module.roberta.encoder.layer.21.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1590">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2472" name="__module.roberta.encoder.layer.21.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1591,attn_output.85">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2473" name="__module.roberta.encoder.layer.21.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2474" name="__module.roberta.encoder.layer.21.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1592,attn_output.87">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2475" name="Constant_857999" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2476" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1594">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2477" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="322125352" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2478" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2479" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="322129448" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2480" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="322129452" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2481" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="322129448" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2482" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="322129452" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2483" name="__module.roberta.encoder.layer.21.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2484" name="Constant_1974592" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="322129456" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2485" name="Convert_1974593" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2486" name="Constant_1974594" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="323178032" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2487" name="__module.roberta.encoder.layer.21.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2488" name="__module.roberta.encoder.layer.21.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2489" name="Constant_857753" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="323182128" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2490" name="__module.roberta.encoder.layer.21.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1599,input.87">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2491" name="__module.roberta.encoder.layer.21.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1601">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2492" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2493" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2494" name="Constant_857754" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="323186224" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2495" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2496" name="Constant_857755" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="323190320" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2497" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1605,input_tensor.43">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2498" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="323194416" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2499" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2500" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="323198512" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2501" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="323198516" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2502" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="323198512" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2503" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="323198516" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2504" name="__module.roberta.encoder.layer.21.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2505" name="Constant_1974596" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="323198520" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2506" name="Convert_1974597" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2507" name="Constant_1974598" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="327392824" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2508" name="__module.roberta.encoder.layer.21.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2509" name="__module.roberta.encoder.layer.21.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2510" name="Constant_857756" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="327409208" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2511" name="__module.roberta.encoder.layer.21.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1609">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2512" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1610">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2513" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="327425592" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2514" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2515" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="327441976" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2516" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="327441980" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2517" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="327441976" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2518" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="327441980" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2519" name="__module.roberta.encoder.layer.21.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2520" name="Constant_1974600" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="327441984" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2521" name="Convert_1974601" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2522" name="Constant_1974602" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="331636288" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2523" name="__module.roberta.encoder.layer.21.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2524" name="__module.roberta.encoder.layer.21.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2525" name="Constant_857757" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="331640384" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2526" name="__module.roberta.encoder.layer.21.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1615,input.89">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2527" name="__module.roberta.encoder.layer.21.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1617">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2528" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2529" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2530" name="Constant_857758" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="331644480" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2531" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2532" name="Constant_857759" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="331648576" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2533" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1621,hidden_states.133">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2534" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="331652672" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2535" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2536" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="331656768" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2537" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="331656772" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2538" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="331656768" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2539" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="331656772" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2540" name="__module.roberta.encoder.layer.21.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2541" name="Constant_1974604" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="331656776" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2542" name="Convert_1974605" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2543" name="Constant_1974606" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="332705352" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2544" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2545" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2546" name="Constant_857760" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="332709448" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2547" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1634,x.265">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2548" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="332713544" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2549" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="332713548" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2550" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="332713544" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2551" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="332713548" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2552" name="__module.roberta.encoder.layer.22.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2553" name="__module.roberta.encoder.layer.22.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2554" name="__module.roberta.encoder.layer.22.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1638,x.267">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2555" name="Constant_848079" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1639">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2556" name="__module.roberta.encoder.layer.22.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1640">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2557" name="Constant_1974608" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="332713552" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2558" name="Convert_1974609" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2559" name="Constant_1974610" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="333762128" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2560" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2561" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2562" name="Constant_857761" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="333766224" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2563" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1643,x.269">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2564" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="333770320" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2565" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="333770324" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2566" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="333770320" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2567" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="333770324" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2568" name="__module.roberta.encoder.layer.22.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2569" name="__module.roberta.encoder.layer.22.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2570" name="__module.roberta.encoder.layer.22.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1647,x.271">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2571" name="Constant_848102" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1648">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2572" name="__module.roberta.encoder.layer.22.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1649">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2573" name="Constant_1974612" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="333770328" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2574" name="Convert_1974613" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2575" name="Constant_1974614" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="334818904" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2576" name="__module.roberta.encoder.layer.22.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2577" name="__module.roberta.encoder.layer.22.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2578" name="Constant_857762" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="334823000" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2579" name="__module.roberta.encoder.layer.22.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1652,x.273">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2580" name="__module.roberta.encoder.layer.22.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2581" name="__module.roberta.encoder.layer.22.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1656,x.275">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2582" name="Constant_848125" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1657">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2583" name="__module.roberta.encoder.layer.22.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1658">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2584" name="__module.roberta.encoder.layer.22.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1659,attn_output.89">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2585" name="__module.roberta.encoder.layer.22.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2586" name="__module.roberta.encoder.layer.22.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1660,attn_output.91">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2587" name="Constant_858000" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2588" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1662">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2589" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="334827096" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2590" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2591" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="334831192" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2592" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="334831196" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2593" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="334831192" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2594" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="334831196" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2595" name="__module.roberta.encoder.layer.22.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2596" name="Constant_1974616" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="334831200" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2597" name="Convert_1974617" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2598" name="Constant_1974618" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="335879776" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2599" name="__module.roberta.encoder.layer.22.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2600" name="__module.roberta.encoder.layer.22.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2601" name="Constant_857763" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="335883872" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2602" name="__module.roberta.encoder.layer.22.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1667,input.91">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2603" name="__module.roberta.encoder.layer.22.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1669">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2604" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2605" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2606" name="Constant_857764" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="335887968" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2607" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2608" name="Constant_857765" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="335892064" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2609" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1673,input_tensor.45">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2610" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="335896160" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2611" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2612" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="335900256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2613" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="335900260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2614" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="335900256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2615" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="335900260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2616" name="__module.roberta.encoder.layer.22.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2617" name="Constant_1974620" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="335900264" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2618" name="Convert_1974621" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2619" name="Constant_1974622" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="340094568" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2620" name="__module.roberta.encoder.layer.22.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2621" name="__module.roberta.encoder.layer.22.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2622" name="Constant_857766" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="340110952" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2623" name="__module.roberta.encoder.layer.22.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1677">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2624" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1678">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2625" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="340127336" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2626" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2627" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="340143720" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2628" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="340143724" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2629" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="340143720" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2630" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="340143724" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2631" name="__module.roberta.encoder.layer.22.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2632" name="Constant_1974624" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="340143728" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2633" name="Convert_1974625" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2634" name="Constant_1974626" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="344338032" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2635" name="__module.roberta.encoder.layer.22.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2636" name="__module.roberta.encoder.layer.22.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2637" name="Constant_857767" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="344342128" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2638" name="__module.roberta.encoder.layer.22.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1683,input.93">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2639" name="__module.roberta.encoder.layer.22.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1685">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2640" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2641" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2642" name="Constant_857768" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="344346224" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2643" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2644" name="Constant_857769" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="344350320" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2645" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1689,hidden_states.139">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2646" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="344354416" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2647" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2648" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="344358512" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2649" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="344358516" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2650" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="344358512" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2651" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="344358516" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2652" name="__module.roberta.encoder.layer.22.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2653" name="Constant_1974628" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="344358520" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2654" name="Convert_1974629" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2655" name="Constant_1974630" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="345407096" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2656" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2657" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2658" name="Constant_857770" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="345411192" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2659" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1702,x.277">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2660" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="345415288" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2661" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="345415292" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2662" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="345415288" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2663" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="345415292" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2664" name="__module.roberta.encoder.layer.23.attention.self.query/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2665" name="__module.roberta.encoder.layer.23.attention.self/prim::ListConstruct/Concat" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2666" name="__module.roberta.encoder.layer.23.attention.self/aten::view/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1706,x.279">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2667" name="Constant_848302" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1707">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2668" name="__module.roberta.encoder.layer.23.attention.self/aten::permute/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1708">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2669" name="Constant_1974632" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="345415296" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2670" name="Convert_1974633" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2671" name="Constant_1974634" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="346463872" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2672" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2673" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2674" name="Constant_857771" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="346467968" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2675" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1711,x.281">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2676" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/Add/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="346472064" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2677" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/Add/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="346472068" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2678" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/Add/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="346472064" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2679" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/Add/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="346472068" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2680" name="__module.roberta.encoder.layer.23.attention.self.key/aten::linear/Add/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2681" name="__module.roberta.encoder.layer.23.attention.self/prim::ListConstruct/Concat_1" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2682" name="__module.roberta.encoder.layer.23.attention.self/aten::view/Reshape_1" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1715,x.283">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2683" name="Constant_848325" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1716">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2684" name="__module.roberta.encoder.layer.23.attention.self/aten::permute/Transpose_1" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1717">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2685" name="Constant_1974636" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="346472072" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2686" name="Convert_1974637" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2687" name="Constant_1974638" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="347520648" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2688" name="__module.roberta.encoder.layer.23.attention.self.value/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2689" name="__module.roberta.encoder.layer.23.attention.self.value/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2690" name="Constant_857772" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="347524744" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2691" name="__module.roberta.encoder.layer.23.attention.self.value/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1720,x.285">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2692" name="__module.roberta.encoder.layer.23.attention.self/prim::ListConstruct/Concat_2" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275048" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2693" name="__module.roberta.encoder.layer.23.attention.self/aten::view/Reshape_2" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1724,x">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2694" name="Constant_848348" type="Const" version="opset1">
|
|
<data element_type="i64" shape="4" offset="53275080" size="32" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1725">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2695" name="__module.roberta.encoder.layer.23.attention.self/aten::permute/Transpose_2" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1726">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2696" name="__module.roberta.encoder.layer.23.attention.self/aten::scaled_dot_product_attention/ScaledDotProductAttention" type="ScaledDotProductAttention" version="opset13">
|
|
<data causal="false" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="3" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="4" precision="FP32" names="1727,attn_output.93">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2697" name="__module.roberta.encoder.layer.23.attention.self/aten::transpose/ScatterElementsUpdate" type="Const" version="opset1">
|
|
<data element_type="i32" shape="4" offset="55388688" size="16" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2698" name="__module.roberta.encoder.layer.23.attention.self/aten::transpose/Transpose" type="Transpose" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>-1</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>4</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1728,attn_output">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2699" name="Constant_858001" type="Const" version="opset1">
|
|
<data element_type="i64" shape="3" offset="55388704" size="24" />
|
|
<output>
|
|
<port id="0" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2700" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape" type="Reshape" version="opset1">
|
|
<data special_zero="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>16</dim>
|
|
<dim>64</dim>
|
|
</port>
|
|
<port id="1" precision="I64">
|
|
<dim>3</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1730">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2701" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="347528840" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2702" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2703" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="347532936" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2704" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="347532940" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2705" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="347532936" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2706" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="347532940" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2707" name="__module.roberta.encoder.layer.23.attention.self/aten::reshape/Reshape_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2708" name="Constant_1974640" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="347532944" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2709" name="Convert_1974641" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2710" name="Constant_1974642" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="348581520" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2711" name="__module.roberta.encoder.layer.23.attention.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2712" name="__module.roberta.encoder.layer.23.attention.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2713" name="Constant_857773" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="348585616" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2714" name="__module.roberta.encoder.layer.23.attention.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1735,input.95">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2715" name="__module.roberta.encoder.layer.23.attention.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1737">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2716" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2717" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2718" name="Constant_857774" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="348589712" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2719" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2720" name="Constant_857775" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="348593808" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2721" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1741,input_tensor">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2722" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="348597904" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2723" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2724" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="348602000" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2725" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="348602004" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2726" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="348602000" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2727" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="348602004" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2728" name="__module.roberta.encoder.layer.23.attention.output.LayerNorm/aten::layer_norm/Add_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2729" name="Constant_1974644" type="Const" version="opset1">
|
|
<data element_type="i8" shape="4096, 1024" offset="348602008" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2730" name="Convert_1974645" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2731" name="Constant_1974646" type="Const" version="opset1">
|
|
<data element_type="f32" shape="4096, 1" offset="352796312" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2732" name="__module.roberta.encoder.layer.23.intermediate.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2733" name="__module.roberta.encoder.layer.23.intermediate.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>4096</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2734" name="Constant_857776" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="352812696" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2735" name="__module.roberta.encoder.layer.23.intermediate.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1745">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2736" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu" type="Gelu" version="opset7">
|
|
<data approximation_mode="ERF" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1746">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2737" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 4096" offset="352829080" size="16384" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2738" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2739" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="352845464" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2740" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="352845468" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2741" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="352845464" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2742" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="352845468" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2743" name="__module.roberta.encoder.layer.23.intermediate.intermediate_act_fn/aten::gelu/Gelu_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2744" name="Constant_1974648" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 4096" offset="352845472" size="4194304" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2745" name="Convert_1974649" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2746" name="Constant_1974650" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="357039776" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2747" name="__module.roberta.encoder.layer.23.output.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2748" name="__module.roberta.encoder.layer.23.output.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>4096</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2749" name="Constant_857777" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="357043872" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2750" name="__module.roberta.encoder.layer.23.output.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1751,input.97">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2751" name="__module.roberta.encoder.layer.23.output/aten::add/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1753">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2752" name="__module.roberta.encoder.layer.23.output.LayerNorm/aten::layer_norm/Multiply" type="Const" version="opset1">
|
|
<data element_type="i32" shape="1" offset="52205972" size="4" />
|
|
<output>
|
|
<port id="0" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2753" name="__module.roberta.encoder.layer.23.output.LayerNorm/aten::layer_norm/MVN" type="MVN" version="opset6">
|
|
<data eps="9.9999997473787516e-06" normalize_variance="true" eps_mode="INSIDE_SQRT" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I32">
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2754" name="Constant_857778" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="357047968" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2755" name="__module.roberta.encoder.layer.23.output.LayerNorm/aten::layer_norm/Multiply_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2756" name="Constant_857779" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1, 1024" offset="357052064" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2757" name="__module.roberta.encoder.layer.23.output.LayerNorm/aten::layer_norm/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1757,1766,features">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2758" name="1762" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="51677564" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1762" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2759" name="1760" type="Const" version="opset1">
|
|
<data element_type="i64" shape="" offset="51677572" size="8" />
|
|
<output>
|
|
<port id="0" precision="I64" names="1760" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2760" name="__module.classifier/aten::select/Gather" type="Gather" version="opset8">
|
|
<data batch_dims="0" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="I64" />
|
|
<port id="2" precision="I64" />
|
|
</input>
|
|
<output>
|
|
<port id="3" precision="FP32" names="1767,1768,input.99">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2761" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1024" offset="357056160" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2762" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2763" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="357060256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2764" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="357060260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2765" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="357060256" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2766" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="357060260" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2767" name="__module.classifier/aten::select/Gather_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2768" name="Constant_1974652" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1024, 1024" offset="357060264" size="1048576" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2769" name="Convert_1974653" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2770" name="Constant_1974654" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1024, 1" offset="358108840" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2771" name="__module.classifier.dense/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2772" name="__module.classifier.dense/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1024</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2773" name="Constant_857780" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1024" offset="358112936" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2774" name="__module.classifier.dense/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="1772">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2775" name="__module.classifier/aten::tanh/Tanh" type="Tanh" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32" names="1773,input">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2776" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/scale" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1024" offset="358117032" size="4096" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2777" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2778" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/input_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="358121128" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2779" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/input_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="358121132" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2780" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/output_low" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="358121128" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2781" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0/output_high" type="Const" version="opset1">
|
|
<data element_type="f32" shape="" offset="358121132" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32" />
|
|
</output>
|
|
</layer>
|
|
<layer id="2782" name="__module.classifier/aten::tanh/Tanh_0_0/nncf_smooth_quant/fq_output_0" type="FakeQuantize" version="opset1">
|
|
<data levels="256" auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32" />
|
|
<port id="2" precision="FP32" />
|
|
<port id="3" precision="FP32" />
|
|
<port id="4" precision="FP32" />
|
|
</input>
|
|
<output>
|
|
<port id="5" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2783" name="Constant_1974656" type="Const" version="opset1">
|
|
<data element_type="i8" shape="1, 1024" offset="358121136" size="1024" />
|
|
<output>
|
|
<port id="0" precision="I8">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2784" name="Convert_1974657" type="Convert" version="opset1">
|
|
<data destination_type="f32" />
|
|
<input>
|
|
<port id="0" precision="I8">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2785" name="Constant_1974658" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1" offset="358122160" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2786" name="__module.classifier.out_proj/aten::linear/MatMul/fq_weights_1" type="Multiply" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2787" name="__module.classifier.out_proj/aten::linear/MatMul" type="MatMul" version="opset1">
|
|
<data transpose_a="false" transpose_b="true" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1024</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2788" name="Constant_857781" type="Const" version="opset1">
|
|
<data element_type="f32" shape="1, 1" offset="358122164" size="4" />
|
|
<output>
|
|
<port id="0" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2789" name="__module.classifier.out_proj/aten::linear/Add" type="Add" version="opset1">
|
|
<data auto_broadcast="numpy" />
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
<port id="1" precision="FP32">
|
|
<dim>1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
<output>
|
|
<port id="2" precision="FP32" names="logits">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</output>
|
|
</layer>
|
|
<layer id="2790" name="Result_851121" type="Result" version="opset1">
|
|
<input>
|
|
<port id="0" precision="FP32">
|
|
<dim>-1</dim>
|
|
<dim>1</dim>
|
|
</port>
|
|
</input>
|
|
</layer>
|
|
</layers>
|
|
<edges>
|
|
<edge from-layer="0" from-port="0" to-layer="101" to-port="0" />
|
|
<edge from-layer="1" from-port="0" to-layer="6" to-port="0" />
|
|
<edge from-layer="1" from-port="0" to-layer="15" to-port="0" />
|
|
<edge from-layer="1" from-port="0" to-layer="32" to-port="0" />
|
|
<edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
|
|
<edge from-layer="3" from-port="1" to-layer="5" to-port="0" />
|
|
<edge from-layer="4" from-port="0" to-layer="5" to-port="1" />
|
|
<edge from-layer="5" from-port="2" to-layer="8" to-port="0" />
|
|
<edge from-layer="6" from-port="1" to-layer="8" to-port="1" />
|
|
<edge from-layer="7" from-port="0" to-layer="8" to-port="2" />
|
|
<edge from-layer="8" from-port="3" to-layer="26" to-port="0" />
|
|
<edge from-layer="9" from-port="0" to-layer="10" to-port="0" />
|
|
<edge from-layer="10" from-port="1" to-layer="12" to-port="0" />
|
|
<edge from-layer="11" from-port="0" to-layer="12" to-port="1" />
|
|
<edge from-layer="12" from-port="2" to-layer="25" to-port="0" />
|
|
<edge from-layer="13" from-port="0" to-layer="21" to-port="0" />
|
|
<edge from-layer="14" from-port="0" to-layer="21" to-port="1" />
|
|
<edge from-layer="15" from-port="1" to-layer="106" to-port="0" />
|
|
<edge from-layer="15" from-port="1" to-layer="22" to-port="1" />
|
|
<edge from-layer="15" from-port="1" to-layer="110" to-port="0" />
|
|
<edge from-layer="15" from-port="1" to-layer="18" to-port="0" />
|
|
<edge from-layer="16" from-port="0" to-layer="18" to-port="1" />
|
|
<edge from-layer="17" from-port="0" to-layer="18" to-port="2" />
|
|
<edge from-layer="18" from-port="3" to-layer="21" to-port="2" />
|
|
<edge from-layer="19" from-port="0" to-layer="21" to-port="3" />
|
|
<edge from-layer="20" from-port="0" to-layer="21" to-port="4" />
|
|
<edge from-layer="21" from-port="5" to-layer="22" to-port="0" />
|
|
<edge from-layer="22" from-port="2" to-layer="23" to-port="0" />
|
|
<edge from-layer="23" from-port="1" to-layer="25" to-port="1" />
|
|
<edge from-layer="24" from-port="0" to-layer="25" to-port="2" />
|
|
<edge from-layer="25" from-port="3" to-layer="26" to-port="1" />
|
|
<edge from-layer="26" from-port="2" to-layer="43" to-port="0" />
|
|
<edge from-layer="27" from-port="0" to-layer="28" to-port="0" />
|
|
<edge from-layer="28" from-port="1" to-layer="30" to-port="0" />
|
|
<edge from-layer="29" from-port="0" to-layer="30" to-port="1" />
|
|
<edge from-layer="30" from-port="2" to-layer="42" to-port="0" />
|
|
<edge from-layer="31" from-port="0" to-layer="32" to-port="1" />
|
|
<edge from-layer="32" from-port="2" to-layer="33" to-port="0" />
|
|
<edge from-layer="33" from-port="1" to-layer="36" to-port="1" />
|
|
<edge from-layer="33" from-port="1" to-layer="35" to-port="0" />
|
|
<edge from-layer="34" from-port="0" to-layer="35" to-port="1" />
|
|
<edge from-layer="34" from-port="0" to-layer="101" to-port="1" />
|
|
<edge from-layer="35" from-port="2" to-layer="36" to-port="0" />
|
|
<edge from-layer="36" from-port="2" to-layer="37" to-port="0" />
|
|
<edge from-layer="37" from-port="1" to-layer="39" to-port="0" />
|
|
<edge from-layer="38" from-port="0" to-layer="39" to-port="1" />
|
|
<edge from-layer="39" from-port="2" to-layer="40" to-port="0" />
|
|
<edge from-layer="40" from-port="1" to-layer="42" to-port="1" />
|
|
<edge from-layer="41" from-port="0" to-layer="42" to-port="2" />
|
|
<edge from-layer="42" from-port="3" to-layer="43" to-port="1" />
|
|
<edge from-layer="43" from-port="2" to-layer="45" to-port="0" />
|
|
<edge from-layer="44" from-port="0" to-layer="45" to-port="1" />
|
|
<edge from-layer="45" from-port="2" to-layer="47" to-port="0" />
|
|
<edge from-layer="46" from-port="0" to-layer="47" to-port="1" />
|
|
<edge from-layer="47" from-port="2" to-layer="49" to-port="0" />
|
|
<edge from-layer="48" from-port="0" to-layer="49" to-port="1" />
|
|
<edge from-layer="49" from-port="2" to-layer="51" to-port="0" />
|
|
<edge from-layer="49" from-port="2" to-layer="139" to-port="1" />
|
|
<edge from-layer="50" from-port="0" to-layer="51" to-port="1" />
|
|
<edge from-layer="51" from-port="2" to-layer="56" to-port="0" />
|
|
<edge from-layer="52" from-port="0" to-layer="56" to-port="1" />
|
|
<edge from-layer="53" from-port="0" to-layer="56" to-port="2" />
|
|
<edge from-layer="54" from-port="0" to-layer="56" to-port="3" />
|
|
<edge from-layer="55" from-port="0" to-layer="56" to-port="4" />
|
|
<edge from-layer="56" from-port="5" to-layer="61" to-port="0" />
|
|
<edge from-layer="56" from-port="5" to-layer="77" to-port="0" />
|
|
<edge from-layer="56" from-port="5" to-layer="93" to-port="0" />
|
|
<edge from-layer="57" from-port="0" to-layer="58" to-port="0" />
|
|
<edge from-layer="58" from-port="1" to-layer="60" to-port="0" />
|
|
<edge from-layer="59" from-port="0" to-layer="60" to-port="1" />
|
|
<edge from-layer="60" from-port="2" to-layer="61" to-port="1" />
|
|
<edge from-layer="61" from-port="2" to-layer="63" to-port="0" />
|
|
<edge from-layer="62" from-port="0" to-layer="63" to-port="1" />
|
|
<edge from-layer="63" from-port="2" to-layer="68" to-port="0" />
|
|
<edge from-layer="64" from-port="0" to-layer="68" to-port="1" />
|
|
<edge from-layer="65" from-port="0" to-layer="68" to-port="2" />
|
|
<edge from-layer="66" from-port="0" to-layer="68" to-port="3" />
|
|
<edge from-layer="67" from-port="0" to-layer="68" to-port="4" />
|
|
<edge from-layer="68" from-port="5" to-layer="70" to-port="0" />
|
|
<edge from-layer="69" from-port="0" to-layer="70" to-port="1" />
|
|
<edge from-layer="70" from-port="2" to-layer="72" to-port="0" />
|
|
<edge from-layer="71" from-port="0" to-layer="72" to-port="1" />
|
|
<edge from-layer="72" from-port="2" to-layer="120" to-port="0" />
|
|
<edge from-layer="73" from-port="0" to-layer="74" to-port="0" />
|
|
<edge from-layer="74" from-port="1" to-layer="76" to-port="0" />
|
|
<edge from-layer="75" from-port="0" to-layer="76" to-port="1" />
|
|
<edge from-layer="76" from-port="2" to-layer="77" to-port="1" />
|
|
<edge from-layer="77" from-port="2" to-layer="79" to-port="0" />
|
|
<edge from-layer="78" from-port="0" to-layer="79" to-port="1" />
|
|
<edge from-layer="79" from-port="2" to-layer="84" to-port="0" />
|
|
<edge from-layer="80" from-port="0" to-layer="84" to-port="1" />
|
|
<edge from-layer="81" from-port="0" to-layer="84" to-port="2" />
|
|
<edge from-layer="82" from-port="0" to-layer="84" to-port="3" />
|
|
<edge from-layer="83" from-port="0" to-layer="84" to-port="4" />
|
|
<edge from-layer="84" from-port="5" to-layer="86" to-port="0" />
|
|
<edge from-layer="85" from-port="0" to-layer="86" to-port="1" />
|
|
<edge from-layer="86" from-port="2" to-layer="88" to-port="0" />
|
|
<edge from-layer="87" from-port="0" to-layer="88" to-port="1" />
|
|
<edge from-layer="88" from-port="2" to-layer="120" to-port="1" />
|
|
<edge from-layer="89" from-port="0" to-layer="90" to-port="0" />
|
|
<edge from-layer="90" from-port="1" to-layer="92" to-port="0" />
|
|
<edge from-layer="91" from-port="0" to-layer="92" to-port="1" />
|
|
<edge from-layer="92" from-port="2" to-layer="93" to-port="1" />
|
|
<edge from-layer="93" from-port="2" to-layer="95" to-port="0" />
|
|
<edge from-layer="94" from-port="0" to-layer="95" to-port="1" />
|
|
<edge from-layer="95" from-port="2" to-layer="97" to-port="0" />
|
|
<edge from-layer="96" from-port="0" to-layer="97" to-port="1" />
|
|
<edge from-layer="97" from-port="2" to-layer="99" to-port="0" />
|
|
<edge from-layer="98" from-port="0" to-layer="99" to-port="1" />
|
|
<edge from-layer="99" from-port="2" to-layer="120" to-port="2" />
|
|
<edge from-layer="100" from-port="0" to-layer="116" to-port="0" />
|
|
<edge from-layer="101" from-port="2" to-layer="103" to-port="0" />
|
|
<edge from-layer="102" from-port="0" to-layer="103" to-port="1" />
|
|
<edge from-layer="103" from-port="2" to-layer="112" to-port="0" />
|
|
<edge from-layer="104" from-port="0" to-layer="106" to-port="1" />
|
|
<edge from-layer="105" from-port="0" to-layer="106" to-port="2" />
|
|
<edge from-layer="106" from-port="3" to-layer="111" to-port="0" />
|
|
<edge from-layer="107" from-port="0" to-layer="111" to-port="1" />
|
|
<edge from-layer="108" from-port="0" to-layer="110" to-port="1" />
|
|
<edge from-layer="109" from-port="0" to-layer="110" to-port="2" />
|
|
<edge from-layer="110" from-port="3" to-layer="111" to-port="2" />
|
|
<edge from-layer="111" from-port="3" to-layer="112" to-port="1" />
|
|
<edge from-layer="112" from-port="2" to-layer="113" to-port="0" />
|
|
<edge from-layer="113" from-port="1" to-layer="115" to-port="0" />
|
|
<edge from-layer="114" from-port="0" to-layer="115" to-port="1" />
|
|
<edge from-layer="115" from-port="2" to-layer="116" to-port="1" />
|
|
<edge from-layer="116" from-port="2" to-layer="117" to-port="0" />
|
|
<edge from-layer="116" from-port="2" to-layer="119" to-port="2" />
|
|
<edge from-layer="117" from-port="1" to-layer="119" to-port="0" />
|
|
<edge from-layer="118" from-port="0" to-layer="119" to-port="1" />
|
|
<edge from-layer="119" from-port="3" to-layer="120" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="2024" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="2136" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="2248" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1240" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="2360" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="2696" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="232" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="2472" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="344" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="456" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="2584" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="568" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="680" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="792" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="904" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1016" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1128" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1352" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1464" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1576" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1688" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1800" to-port="3" />
|
|
<edge from-layer="119" from-port="3" to-layer="1912" to-port="3" />
|
|
<edge from-layer="120" from-port="4" to-layer="122" to-port="0" />
|
|
<edge from-layer="121" from-port="0" to-layer="122" to-port="1" />
|
|
<edge from-layer="122" from-port="2" to-layer="124" to-port="0" />
|
|
<edge from-layer="123" from-port="0" to-layer="124" to-port="1" />
|
|
<edge from-layer="124" from-port="2" to-layer="126" to-port="0" />
|
|
<edge from-layer="125" from-port="0" to-layer="126" to-port="1" />
|
|
<edge from-layer="126" from-port="2" to-layer="131" to-port="0" />
|
|
<edge from-layer="127" from-port="0" to-layer="131" to-port="1" />
|
|
<edge from-layer="128" from-port="0" to-layer="131" to-port="2" />
|
|
<edge from-layer="129" from-port="0" to-layer="131" to-port="3" />
|
|
<edge from-layer="130" from-port="0" to-layer="131" to-port="4" />
|
|
<edge from-layer="131" from-port="5" to-layer="136" to-port="0" />
|
|
<edge from-layer="132" from-port="0" to-layer="133" to-port="0" />
|
|
<edge from-layer="133" from-port="1" to-layer="135" to-port="0" />
|
|
<edge from-layer="134" from-port="0" to-layer="135" to-port="1" />
|
|
<edge from-layer="135" from-port="2" to-layer="136" to-port="1" />
|
|
<edge from-layer="136" from-port="2" to-layer="138" to-port="0" />
|
|
<edge from-layer="137" from-port="0" to-layer="138" to-port="1" />
|
|
<edge from-layer="138" from-port="2" to-layer="139" to-port="0" />
|
|
<edge from-layer="139" from-port="2" to-layer="141" to-port="0" />
|
|
<edge from-layer="140" from-port="0" to-layer="141" to-port="1" />
|
|
<edge from-layer="141" from-port="2" to-layer="143" to-port="0" />
|
|
<edge from-layer="142" from-port="0" to-layer="143" to-port="1" />
|
|
<edge from-layer="143" from-port="2" to-layer="145" to-port="0" />
|
|
<edge from-layer="144" from-port="0" to-layer="145" to-port="1" />
|
|
<edge from-layer="145" from-port="2" to-layer="147" to-port="0" />
|
|
<edge from-layer="145" from-port="2" to-layer="175" to-port="1" />
|
|
<edge from-layer="146" from-port="0" to-layer="147" to-port="1" />
|
|
<edge from-layer="147" from-port="2" to-layer="152" to-port="0" />
|
|
<edge from-layer="148" from-port="0" to-layer="152" to-port="1" />
|
|
<edge from-layer="149" from-port="0" to-layer="152" to-port="2" />
|
|
<edge from-layer="150" from-port="0" to-layer="152" to-port="3" />
|
|
<edge from-layer="151" from-port="0" to-layer="152" to-port="4" />
|
|
<edge from-layer="152" from-port="5" to-layer="157" to-port="0" />
|
|
<edge from-layer="153" from-port="0" to-layer="154" to-port="0" />
|
|
<edge from-layer="154" from-port="1" to-layer="156" to-port="0" />
|
|
<edge from-layer="155" from-port="0" to-layer="156" to-port="1" />
|
|
<edge from-layer="156" from-port="2" to-layer="157" to-port="1" />
|
|
<edge from-layer="157" from-port="2" to-layer="159" to-port="0" />
|
|
<edge from-layer="158" from-port="0" to-layer="159" to-port="1" />
|
|
<edge from-layer="159" from-port="2" to-layer="160" to-port="0" />
|
|
<edge from-layer="160" from-port="1" to-layer="162" to-port="0" />
|
|
<edge from-layer="161" from-port="0" to-layer="162" to-port="1" />
|
|
<edge from-layer="162" from-port="2" to-layer="167" to-port="0" />
|
|
<edge from-layer="163" from-port="0" to-layer="167" to-port="1" />
|
|
<edge from-layer="164" from-port="0" to-layer="167" to-port="2" />
|
|
<edge from-layer="165" from-port="0" to-layer="167" to-port="3" />
|
|
<edge from-layer="166" from-port="0" to-layer="167" to-port="4" />
|
|
<edge from-layer="167" from-port="5" to-layer="172" to-port="0" />
|
|
<edge from-layer="168" from-port="0" to-layer="169" to-port="0" />
|
|
<edge from-layer="169" from-port="1" to-layer="171" to-port="0" />
|
|
<edge from-layer="170" from-port="0" to-layer="171" to-port="1" />
|
|
<edge from-layer="171" from-port="2" to-layer="172" to-port="1" />
|
|
<edge from-layer="172" from-port="2" to-layer="174" to-port="0" />
|
|
<edge from-layer="173" from-port="0" to-layer="174" to-port="1" />
|
|
<edge from-layer="174" from-port="2" to-layer="175" to-port="0" />
|
|
<edge from-layer="175" from-port="2" to-layer="177" to-port="0" />
|
|
<edge from-layer="176" from-port="0" to-layer="177" to-port="1" />
|
|
<edge from-layer="177" from-port="2" to-layer="179" to-port="0" />
|
|
<edge from-layer="178" from-port="0" to-layer="179" to-port="1" />
|
|
<edge from-layer="179" from-port="2" to-layer="181" to-port="0" />
|
|
<edge from-layer="180" from-port="0" to-layer="181" to-port="1" />
|
|
<edge from-layer="181" from-port="2" to-layer="251" to-port="1" />
|
|
<edge from-layer="181" from-port="2" to-layer="183" to-port="0" />
|
|
<edge from-layer="182" from-port="0" to-layer="183" to-port="1" />
|
|
<edge from-layer="183" from-port="2" to-layer="188" to-port="0" />
|
|
<edge from-layer="184" from-port="0" to-layer="188" to-port="1" />
|
|
<edge from-layer="185" from-port="0" to-layer="188" to-port="2" />
|
|
<edge from-layer="186" from-port="0" to-layer="188" to-port="3" />
|
|
<edge from-layer="187" from-port="0" to-layer="188" to-port="4" />
|
|
<edge from-layer="188" from-port="5" to-layer="209" to-port="0" />
|
|
<edge from-layer="188" from-port="5" to-layer="193" to-port="0" />
|
|
<edge from-layer="188" from-port="5" to-layer="225" to-port="0" />
|
|
<edge from-layer="189" from-port="0" to-layer="190" to-port="0" />
|
|
<edge from-layer="190" from-port="1" to-layer="192" to-port="0" />
|
|
<edge from-layer="191" from-port="0" to-layer="192" to-port="1" />
|
|
<edge from-layer="192" from-port="2" to-layer="193" to-port="1" />
|
|
<edge from-layer="193" from-port="2" to-layer="195" to-port="0" />
|
|
<edge from-layer="194" from-port="0" to-layer="195" to-port="1" />
|
|
<edge from-layer="195" from-port="2" to-layer="200" to-port="0" />
|
|
<edge from-layer="196" from-port="0" to-layer="200" to-port="1" />
|
|
<edge from-layer="197" from-port="0" to-layer="200" to-port="2" />
|
|
<edge from-layer="198" from-port="0" to-layer="200" to-port="3" />
|
|
<edge from-layer="199" from-port="0" to-layer="200" to-port="4" />
|
|
<edge from-layer="200" from-port="5" to-layer="202" to-port="0" />
|
|
<edge from-layer="201" from-port="0" to-layer="202" to-port="1" />
|
|
<edge from-layer="202" from-port="2" to-layer="204" to-port="0" />
|
|
<edge from-layer="203" from-port="0" to-layer="204" to-port="1" />
|
|
<edge from-layer="204" from-port="2" to-layer="232" to-port="0" />
|
|
<edge from-layer="205" from-port="0" to-layer="206" to-port="0" />
|
|
<edge from-layer="206" from-port="1" to-layer="208" to-port="0" />
|
|
<edge from-layer="207" from-port="0" to-layer="208" to-port="1" />
|
|
<edge from-layer="208" from-port="2" to-layer="209" to-port="1" />
|
|
<edge from-layer="209" from-port="2" to-layer="211" to-port="0" />
|
|
<edge from-layer="210" from-port="0" to-layer="211" to-port="1" />
|
|
<edge from-layer="211" from-port="2" to-layer="216" to-port="0" />
|
|
<edge from-layer="212" from-port="0" to-layer="216" to-port="1" />
|
|
<edge from-layer="213" from-port="0" to-layer="216" to-port="2" />
|
|
<edge from-layer="214" from-port="0" to-layer="216" to-port="3" />
|
|
<edge from-layer="215" from-port="0" to-layer="216" to-port="4" />
|
|
<edge from-layer="216" from-port="5" to-layer="218" to-port="0" />
|
|
<edge from-layer="217" from-port="0" to-layer="218" to-port="1" />
|
|
<edge from-layer="218" from-port="2" to-layer="220" to-port="0" />
|
|
<edge from-layer="219" from-port="0" to-layer="220" to-port="1" />
|
|
<edge from-layer="220" from-port="2" to-layer="232" to-port="1" />
|
|
<edge from-layer="221" from-port="0" to-layer="222" to-port="0" />
|
|
<edge from-layer="222" from-port="1" to-layer="224" to-port="0" />
|
|
<edge from-layer="223" from-port="0" to-layer="224" to-port="1" />
|
|
<edge from-layer="224" from-port="2" to-layer="225" to-port="1" />
|
|
<edge from-layer="225" from-port="2" to-layer="227" to-port="0" />
|
|
<edge from-layer="226" from-port="0" to-layer="227" to-port="1" />
|
|
<edge from-layer="227" from-port="2" to-layer="229" to-port="0" />
|
|
<edge from-layer="228" from-port="0" to-layer="229" to-port="1" />
|
|
<edge from-layer="229" from-port="2" to-layer="231" to-port="0" />
|
|
<edge from-layer="230" from-port="0" to-layer="231" to-port="1" />
|
|
<edge from-layer="231" from-port="2" to-layer="232" to-port="2" />
|
|
<edge from-layer="232" from-port="4" to-layer="234" to-port="0" />
|
|
<edge from-layer="233" from-port="0" to-layer="234" to-port="1" />
|
|
<edge from-layer="234" from-port="2" to-layer="236" to-port="0" />
|
|
<edge from-layer="235" from-port="0" to-layer="236" to-port="1" />
|
|
<edge from-layer="236" from-port="2" to-layer="238" to-port="0" />
|
|
<edge from-layer="237" from-port="0" to-layer="238" to-port="1" />
|
|
<edge from-layer="238" from-port="2" to-layer="243" to-port="0" />
|
|
<edge from-layer="239" from-port="0" to-layer="243" to-port="1" />
|
|
<edge from-layer="240" from-port="0" to-layer="243" to-port="2" />
|
|
<edge from-layer="241" from-port="0" to-layer="243" to-port="3" />
|
|
<edge from-layer="242" from-port="0" to-layer="243" to-port="4" />
|
|
<edge from-layer="243" from-port="5" to-layer="248" to-port="0" />
|
|
<edge from-layer="244" from-port="0" to-layer="245" to-port="0" />
|
|
<edge from-layer="245" from-port="1" to-layer="247" to-port="0" />
|
|
<edge from-layer="246" from-port="0" to-layer="247" to-port="1" />
|
|
<edge from-layer="247" from-port="2" to-layer="248" to-port="1" />
|
|
<edge from-layer="248" from-port="2" to-layer="250" to-port="0" />
|
|
<edge from-layer="249" from-port="0" to-layer="250" to-port="1" />
|
|
<edge from-layer="250" from-port="2" to-layer="251" to-port="0" />
|
|
<edge from-layer="251" from-port="2" to-layer="253" to-port="0" />
|
|
<edge from-layer="252" from-port="0" to-layer="253" to-port="1" />
|
|
<edge from-layer="253" from-port="2" to-layer="255" to-port="0" />
|
|
<edge from-layer="254" from-port="0" to-layer="255" to-port="1" />
|
|
<edge from-layer="255" from-port="2" to-layer="257" to-port="0" />
|
|
<edge from-layer="256" from-port="0" to-layer="257" to-port="1" />
|
|
<edge from-layer="257" from-port="2" to-layer="259" to-port="0" />
|
|
<edge from-layer="257" from-port="2" to-layer="287" to-port="1" />
|
|
<edge from-layer="258" from-port="0" to-layer="259" to-port="1" />
|
|
<edge from-layer="259" from-port="2" to-layer="264" to-port="0" />
|
|
<edge from-layer="260" from-port="0" to-layer="264" to-port="1" />
|
|
<edge from-layer="261" from-port="0" to-layer="264" to-port="2" />
|
|
<edge from-layer="262" from-port="0" to-layer="264" to-port="3" />
|
|
<edge from-layer="263" from-port="0" to-layer="264" to-port="4" />
|
|
<edge from-layer="264" from-port="5" to-layer="269" to-port="0" />
|
|
<edge from-layer="265" from-port="0" to-layer="266" to-port="0" />
|
|
<edge from-layer="266" from-port="1" to-layer="268" to-port="0" />
|
|
<edge from-layer="267" from-port="0" to-layer="268" to-port="1" />
|
|
<edge from-layer="268" from-port="2" to-layer="269" to-port="1" />
|
|
<edge from-layer="269" from-port="2" to-layer="271" to-port="0" />
|
|
<edge from-layer="270" from-port="0" to-layer="271" to-port="1" />
|
|
<edge from-layer="271" from-port="2" to-layer="272" to-port="0" />
|
|
<edge from-layer="272" from-port="1" to-layer="274" to-port="0" />
|
|
<edge from-layer="273" from-port="0" to-layer="274" to-port="1" />
|
|
<edge from-layer="274" from-port="2" to-layer="279" to-port="0" />
|
|
<edge from-layer="275" from-port="0" to-layer="279" to-port="1" />
|
|
<edge from-layer="276" from-port="0" to-layer="279" to-port="2" />
|
|
<edge from-layer="277" from-port="0" to-layer="279" to-port="3" />
|
|
<edge from-layer="278" from-port="0" to-layer="279" to-port="4" />
|
|
<edge from-layer="279" from-port="5" to-layer="284" to-port="0" />
|
|
<edge from-layer="280" from-port="0" to-layer="281" to-port="0" />
|
|
<edge from-layer="281" from-port="1" to-layer="283" to-port="0" />
|
|
<edge from-layer="282" from-port="0" to-layer="283" to-port="1" />
|
|
<edge from-layer="283" from-port="2" to-layer="284" to-port="1" />
|
|
<edge from-layer="284" from-port="2" to-layer="286" to-port="0" />
|
|
<edge from-layer="285" from-port="0" to-layer="286" to-port="1" />
|
|
<edge from-layer="286" from-port="2" to-layer="287" to-port="0" />
|
|
<edge from-layer="287" from-port="2" to-layer="289" to-port="0" />
|
|
<edge from-layer="288" from-port="0" to-layer="289" to-port="1" />
|
|
<edge from-layer="289" from-port="2" to-layer="291" to-port="0" />
|
|
<edge from-layer="290" from-port="0" to-layer="291" to-port="1" />
|
|
<edge from-layer="291" from-port="2" to-layer="293" to-port="0" />
|
|
<edge from-layer="292" from-port="0" to-layer="293" to-port="1" />
|
|
<edge from-layer="293" from-port="2" to-layer="363" to-port="1" />
|
|
<edge from-layer="293" from-port="2" to-layer="295" to-port="0" />
|
|
<edge from-layer="294" from-port="0" to-layer="295" to-port="1" />
|
|
<edge from-layer="295" from-port="2" to-layer="300" to-port="0" />
|
|
<edge from-layer="296" from-port="0" to-layer="300" to-port="1" />
|
|
<edge from-layer="297" from-port="0" to-layer="300" to-port="2" />
|
|
<edge from-layer="298" from-port="0" to-layer="300" to-port="3" />
|
|
<edge from-layer="299" from-port="0" to-layer="300" to-port="4" />
|
|
<edge from-layer="300" from-port="5" to-layer="321" to-port="0" />
|
|
<edge from-layer="300" from-port="5" to-layer="337" to-port="0" />
|
|
<edge from-layer="300" from-port="5" to-layer="305" to-port="0" />
|
|
<edge from-layer="301" from-port="0" to-layer="302" to-port="0" />
|
|
<edge from-layer="302" from-port="1" to-layer="304" to-port="0" />
|
|
<edge from-layer="303" from-port="0" to-layer="304" to-port="1" />
|
|
<edge from-layer="304" from-port="2" to-layer="305" to-port="1" />
|
|
<edge from-layer="305" from-port="2" to-layer="307" to-port="0" />
|
|
<edge from-layer="306" from-port="0" to-layer="307" to-port="1" />
|
|
<edge from-layer="307" from-port="2" to-layer="312" to-port="0" />
|
|
<edge from-layer="308" from-port="0" to-layer="312" to-port="1" />
|
|
<edge from-layer="309" from-port="0" to-layer="312" to-port="2" />
|
|
<edge from-layer="310" from-port="0" to-layer="312" to-port="3" />
|
|
<edge from-layer="311" from-port="0" to-layer="312" to-port="4" />
|
|
<edge from-layer="312" from-port="5" to-layer="314" to-port="0" />
|
|
<edge from-layer="313" from-port="0" to-layer="314" to-port="1" />
|
|
<edge from-layer="314" from-port="2" to-layer="316" to-port="0" />
|
|
<edge from-layer="315" from-port="0" to-layer="316" to-port="1" />
|
|
<edge from-layer="316" from-port="2" to-layer="344" to-port="0" />
|
|
<edge from-layer="317" from-port="0" to-layer="318" to-port="0" />
|
|
<edge from-layer="318" from-port="1" to-layer="320" to-port="0" />
|
|
<edge from-layer="319" from-port="0" to-layer="320" to-port="1" />
|
|
<edge from-layer="320" from-port="2" to-layer="321" to-port="1" />
|
|
<edge from-layer="321" from-port="2" to-layer="323" to-port="0" />
|
|
<edge from-layer="322" from-port="0" to-layer="323" to-port="1" />
|
|
<edge from-layer="323" from-port="2" to-layer="328" to-port="0" />
|
|
<edge from-layer="324" from-port="0" to-layer="328" to-port="1" />
|
|
<edge from-layer="325" from-port="0" to-layer="328" to-port="2" />
|
|
<edge from-layer="326" from-port="0" to-layer="328" to-port="3" />
|
|
<edge from-layer="327" from-port="0" to-layer="328" to-port="4" />
|
|
<edge from-layer="328" from-port="5" to-layer="330" to-port="0" />
|
|
<edge from-layer="329" from-port="0" to-layer="330" to-port="1" />
|
|
<edge from-layer="330" from-port="2" to-layer="332" to-port="0" />
|
|
<edge from-layer="331" from-port="0" to-layer="332" to-port="1" />
|
|
<edge from-layer="332" from-port="2" to-layer="344" to-port="1" />
|
|
<edge from-layer="333" from-port="0" to-layer="334" to-port="0" />
|
|
<edge from-layer="334" from-port="1" to-layer="336" to-port="0" />
|
|
<edge from-layer="335" from-port="0" to-layer="336" to-port="1" />
|
|
<edge from-layer="336" from-port="2" to-layer="337" to-port="1" />
|
|
<edge from-layer="337" from-port="2" to-layer="339" to-port="0" />
|
|
<edge from-layer="338" from-port="0" to-layer="339" to-port="1" />
|
|
<edge from-layer="339" from-port="2" to-layer="341" to-port="0" />
|
|
<edge from-layer="340" from-port="0" to-layer="341" to-port="1" />
|
|
<edge from-layer="341" from-port="2" to-layer="343" to-port="0" />
|
|
<edge from-layer="342" from-port="0" to-layer="343" to-port="1" />
|
|
<edge from-layer="343" from-port="2" to-layer="344" to-port="2" />
|
|
<edge from-layer="344" from-port="4" to-layer="346" to-port="0" />
|
|
<edge from-layer="345" from-port="0" to-layer="346" to-port="1" />
|
|
<edge from-layer="346" from-port="2" to-layer="348" to-port="0" />
|
|
<edge from-layer="347" from-port="0" to-layer="348" to-port="1" />
|
|
<edge from-layer="348" from-port="2" to-layer="350" to-port="0" />
|
|
<edge from-layer="349" from-port="0" to-layer="350" to-port="1" />
|
|
<edge from-layer="350" from-port="2" to-layer="355" to-port="0" />
|
|
<edge from-layer="351" from-port="0" to-layer="355" to-port="1" />
|
|
<edge from-layer="352" from-port="0" to-layer="355" to-port="2" />
|
|
<edge from-layer="353" from-port="0" to-layer="355" to-port="3" />
|
|
<edge from-layer="354" from-port="0" to-layer="355" to-port="4" />
|
|
<edge from-layer="355" from-port="5" to-layer="360" to-port="0" />
|
|
<edge from-layer="356" from-port="0" to-layer="357" to-port="0" />
|
|
<edge from-layer="357" from-port="1" to-layer="359" to-port="0" />
|
|
<edge from-layer="358" from-port="0" to-layer="359" to-port="1" />
|
|
<edge from-layer="359" from-port="2" to-layer="360" to-port="1" />
|
|
<edge from-layer="360" from-port="2" to-layer="362" to-port="0" />
|
|
<edge from-layer="361" from-port="0" to-layer="362" to-port="1" />
|
|
<edge from-layer="362" from-port="2" to-layer="363" to-port="0" />
|
|
<edge from-layer="363" from-port="2" to-layer="365" to-port="0" />
|
|
<edge from-layer="364" from-port="0" to-layer="365" to-port="1" />
|
|
<edge from-layer="365" from-port="2" to-layer="367" to-port="0" />
|
|
<edge from-layer="366" from-port="0" to-layer="367" to-port="1" />
|
|
<edge from-layer="367" from-port="2" to-layer="369" to-port="0" />
|
|
<edge from-layer="368" from-port="0" to-layer="369" to-port="1" />
|
|
<edge from-layer="369" from-port="2" to-layer="399" to-port="1" />
|
|
<edge from-layer="369" from-port="2" to-layer="371" to-port="0" />
|
|
<edge from-layer="370" from-port="0" to-layer="371" to-port="1" />
|
|
<edge from-layer="371" from-port="2" to-layer="376" to-port="0" />
|
|
<edge from-layer="372" from-port="0" to-layer="376" to-port="1" />
|
|
<edge from-layer="373" from-port="0" to-layer="376" to-port="2" />
|
|
<edge from-layer="374" from-port="0" to-layer="376" to-port="3" />
|
|
<edge from-layer="375" from-port="0" to-layer="376" to-port="4" />
|
|
<edge from-layer="376" from-port="5" to-layer="381" to-port="0" />
|
|
<edge from-layer="377" from-port="0" to-layer="378" to-port="0" />
|
|
<edge from-layer="378" from-port="1" to-layer="380" to-port="0" />
|
|
<edge from-layer="379" from-port="0" to-layer="380" to-port="1" />
|
|
<edge from-layer="380" from-port="2" to-layer="381" to-port="1" />
|
|
<edge from-layer="381" from-port="2" to-layer="383" to-port="0" />
|
|
<edge from-layer="382" from-port="0" to-layer="383" to-port="1" />
|
|
<edge from-layer="383" from-port="2" to-layer="384" to-port="0" />
|
|
<edge from-layer="384" from-port="1" to-layer="386" to-port="0" />
|
|
<edge from-layer="385" from-port="0" to-layer="386" to-port="1" />
|
|
<edge from-layer="386" from-port="2" to-layer="391" to-port="0" />
|
|
<edge from-layer="387" from-port="0" to-layer="391" to-port="1" />
|
|
<edge from-layer="388" from-port="0" to-layer="391" to-port="2" />
|
|
<edge from-layer="389" from-port="0" to-layer="391" to-port="3" />
|
|
<edge from-layer="390" from-port="0" to-layer="391" to-port="4" />
|
|
<edge from-layer="391" from-port="5" to-layer="396" to-port="0" />
|
|
<edge from-layer="392" from-port="0" to-layer="393" to-port="0" />
|
|
<edge from-layer="393" from-port="1" to-layer="395" to-port="0" />
|
|
<edge from-layer="394" from-port="0" to-layer="395" to-port="1" />
|
|
<edge from-layer="395" from-port="2" to-layer="396" to-port="1" />
|
|
<edge from-layer="396" from-port="2" to-layer="398" to-port="0" />
|
|
<edge from-layer="397" from-port="0" to-layer="398" to-port="1" />
|
|
<edge from-layer="398" from-port="2" to-layer="399" to-port="0" />
|
|
<edge from-layer="399" from-port="2" to-layer="401" to-port="0" />
|
|
<edge from-layer="400" from-port="0" to-layer="401" to-port="1" />
|
|
<edge from-layer="401" from-port="2" to-layer="403" to-port="0" />
|
|
<edge from-layer="402" from-port="0" to-layer="403" to-port="1" />
|
|
<edge from-layer="403" from-port="2" to-layer="405" to-port="0" />
|
|
<edge from-layer="404" from-port="0" to-layer="405" to-port="1" />
|
|
<edge from-layer="405" from-port="2" to-layer="407" to-port="0" />
|
|
<edge from-layer="405" from-port="2" to-layer="475" to-port="1" />
|
|
<edge from-layer="406" from-port="0" to-layer="407" to-port="1" />
|
|
<edge from-layer="407" from-port="2" to-layer="412" to-port="0" />
|
|
<edge from-layer="408" from-port="0" to-layer="412" to-port="1" />
|
|
<edge from-layer="409" from-port="0" to-layer="412" to-port="2" />
|
|
<edge from-layer="410" from-port="0" to-layer="412" to-port="3" />
|
|
<edge from-layer="411" from-port="0" to-layer="412" to-port="4" />
|
|
<edge from-layer="412" from-port="5" to-layer="417" to-port="0" />
|
|
<edge from-layer="412" from-port="5" to-layer="433" to-port="0" />
|
|
<edge from-layer="412" from-port="5" to-layer="449" to-port="0" />
|
|
<edge from-layer="413" from-port="0" to-layer="414" to-port="0" />
|
|
<edge from-layer="414" from-port="1" to-layer="416" to-port="0" />
|
|
<edge from-layer="415" from-port="0" to-layer="416" to-port="1" />
|
|
<edge from-layer="416" from-port="2" to-layer="417" to-port="1" />
|
|
<edge from-layer="417" from-port="2" to-layer="419" to-port="0" />
|
|
<edge from-layer="418" from-port="0" to-layer="419" to-port="1" />
|
|
<edge from-layer="419" from-port="2" to-layer="424" to-port="0" />
|
|
<edge from-layer="420" from-port="0" to-layer="424" to-port="1" />
|
|
<edge from-layer="421" from-port="0" to-layer="424" to-port="2" />
|
|
<edge from-layer="422" from-port="0" to-layer="424" to-port="3" />
|
|
<edge from-layer="423" from-port="0" to-layer="424" to-port="4" />
|
|
<edge from-layer="424" from-port="5" to-layer="426" to-port="0" />
|
|
<edge from-layer="425" from-port="0" to-layer="426" to-port="1" />
|
|
<edge from-layer="426" from-port="2" to-layer="428" to-port="0" />
|
|
<edge from-layer="427" from-port="0" to-layer="428" to-port="1" />
|
|
<edge from-layer="428" from-port="2" to-layer="456" to-port="0" />
|
|
<edge from-layer="429" from-port="0" to-layer="430" to-port="0" />
|
|
<edge from-layer="430" from-port="1" to-layer="432" to-port="0" />
|
|
<edge from-layer="431" from-port="0" to-layer="432" to-port="1" />
|
|
<edge from-layer="432" from-port="2" to-layer="433" to-port="1" />
|
|
<edge from-layer="433" from-port="2" to-layer="435" to-port="0" />
|
|
<edge from-layer="434" from-port="0" to-layer="435" to-port="1" />
|
|
<edge from-layer="435" from-port="2" to-layer="440" to-port="0" />
|
|
<edge from-layer="436" from-port="0" to-layer="440" to-port="1" />
|
|
<edge from-layer="437" from-port="0" to-layer="440" to-port="2" />
|
|
<edge from-layer="438" from-port="0" to-layer="440" to-port="3" />
|
|
<edge from-layer="439" from-port="0" to-layer="440" to-port="4" />
|
|
<edge from-layer="440" from-port="5" to-layer="442" to-port="0" />
|
|
<edge from-layer="441" from-port="0" to-layer="442" to-port="1" />
|
|
<edge from-layer="442" from-port="2" to-layer="444" to-port="0" />
|
|
<edge from-layer="443" from-port="0" to-layer="444" to-port="1" />
|
|
<edge from-layer="444" from-port="2" to-layer="456" to-port="1" />
|
|
<edge from-layer="445" from-port="0" to-layer="446" to-port="0" />
|
|
<edge from-layer="446" from-port="1" to-layer="448" to-port="0" />
|
|
<edge from-layer="447" from-port="0" to-layer="448" to-port="1" />
|
|
<edge from-layer="448" from-port="2" to-layer="449" to-port="1" />
|
|
<edge from-layer="449" from-port="2" to-layer="451" to-port="0" />
|
|
<edge from-layer="450" from-port="0" to-layer="451" to-port="1" />
|
|
<edge from-layer="451" from-port="2" to-layer="453" to-port="0" />
|
|
<edge from-layer="452" from-port="0" to-layer="453" to-port="1" />
|
|
<edge from-layer="453" from-port="2" to-layer="455" to-port="0" />
|
|
<edge from-layer="454" from-port="0" to-layer="455" to-port="1" />
|
|
<edge from-layer="455" from-port="2" to-layer="456" to-port="2" />
|
|
<edge from-layer="456" from-port="4" to-layer="458" to-port="0" />
|
|
<edge from-layer="457" from-port="0" to-layer="458" to-port="1" />
|
|
<edge from-layer="458" from-port="2" to-layer="460" to-port="0" />
|
|
<edge from-layer="459" from-port="0" to-layer="460" to-port="1" />
|
|
<edge from-layer="460" from-port="2" to-layer="462" to-port="0" />
|
|
<edge from-layer="461" from-port="0" to-layer="462" to-port="1" />
|
|
<edge from-layer="462" from-port="2" to-layer="467" to-port="0" />
|
|
<edge from-layer="463" from-port="0" to-layer="467" to-port="1" />
|
|
<edge from-layer="464" from-port="0" to-layer="467" to-port="2" />
|
|
<edge from-layer="465" from-port="0" to-layer="467" to-port="3" />
|
|
<edge from-layer="466" from-port="0" to-layer="467" to-port="4" />
|
|
<edge from-layer="467" from-port="5" to-layer="472" to-port="0" />
|
|
<edge from-layer="468" from-port="0" to-layer="469" to-port="0" />
|
|
<edge from-layer="469" from-port="1" to-layer="471" to-port="0" />
|
|
<edge from-layer="470" from-port="0" to-layer="471" to-port="1" />
|
|
<edge from-layer="471" from-port="2" to-layer="472" to-port="1" />
|
|
<edge from-layer="472" from-port="2" to-layer="474" to-port="0" />
|
|
<edge from-layer="473" from-port="0" to-layer="474" to-port="1" />
|
|
<edge from-layer="474" from-port="2" to-layer="475" to-port="0" />
|
|
<edge from-layer="475" from-port="2" to-layer="477" to-port="0" />
|
|
<edge from-layer="476" from-port="0" to-layer="477" to-port="1" />
|
|
<edge from-layer="477" from-port="2" to-layer="479" to-port="0" />
|
|
<edge from-layer="478" from-port="0" to-layer="479" to-port="1" />
|
|
<edge from-layer="479" from-port="2" to-layer="481" to-port="0" />
|
|
<edge from-layer="480" from-port="0" to-layer="481" to-port="1" />
|
|
<edge from-layer="481" from-port="2" to-layer="511" to-port="1" />
|
|
<edge from-layer="481" from-port="2" to-layer="483" to-port="0" />
|
|
<edge from-layer="482" from-port="0" to-layer="483" to-port="1" />
|
|
<edge from-layer="483" from-port="2" to-layer="488" to-port="0" />
|
|
<edge from-layer="484" from-port="0" to-layer="488" to-port="1" />
|
|
<edge from-layer="485" from-port="0" to-layer="488" to-port="2" />
|
|
<edge from-layer="486" from-port="0" to-layer="488" to-port="3" />
|
|
<edge from-layer="487" from-port="0" to-layer="488" to-port="4" />
|
|
<edge from-layer="488" from-port="5" to-layer="493" to-port="0" />
|
|
<edge from-layer="489" from-port="0" to-layer="490" to-port="0" />
|
|
<edge from-layer="490" from-port="1" to-layer="492" to-port="0" />
|
|
<edge from-layer="491" from-port="0" to-layer="492" to-port="1" />
|
|
<edge from-layer="492" from-port="2" to-layer="493" to-port="1" />
|
|
<edge from-layer="493" from-port="2" to-layer="495" to-port="0" />
|
|
<edge from-layer="494" from-port="0" to-layer="495" to-port="1" />
|
|
<edge from-layer="495" from-port="2" to-layer="496" to-port="0" />
|
|
<edge from-layer="496" from-port="1" to-layer="498" to-port="0" />
|
|
<edge from-layer="497" from-port="0" to-layer="498" to-port="1" />
|
|
<edge from-layer="498" from-port="2" to-layer="503" to-port="0" />
|
|
<edge from-layer="499" from-port="0" to-layer="503" to-port="1" />
|
|
<edge from-layer="500" from-port="0" to-layer="503" to-port="2" />
|
|
<edge from-layer="501" from-port="0" to-layer="503" to-port="3" />
|
|
<edge from-layer="502" from-port="0" to-layer="503" to-port="4" />
|
|
<edge from-layer="503" from-port="5" to-layer="508" to-port="0" />
|
|
<edge from-layer="504" from-port="0" to-layer="505" to-port="0" />
|
|
<edge from-layer="505" from-port="1" to-layer="507" to-port="0" />
|
|
<edge from-layer="506" from-port="0" to-layer="507" to-port="1" />
|
|
<edge from-layer="507" from-port="2" to-layer="508" to-port="1" />
|
|
<edge from-layer="508" from-port="2" to-layer="510" to-port="0" />
|
|
<edge from-layer="509" from-port="0" to-layer="510" to-port="1" />
|
|
<edge from-layer="510" from-port="2" to-layer="511" to-port="0" />
|
|
<edge from-layer="511" from-port="2" to-layer="513" to-port="0" />
|
|
<edge from-layer="512" from-port="0" to-layer="513" to-port="1" />
|
|
<edge from-layer="513" from-port="2" to-layer="515" to-port="0" />
|
|
<edge from-layer="514" from-port="0" to-layer="515" to-port="1" />
|
|
<edge from-layer="515" from-port="2" to-layer="517" to-port="0" />
|
|
<edge from-layer="516" from-port="0" to-layer="517" to-port="1" />
|
|
<edge from-layer="517" from-port="2" to-layer="587" to-port="1" />
|
|
<edge from-layer="517" from-port="2" to-layer="519" to-port="0" />
|
|
<edge from-layer="518" from-port="0" to-layer="519" to-port="1" />
|
|
<edge from-layer="519" from-port="2" to-layer="524" to-port="0" />
|
|
<edge from-layer="520" from-port="0" to-layer="524" to-port="1" />
|
|
<edge from-layer="521" from-port="0" to-layer="524" to-port="2" />
|
|
<edge from-layer="522" from-port="0" to-layer="524" to-port="3" />
|
|
<edge from-layer="523" from-port="0" to-layer="524" to-port="4" />
|
|
<edge from-layer="524" from-port="5" to-layer="529" to-port="0" />
|
|
<edge from-layer="524" from-port="5" to-layer="545" to-port="0" />
|
|
<edge from-layer="524" from-port="5" to-layer="561" to-port="0" />
|
|
<edge from-layer="525" from-port="0" to-layer="526" to-port="0" />
|
|
<edge from-layer="526" from-port="1" to-layer="528" to-port="0" />
|
|
<edge from-layer="527" from-port="0" to-layer="528" to-port="1" />
|
|
<edge from-layer="528" from-port="2" to-layer="529" to-port="1" />
|
|
<edge from-layer="529" from-port="2" to-layer="531" to-port="0" />
|
|
<edge from-layer="530" from-port="0" to-layer="531" to-port="1" />
|
|
<edge from-layer="531" from-port="2" to-layer="536" to-port="0" />
|
|
<edge from-layer="532" from-port="0" to-layer="536" to-port="1" />
|
|
<edge from-layer="533" from-port="0" to-layer="536" to-port="2" />
|
|
<edge from-layer="534" from-port="0" to-layer="536" to-port="3" />
|
|
<edge from-layer="535" from-port="0" to-layer="536" to-port="4" />
|
|
<edge from-layer="536" from-port="5" to-layer="538" to-port="0" />
|
|
<edge from-layer="537" from-port="0" to-layer="538" to-port="1" />
|
|
<edge from-layer="538" from-port="2" to-layer="540" to-port="0" />
|
|
<edge from-layer="539" from-port="0" to-layer="540" to-port="1" />
|
|
<edge from-layer="540" from-port="2" to-layer="568" to-port="0" />
|
|
<edge from-layer="541" from-port="0" to-layer="542" to-port="0" />
|
|
<edge from-layer="542" from-port="1" to-layer="544" to-port="0" />
|
|
<edge from-layer="543" from-port="0" to-layer="544" to-port="1" />
|
|
<edge from-layer="544" from-port="2" to-layer="545" to-port="1" />
|
|
<edge from-layer="545" from-port="2" to-layer="547" to-port="0" />
|
|
<edge from-layer="546" from-port="0" to-layer="547" to-port="1" />
|
|
<edge from-layer="547" from-port="2" to-layer="552" to-port="0" />
|
|
<edge from-layer="548" from-port="0" to-layer="552" to-port="1" />
|
|
<edge from-layer="549" from-port="0" to-layer="552" to-port="2" />
|
|
<edge from-layer="550" from-port="0" to-layer="552" to-port="3" />
|
|
<edge from-layer="551" from-port="0" to-layer="552" to-port="4" />
|
|
<edge from-layer="552" from-port="5" to-layer="554" to-port="0" />
|
|
<edge from-layer="553" from-port="0" to-layer="554" to-port="1" />
|
|
<edge from-layer="554" from-port="2" to-layer="556" to-port="0" />
|
|
<edge from-layer="555" from-port="0" to-layer="556" to-port="1" />
|
|
<edge from-layer="556" from-port="2" to-layer="568" to-port="1" />
|
|
<edge from-layer="557" from-port="0" to-layer="558" to-port="0" />
|
|
<edge from-layer="558" from-port="1" to-layer="560" to-port="0" />
|
|
<edge from-layer="559" from-port="0" to-layer="560" to-port="1" />
|
|
<edge from-layer="560" from-port="2" to-layer="561" to-port="1" />
|
|
<edge from-layer="561" from-port="2" to-layer="563" to-port="0" />
|
|
<edge from-layer="562" from-port="0" to-layer="563" to-port="1" />
|
|
<edge from-layer="563" from-port="2" to-layer="565" to-port="0" />
|
|
<edge from-layer="564" from-port="0" to-layer="565" to-port="1" />
|
|
<edge from-layer="565" from-port="2" to-layer="567" to-port="0" />
|
|
<edge from-layer="566" from-port="0" to-layer="567" to-port="1" />
|
|
<edge from-layer="567" from-port="2" to-layer="568" to-port="2" />
|
|
<edge from-layer="568" from-port="4" to-layer="570" to-port="0" />
|
|
<edge from-layer="569" from-port="0" to-layer="570" to-port="1" />
|
|
<edge from-layer="570" from-port="2" to-layer="572" to-port="0" />
|
|
<edge from-layer="571" from-port="0" to-layer="572" to-port="1" />
|
|
<edge from-layer="572" from-port="2" to-layer="574" to-port="0" />
|
|
<edge from-layer="573" from-port="0" to-layer="574" to-port="1" />
|
|
<edge from-layer="574" from-port="2" to-layer="579" to-port="0" />
|
|
<edge from-layer="575" from-port="0" to-layer="579" to-port="1" />
|
|
<edge from-layer="576" from-port="0" to-layer="579" to-port="2" />
|
|
<edge from-layer="577" from-port="0" to-layer="579" to-port="3" />
|
|
<edge from-layer="578" from-port="0" to-layer="579" to-port="4" />
|
|
<edge from-layer="579" from-port="5" to-layer="584" to-port="0" />
|
|
<edge from-layer="580" from-port="0" to-layer="581" to-port="0" />
|
|
<edge from-layer="581" from-port="1" to-layer="583" to-port="0" />
|
|
<edge from-layer="582" from-port="0" to-layer="583" to-port="1" />
|
|
<edge from-layer="583" from-port="2" to-layer="584" to-port="1" />
|
|
<edge from-layer="584" from-port="2" to-layer="586" to-port="0" />
|
|
<edge from-layer="585" from-port="0" to-layer="586" to-port="1" />
|
|
<edge from-layer="586" from-port="2" to-layer="587" to-port="0" />
|
|
<edge from-layer="587" from-port="2" to-layer="589" to-port="0" />
|
|
<edge from-layer="588" from-port="0" to-layer="589" to-port="1" />
|
|
<edge from-layer="589" from-port="2" to-layer="591" to-port="0" />
|
|
<edge from-layer="590" from-port="0" to-layer="591" to-port="1" />
|
|
<edge from-layer="591" from-port="2" to-layer="593" to-port="0" />
|
|
<edge from-layer="592" from-port="0" to-layer="593" to-port="1" />
|
|
<edge from-layer="593" from-port="2" to-layer="595" to-port="0" />
|
|
<edge from-layer="593" from-port="2" to-layer="623" to-port="1" />
|
|
<edge from-layer="594" from-port="0" to-layer="595" to-port="1" />
|
|
<edge from-layer="595" from-port="2" to-layer="600" to-port="0" />
|
|
<edge from-layer="596" from-port="0" to-layer="600" to-port="1" />
|
|
<edge from-layer="597" from-port="0" to-layer="600" to-port="2" />
|
|
<edge from-layer="598" from-port="0" to-layer="600" to-port="3" />
|
|
<edge from-layer="599" from-port="0" to-layer="600" to-port="4" />
|
|
<edge from-layer="600" from-port="5" to-layer="605" to-port="0" />
|
|
<edge from-layer="601" from-port="0" to-layer="602" to-port="0" />
|
|
<edge from-layer="602" from-port="1" to-layer="604" to-port="0" />
|
|
<edge from-layer="603" from-port="0" to-layer="604" to-port="1" />
|
|
<edge from-layer="604" from-port="2" to-layer="605" to-port="1" />
|
|
<edge from-layer="605" from-port="2" to-layer="607" to-port="0" />
|
|
<edge from-layer="606" from-port="0" to-layer="607" to-port="1" />
|
|
<edge from-layer="607" from-port="2" to-layer="608" to-port="0" />
|
|
<edge from-layer="608" from-port="1" to-layer="610" to-port="0" />
|
|
<edge from-layer="609" from-port="0" to-layer="610" to-port="1" />
|
|
<edge from-layer="610" from-port="2" to-layer="615" to-port="0" />
|
|
<edge from-layer="611" from-port="0" to-layer="615" to-port="1" />
|
|
<edge from-layer="612" from-port="0" to-layer="615" to-port="2" />
|
|
<edge from-layer="613" from-port="0" to-layer="615" to-port="3" />
|
|
<edge from-layer="614" from-port="0" to-layer="615" to-port="4" />
|
|
<edge from-layer="615" from-port="5" to-layer="620" to-port="0" />
|
|
<edge from-layer="616" from-port="0" to-layer="617" to-port="0" />
|
|
<edge from-layer="617" from-port="1" to-layer="619" to-port="0" />
|
|
<edge from-layer="618" from-port="0" to-layer="619" to-port="1" />
|
|
<edge from-layer="619" from-port="2" to-layer="620" to-port="1" />
|
|
<edge from-layer="620" from-port="2" to-layer="622" to-port="0" />
|
|
<edge from-layer="621" from-port="0" to-layer="622" to-port="1" />
|
|
<edge from-layer="622" from-port="2" to-layer="623" to-port="0" />
|
|
<edge from-layer="623" from-port="2" to-layer="625" to-port="0" />
|
|
<edge from-layer="624" from-port="0" to-layer="625" to-port="1" />
|
|
<edge from-layer="625" from-port="2" to-layer="627" to-port="0" />
|
|
<edge from-layer="626" from-port="0" to-layer="627" to-port="1" />
|
|
<edge from-layer="627" from-port="2" to-layer="629" to-port="0" />
|
|
<edge from-layer="628" from-port="0" to-layer="629" to-port="1" />
|
|
<edge from-layer="629" from-port="2" to-layer="699" to-port="1" />
|
|
<edge from-layer="629" from-port="2" to-layer="631" to-port="0" />
|
|
<edge from-layer="630" from-port="0" to-layer="631" to-port="1" />
|
|
<edge from-layer="631" from-port="2" to-layer="636" to-port="0" />
|
|
<edge from-layer="632" from-port="0" to-layer="636" to-port="1" />
|
|
<edge from-layer="633" from-port="0" to-layer="636" to-port="2" />
|
|
<edge from-layer="634" from-port="0" to-layer="636" to-port="3" />
|
|
<edge from-layer="635" from-port="0" to-layer="636" to-port="4" />
|
|
<edge from-layer="636" from-port="5" to-layer="641" to-port="0" />
|
|
<edge from-layer="636" from-port="5" to-layer="657" to-port="0" />
|
|
<edge from-layer="636" from-port="5" to-layer="673" to-port="0" />
|
|
<edge from-layer="637" from-port="0" to-layer="638" to-port="0" />
|
|
<edge from-layer="638" from-port="1" to-layer="640" to-port="0" />
|
|
<edge from-layer="639" from-port="0" to-layer="640" to-port="1" />
|
|
<edge from-layer="640" from-port="2" to-layer="641" to-port="1" />
|
|
<edge from-layer="641" from-port="2" to-layer="643" to-port="0" />
|
|
<edge from-layer="642" from-port="0" to-layer="643" to-port="1" />
|
|
<edge from-layer="643" from-port="2" to-layer="648" to-port="0" />
|
|
<edge from-layer="644" from-port="0" to-layer="648" to-port="1" />
|
|
<edge from-layer="645" from-port="0" to-layer="648" to-port="2" />
|
|
<edge from-layer="646" from-port="0" to-layer="648" to-port="3" />
|
|
<edge from-layer="647" from-port="0" to-layer="648" to-port="4" />
|
|
<edge from-layer="648" from-port="5" to-layer="650" to-port="0" />
|
|
<edge from-layer="649" from-port="0" to-layer="650" to-port="1" />
|
|
<edge from-layer="650" from-port="2" to-layer="652" to-port="0" />
|
|
<edge from-layer="651" from-port="0" to-layer="652" to-port="1" />
|
|
<edge from-layer="652" from-port="2" to-layer="680" to-port="0" />
|
|
<edge from-layer="653" from-port="0" to-layer="654" to-port="0" />
|
|
<edge from-layer="654" from-port="1" to-layer="656" to-port="0" />
|
|
<edge from-layer="655" from-port="0" to-layer="656" to-port="1" />
|
|
<edge from-layer="656" from-port="2" to-layer="657" to-port="1" />
|
|
<edge from-layer="657" from-port="2" to-layer="659" to-port="0" />
|
|
<edge from-layer="658" from-port="0" to-layer="659" to-port="1" />
|
|
<edge from-layer="659" from-port="2" to-layer="664" to-port="0" />
|
|
<edge from-layer="660" from-port="0" to-layer="664" to-port="1" />
|
|
<edge from-layer="661" from-port="0" to-layer="664" to-port="2" />
|
|
<edge from-layer="662" from-port="0" to-layer="664" to-port="3" />
|
|
<edge from-layer="663" from-port="0" to-layer="664" to-port="4" />
|
|
<edge from-layer="664" from-port="5" to-layer="666" to-port="0" />
|
|
<edge from-layer="665" from-port="0" to-layer="666" to-port="1" />
|
|
<edge from-layer="666" from-port="2" to-layer="668" to-port="0" />
|
|
<edge from-layer="667" from-port="0" to-layer="668" to-port="1" />
|
|
<edge from-layer="668" from-port="2" to-layer="680" to-port="1" />
|
|
<edge from-layer="669" from-port="0" to-layer="670" to-port="0" />
|
|
<edge from-layer="670" from-port="1" to-layer="672" to-port="0" />
|
|
<edge from-layer="671" from-port="0" to-layer="672" to-port="1" />
|
|
<edge from-layer="672" from-port="2" to-layer="673" to-port="1" />
|
|
<edge from-layer="673" from-port="2" to-layer="675" to-port="0" />
|
|
<edge from-layer="674" from-port="0" to-layer="675" to-port="1" />
|
|
<edge from-layer="675" from-port="2" to-layer="677" to-port="0" />
|
|
<edge from-layer="676" from-port="0" to-layer="677" to-port="1" />
|
|
<edge from-layer="677" from-port="2" to-layer="679" to-port="0" />
|
|
<edge from-layer="678" from-port="0" to-layer="679" to-port="1" />
|
|
<edge from-layer="679" from-port="2" to-layer="680" to-port="2" />
|
|
<edge from-layer="680" from-port="4" to-layer="682" to-port="0" />
|
|
<edge from-layer="681" from-port="0" to-layer="682" to-port="1" />
|
|
<edge from-layer="682" from-port="2" to-layer="684" to-port="0" />
|
|
<edge from-layer="683" from-port="0" to-layer="684" to-port="1" />
|
|
<edge from-layer="684" from-port="2" to-layer="686" to-port="0" />
|
|
<edge from-layer="685" from-port="0" to-layer="686" to-port="1" />
|
|
<edge from-layer="686" from-port="2" to-layer="691" to-port="0" />
|
|
<edge from-layer="687" from-port="0" to-layer="691" to-port="1" />
|
|
<edge from-layer="688" from-port="0" to-layer="691" to-port="2" />
|
|
<edge from-layer="689" from-port="0" to-layer="691" to-port="3" />
|
|
<edge from-layer="690" from-port="0" to-layer="691" to-port="4" />
|
|
<edge from-layer="691" from-port="5" to-layer="696" to-port="0" />
|
|
<edge from-layer="692" from-port="0" to-layer="693" to-port="0" />
|
|
<edge from-layer="693" from-port="1" to-layer="695" to-port="0" />
|
|
<edge from-layer="694" from-port="0" to-layer="695" to-port="1" />
|
|
<edge from-layer="695" from-port="2" to-layer="696" to-port="1" />
|
|
<edge from-layer="696" from-port="2" to-layer="698" to-port="0" />
|
|
<edge from-layer="697" from-port="0" to-layer="698" to-port="1" />
|
|
<edge from-layer="698" from-port="2" to-layer="699" to-port="0" />
|
|
<edge from-layer="699" from-port="2" to-layer="701" to-port="0" />
|
|
<edge from-layer="700" from-port="0" to-layer="701" to-port="1" />
|
|
<edge from-layer="701" from-port="2" to-layer="703" to-port="0" />
|
|
<edge from-layer="702" from-port="0" to-layer="703" to-port="1" />
|
|
<edge from-layer="703" from-port="2" to-layer="705" to-port="0" />
|
|
<edge from-layer="704" from-port="0" to-layer="705" to-port="1" />
|
|
<edge from-layer="705" from-port="2" to-layer="735" to-port="1" />
|
|
<edge from-layer="705" from-port="2" to-layer="707" to-port="0" />
|
|
<edge from-layer="706" from-port="0" to-layer="707" to-port="1" />
|
|
<edge from-layer="707" from-port="2" to-layer="712" to-port="0" />
|
|
<edge from-layer="708" from-port="0" to-layer="712" to-port="1" />
|
|
<edge from-layer="709" from-port="0" to-layer="712" to-port="2" />
|
|
<edge from-layer="710" from-port="0" to-layer="712" to-port="3" />
|
|
<edge from-layer="711" from-port="0" to-layer="712" to-port="4" />
|
|
<edge from-layer="712" from-port="5" to-layer="717" to-port="0" />
|
|
<edge from-layer="713" from-port="0" to-layer="714" to-port="0" />
|
|
<edge from-layer="714" from-port="1" to-layer="716" to-port="0" />
|
|
<edge from-layer="715" from-port="0" to-layer="716" to-port="1" />
|
|
<edge from-layer="716" from-port="2" to-layer="717" to-port="1" />
|
|
<edge from-layer="717" from-port="2" to-layer="719" to-port="0" />
|
|
<edge from-layer="718" from-port="0" to-layer="719" to-port="1" />
|
|
<edge from-layer="719" from-port="2" to-layer="720" to-port="0" />
|
|
<edge from-layer="720" from-port="1" to-layer="722" to-port="0" />
|
|
<edge from-layer="721" from-port="0" to-layer="722" to-port="1" />
|
|
<edge from-layer="722" from-port="2" to-layer="727" to-port="0" />
|
|
<edge from-layer="723" from-port="0" to-layer="727" to-port="1" />
|
|
<edge from-layer="724" from-port="0" to-layer="727" to-port="2" />
|
|
<edge from-layer="725" from-port="0" to-layer="727" to-port="3" />
|
|
<edge from-layer="726" from-port="0" to-layer="727" to-port="4" />
|
|
<edge from-layer="727" from-port="5" to-layer="732" to-port="0" />
|
|
<edge from-layer="728" from-port="0" to-layer="729" to-port="0" />
|
|
<edge from-layer="729" from-port="1" to-layer="731" to-port="0" />
|
|
<edge from-layer="730" from-port="0" to-layer="731" to-port="1" />
|
|
<edge from-layer="731" from-port="2" to-layer="732" to-port="1" />
|
|
<edge from-layer="732" from-port="2" to-layer="734" to-port="0" />
|
|
<edge from-layer="733" from-port="0" to-layer="734" to-port="1" />
|
|
<edge from-layer="734" from-port="2" to-layer="735" to-port="0" />
|
|
<edge from-layer="735" from-port="2" to-layer="737" to-port="0" />
|
|
<edge from-layer="736" from-port="0" to-layer="737" to-port="1" />
|
|
<edge from-layer="737" from-port="2" to-layer="739" to-port="0" />
|
|
<edge from-layer="738" from-port="0" to-layer="739" to-port="1" />
|
|
<edge from-layer="739" from-port="2" to-layer="741" to-port="0" />
|
|
<edge from-layer="740" from-port="0" to-layer="741" to-port="1" />
|
|
<edge from-layer="741" from-port="2" to-layer="743" to-port="0" />
|
|
<edge from-layer="741" from-port="2" to-layer="811" to-port="1" />
|
|
<edge from-layer="742" from-port="0" to-layer="743" to-port="1" />
|
|
<edge from-layer="743" from-port="2" to-layer="748" to-port="0" />
|
|
<edge from-layer="744" from-port="0" to-layer="748" to-port="1" />
|
|
<edge from-layer="745" from-port="0" to-layer="748" to-port="2" />
|
|
<edge from-layer="746" from-port="0" to-layer="748" to-port="3" />
|
|
<edge from-layer="747" from-port="0" to-layer="748" to-port="4" />
|
|
<edge from-layer="748" from-port="5" to-layer="753" to-port="0" />
|
|
<edge from-layer="748" from-port="5" to-layer="785" to-port="0" />
|
|
<edge from-layer="748" from-port="5" to-layer="769" to-port="0" />
|
|
<edge from-layer="749" from-port="0" to-layer="750" to-port="0" />
|
|
<edge from-layer="750" from-port="1" to-layer="752" to-port="0" />
|
|
<edge from-layer="751" from-port="0" to-layer="752" to-port="1" />
|
|
<edge from-layer="752" from-port="2" to-layer="753" to-port="1" />
|
|
<edge from-layer="753" from-port="2" to-layer="755" to-port="0" />
|
|
<edge from-layer="754" from-port="0" to-layer="755" to-port="1" />
|
|
<edge from-layer="755" from-port="2" to-layer="760" to-port="0" />
|
|
<edge from-layer="756" from-port="0" to-layer="760" to-port="1" />
|
|
<edge from-layer="757" from-port="0" to-layer="760" to-port="2" />
|
|
<edge from-layer="758" from-port="0" to-layer="760" to-port="3" />
|
|
<edge from-layer="759" from-port="0" to-layer="760" to-port="4" />
|
|
<edge from-layer="760" from-port="5" to-layer="762" to-port="0" />
|
|
<edge from-layer="761" from-port="0" to-layer="762" to-port="1" />
|
|
<edge from-layer="762" from-port="2" to-layer="764" to-port="0" />
|
|
<edge from-layer="763" from-port="0" to-layer="764" to-port="1" />
|
|
<edge from-layer="764" from-port="2" to-layer="792" to-port="0" />
|
|
<edge from-layer="765" from-port="0" to-layer="766" to-port="0" />
|
|
<edge from-layer="766" from-port="1" to-layer="768" to-port="0" />
|
|
<edge from-layer="767" from-port="0" to-layer="768" to-port="1" />
|
|
<edge from-layer="768" from-port="2" to-layer="769" to-port="1" />
|
|
<edge from-layer="769" from-port="2" to-layer="771" to-port="0" />
|
|
<edge from-layer="770" from-port="0" to-layer="771" to-port="1" />
|
|
<edge from-layer="771" from-port="2" to-layer="776" to-port="0" />
|
|
<edge from-layer="772" from-port="0" to-layer="776" to-port="1" />
|
|
<edge from-layer="773" from-port="0" to-layer="776" to-port="2" />
|
|
<edge from-layer="774" from-port="0" to-layer="776" to-port="3" />
|
|
<edge from-layer="775" from-port="0" to-layer="776" to-port="4" />
|
|
<edge from-layer="776" from-port="5" to-layer="778" to-port="0" />
|
|
<edge from-layer="777" from-port="0" to-layer="778" to-port="1" />
|
|
<edge from-layer="778" from-port="2" to-layer="780" to-port="0" />
|
|
<edge from-layer="779" from-port="0" to-layer="780" to-port="1" />
|
|
<edge from-layer="780" from-port="2" to-layer="792" to-port="1" />
|
|
<edge from-layer="781" from-port="0" to-layer="782" to-port="0" />
|
|
<edge from-layer="782" from-port="1" to-layer="784" to-port="0" />
|
|
<edge from-layer="783" from-port="0" to-layer="784" to-port="1" />
|
|
<edge from-layer="784" from-port="2" to-layer="785" to-port="1" />
|
|
<edge from-layer="785" from-port="2" to-layer="787" to-port="0" />
|
|
<edge from-layer="786" from-port="0" to-layer="787" to-port="1" />
|
|
<edge from-layer="787" from-port="2" to-layer="789" to-port="0" />
|
|
<edge from-layer="788" from-port="0" to-layer="789" to-port="1" />
|
|
<edge from-layer="789" from-port="2" to-layer="791" to-port="0" />
|
|
<edge from-layer="790" from-port="0" to-layer="791" to-port="1" />
|
|
<edge from-layer="791" from-port="2" to-layer="792" to-port="2" />
|
|
<edge from-layer="792" from-port="4" to-layer="794" to-port="0" />
|
|
<edge from-layer="793" from-port="0" to-layer="794" to-port="1" />
|
|
<edge from-layer="794" from-port="2" to-layer="796" to-port="0" />
|
|
<edge from-layer="795" from-port="0" to-layer="796" to-port="1" />
|
|
<edge from-layer="796" from-port="2" to-layer="798" to-port="0" />
|
|
<edge from-layer="797" from-port="0" to-layer="798" to-port="1" />
|
|
<edge from-layer="798" from-port="2" to-layer="803" to-port="0" />
|
|
<edge from-layer="799" from-port="0" to-layer="803" to-port="1" />
|
|
<edge from-layer="800" from-port="0" to-layer="803" to-port="2" />
|
|
<edge from-layer="801" from-port="0" to-layer="803" to-port="3" />
|
|
<edge from-layer="802" from-port="0" to-layer="803" to-port="4" />
|
|
<edge from-layer="803" from-port="5" to-layer="808" to-port="0" />
|
|
<edge from-layer="804" from-port="0" to-layer="805" to-port="0" />
|
|
<edge from-layer="805" from-port="1" to-layer="807" to-port="0" />
|
|
<edge from-layer="806" from-port="0" to-layer="807" to-port="1" />
|
|
<edge from-layer="807" from-port="2" to-layer="808" to-port="1" />
|
|
<edge from-layer="808" from-port="2" to-layer="810" to-port="0" />
|
|
<edge from-layer="809" from-port="0" to-layer="810" to-port="1" />
|
|
<edge from-layer="810" from-port="2" to-layer="811" to-port="0" />
|
|
<edge from-layer="811" from-port="2" to-layer="813" to-port="0" />
|
|
<edge from-layer="812" from-port="0" to-layer="813" to-port="1" />
|
|
<edge from-layer="813" from-port="2" to-layer="815" to-port="0" />
|
|
<edge from-layer="814" from-port="0" to-layer="815" to-port="1" />
|
|
<edge from-layer="815" from-port="2" to-layer="817" to-port="0" />
|
|
<edge from-layer="816" from-port="0" to-layer="817" to-port="1" />
|
|
<edge from-layer="817" from-port="2" to-layer="847" to-port="1" />
|
|
<edge from-layer="817" from-port="2" to-layer="819" to-port="0" />
|
|
<edge from-layer="818" from-port="0" to-layer="819" to-port="1" />
|
|
<edge from-layer="819" from-port="2" to-layer="824" to-port="0" />
|
|
<edge from-layer="820" from-port="0" to-layer="824" to-port="1" />
|
|
<edge from-layer="821" from-port="0" to-layer="824" to-port="2" />
|
|
<edge from-layer="822" from-port="0" to-layer="824" to-port="3" />
|
|
<edge from-layer="823" from-port="0" to-layer="824" to-port="4" />
|
|
<edge from-layer="824" from-port="5" to-layer="829" to-port="0" />
|
|
<edge from-layer="825" from-port="0" to-layer="826" to-port="0" />
|
|
<edge from-layer="826" from-port="1" to-layer="828" to-port="0" />
|
|
<edge from-layer="827" from-port="0" to-layer="828" to-port="1" />
|
|
<edge from-layer="828" from-port="2" to-layer="829" to-port="1" />
|
|
<edge from-layer="829" from-port="2" to-layer="831" to-port="0" />
|
|
<edge from-layer="830" from-port="0" to-layer="831" to-port="1" />
|
|
<edge from-layer="831" from-port="2" to-layer="832" to-port="0" />
|
|
<edge from-layer="832" from-port="1" to-layer="834" to-port="0" />
|
|
<edge from-layer="833" from-port="0" to-layer="834" to-port="1" />
|
|
<edge from-layer="834" from-port="2" to-layer="839" to-port="0" />
|
|
<edge from-layer="835" from-port="0" to-layer="839" to-port="1" />
|
|
<edge from-layer="836" from-port="0" to-layer="839" to-port="2" />
|
|
<edge from-layer="837" from-port="0" to-layer="839" to-port="3" />
|
|
<edge from-layer="838" from-port="0" to-layer="839" to-port="4" />
|
|
<edge from-layer="839" from-port="5" to-layer="844" to-port="0" />
|
|
<edge from-layer="840" from-port="0" to-layer="841" to-port="0" />
|
|
<edge from-layer="841" from-port="1" to-layer="843" to-port="0" />
|
|
<edge from-layer="842" from-port="0" to-layer="843" to-port="1" />
|
|
<edge from-layer="843" from-port="2" to-layer="844" to-port="1" />
|
|
<edge from-layer="844" from-port="2" to-layer="846" to-port="0" />
|
|
<edge from-layer="845" from-port="0" to-layer="846" to-port="1" />
|
|
<edge from-layer="846" from-port="2" to-layer="847" to-port="0" />
|
|
<edge from-layer="847" from-port="2" to-layer="849" to-port="0" />
|
|
<edge from-layer="848" from-port="0" to-layer="849" to-port="1" />
|
|
<edge from-layer="849" from-port="2" to-layer="851" to-port="0" />
|
|
<edge from-layer="850" from-port="0" to-layer="851" to-port="1" />
|
|
<edge from-layer="851" from-port="2" to-layer="853" to-port="0" />
|
|
<edge from-layer="852" from-port="0" to-layer="853" to-port="1" />
|
|
<edge from-layer="853" from-port="2" to-layer="923" to-port="1" />
|
|
<edge from-layer="853" from-port="2" to-layer="855" to-port="0" />
|
|
<edge from-layer="854" from-port="0" to-layer="855" to-port="1" />
|
|
<edge from-layer="855" from-port="2" to-layer="860" to-port="0" />
|
|
<edge from-layer="856" from-port="0" to-layer="860" to-port="1" />
|
|
<edge from-layer="857" from-port="0" to-layer="860" to-port="2" />
|
|
<edge from-layer="858" from-port="0" to-layer="860" to-port="3" />
|
|
<edge from-layer="859" from-port="0" to-layer="860" to-port="4" />
|
|
<edge from-layer="860" from-port="5" to-layer="865" to-port="0" />
|
|
<edge from-layer="860" from-port="5" to-layer="897" to-port="0" />
|
|
<edge from-layer="860" from-port="5" to-layer="881" to-port="0" />
|
|
<edge from-layer="861" from-port="0" to-layer="862" to-port="0" />
|
|
<edge from-layer="862" from-port="1" to-layer="864" to-port="0" />
|
|
<edge from-layer="863" from-port="0" to-layer="864" to-port="1" />
|
|
<edge from-layer="864" from-port="2" to-layer="865" to-port="1" />
|
|
<edge from-layer="865" from-port="2" to-layer="867" to-port="0" />
|
|
<edge from-layer="866" from-port="0" to-layer="867" to-port="1" />
|
|
<edge from-layer="867" from-port="2" to-layer="872" to-port="0" />
|
|
<edge from-layer="868" from-port="0" to-layer="872" to-port="1" />
|
|
<edge from-layer="869" from-port="0" to-layer="872" to-port="2" />
|
|
<edge from-layer="870" from-port="0" to-layer="872" to-port="3" />
|
|
<edge from-layer="871" from-port="0" to-layer="872" to-port="4" />
|
|
<edge from-layer="872" from-port="5" to-layer="874" to-port="0" />
|
|
<edge from-layer="873" from-port="0" to-layer="874" to-port="1" />
|
|
<edge from-layer="874" from-port="2" to-layer="876" to-port="0" />
|
|
<edge from-layer="875" from-port="0" to-layer="876" to-port="1" />
|
|
<edge from-layer="876" from-port="2" to-layer="904" to-port="0" />
|
|
<edge from-layer="877" from-port="0" to-layer="878" to-port="0" />
|
|
<edge from-layer="878" from-port="1" to-layer="880" to-port="0" />
|
|
<edge from-layer="879" from-port="0" to-layer="880" to-port="1" />
|
|
<edge from-layer="880" from-port="2" to-layer="881" to-port="1" />
|
|
<edge from-layer="881" from-port="2" to-layer="883" to-port="0" />
|
|
<edge from-layer="882" from-port="0" to-layer="883" to-port="1" />
|
|
<edge from-layer="883" from-port="2" to-layer="888" to-port="0" />
|
|
<edge from-layer="884" from-port="0" to-layer="888" to-port="1" />
|
|
<edge from-layer="885" from-port="0" to-layer="888" to-port="2" />
|
|
<edge from-layer="886" from-port="0" to-layer="888" to-port="3" />
|
|
<edge from-layer="887" from-port="0" to-layer="888" to-port="4" />
|
|
<edge from-layer="888" from-port="5" to-layer="890" to-port="0" />
|
|
<edge from-layer="889" from-port="0" to-layer="890" to-port="1" />
|
|
<edge from-layer="890" from-port="2" to-layer="892" to-port="0" />
|
|
<edge from-layer="891" from-port="0" to-layer="892" to-port="1" />
|
|
<edge from-layer="892" from-port="2" to-layer="904" to-port="1" />
|
|
<edge from-layer="893" from-port="0" to-layer="894" to-port="0" />
|
|
<edge from-layer="894" from-port="1" to-layer="896" to-port="0" />
|
|
<edge from-layer="895" from-port="0" to-layer="896" to-port="1" />
|
|
<edge from-layer="896" from-port="2" to-layer="897" to-port="1" />
|
|
<edge from-layer="897" from-port="2" to-layer="899" to-port="0" />
|
|
<edge from-layer="898" from-port="0" to-layer="899" to-port="1" />
|
|
<edge from-layer="899" from-port="2" to-layer="901" to-port="0" />
|
|
<edge from-layer="900" from-port="0" to-layer="901" to-port="1" />
|
|
<edge from-layer="901" from-port="2" to-layer="903" to-port="0" />
|
|
<edge from-layer="902" from-port="0" to-layer="903" to-port="1" />
|
|
<edge from-layer="903" from-port="2" to-layer="904" to-port="2" />
|
|
<edge from-layer="904" from-port="4" to-layer="906" to-port="0" />
|
|
<edge from-layer="905" from-port="0" to-layer="906" to-port="1" />
|
|
<edge from-layer="906" from-port="2" to-layer="908" to-port="0" />
|
|
<edge from-layer="907" from-port="0" to-layer="908" to-port="1" />
|
|
<edge from-layer="908" from-port="2" to-layer="910" to-port="0" />
|
|
<edge from-layer="909" from-port="0" to-layer="910" to-port="1" />
|
|
<edge from-layer="910" from-port="2" to-layer="915" to-port="0" />
|
|
<edge from-layer="911" from-port="0" to-layer="915" to-port="1" />
|
|
<edge from-layer="912" from-port="0" to-layer="915" to-port="2" />
|
|
<edge from-layer="913" from-port="0" to-layer="915" to-port="3" />
|
|
<edge from-layer="914" from-port="0" to-layer="915" to-port="4" />
|
|
<edge from-layer="915" from-port="5" to-layer="920" to-port="0" />
|
|
<edge from-layer="916" from-port="0" to-layer="917" to-port="0" />
|
|
<edge from-layer="917" from-port="1" to-layer="919" to-port="0" />
|
|
<edge from-layer="918" from-port="0" to-layer="919" to-port="1" />
|
|
<edge from-layer="919" from-port="2" to-layer="920" to-port="1" />
|
|
<edge from-layer="920" from-port="2" to-layer="922" to-port="0" />
|
|
<edge from-layer="921" from-port="0" to-layer="922" to-port="1" />
|
|
<edge from-layer="922" from-port="2" to-layer="923" to-port="0" />
|
|
<edge from-layer="923" from-port="2" to-layer="925" to-port="0" />
|
|
<edge from-layer="924" from-port="0" to-layer="925" to-port="1" />
|
|
<edge from-layer="925" from-port="2" to-layer="927" to-port="0" />
|
|
<edge from-layer="926" from-port="0" to-layer="927" to-port="1" />
|
|
<edge from-layer="927" from-port="2" to-layer="929" to-port="0" />
|
|
<edge from-layer="928" from-port="0" to-layer="929" to-port="1" />
|
|
<edge from-layer="929" from-port="2" to-layer="931" to-port="0" />
|
|
<edge from-layer="929" from-port="2" to-layer="959" to-port="1" />
|
|
<edge from-layer="930" from-port="0" to-layer="931" to-port="1" />
|
|
<edge from-layer="931" from-port="2" to-layer="936" to-port="0" />
|
|
<edge from-layer="932" from-port="0" to-layer="936" to-port="1" />
|
|
<edge from-layer="933" from-port="0" to-layer="936" to-port="2" />
|
|
<edge from-layer="934" from-port="0" to-layer="936" to-port="3" />
|
|
<edge from-layer="935" from-port="0" to-layer="936" to-port="4" />
|
|
<edge from-layer="936" from-port="5" to-layer="941" to-port="0" />
|
|
<edge from-layer="937" from-port="0" to-layer="938" to-port="0" />
|
|
<edge from-layer="938" from-port="1" to-layer="940" to-port="0" />
|
|
<edge from-layer="939" from-port="0" to-layer="940" to-port="1" />
|
|
<edge from-layer="940" from-port="2" to-layer="941" to-port="1" />
|
|
<edge from-layer="941" from-port="2" to-layer="943" to-port="0" />
|
|
<edge from-layer="942" from-port="0" to-layer="943" to-port="1" />
|
|
<edge from-layer="943" from-port="2" to-layer="944" to-port="0" />
|
|
<edge from-layer="944" from-port="1" to-layer="946" to-port="0" />
|
|
<edge from-layer="945" from-port="0" to-layer="946" to-port="1" />
|
|
<edge from-layer="946" from-port="2" to-layer="951" to-port="0" />
|
|
<edge from-layer="947" from-port="0" to-layer="951" to-port="1" />
|
|
<edge from-layer="948" from-port="0" to-layer="951" to-port="2" />
|
|
<edge from-layer="949" from-port="0" to-layer="951" to-port="3" />
|
|
<edge from-layer="950" from-port="0" to-layer="951" to-port="4" />
|
|
<edge from-layer="951" from-port="5" to-layer="956" to-port="0" />
|
|
<edge from-layer="952" from-port="0" to-layer="953" to-port="0" />
|
|
<edge from-layer="953" from-port="1" to-layer="955" to-port="0" />
|
|
<edge from-layer="954" from-port="0" to-layer="955" to-port="1" />
|
|
<edge from-layer="955" from-port="2" to-layer="956" to-port="1" />
|
|
<edge from-layer="956" from-port="2" to-layer="958" to-port="0" />
|
|
<edge from-layer="957" from-port="0" to-layer="958" to-port="1" />
|
|
<edge from-layer="958" from-port="2" to-layer="959" to-port="0" />
|
|
<edge from-layer="959" from-port="2" to-layer="961" to-port="0" />
|
|
<edge from-layer="960" from-port="0" to-layer="961" to-port="1" />
|
|
<edge from-layer="961" from-port="2" to-layer="963" to-port="0" />
|
|
<edge from-layer="962" from-port="0" to-layer="963" to-port="1" />
|
|
<edge from-layer="963" from-port="2" to-layer="965" to-port="0" />
|
|
<edge from-layer="964" from-port="0" to-layer="965" to-port="1" />
|
|
<edge from-layer="965" from-port="2" to-layer="967" to-port="0" />
|
|
<edge from-layer="965" from-port="2" to-layer="1035" to-port="1" />
|
|
<edge from-layer="966" from-port="0" to-layer="967" to-port="1" />
|
|
<edge from-layer="967" from-port="2" to-layer="972" to-port="0" />
|
|
<edge from-layer="968" from-port="0" to-layer="972" to-port="1" />
|
|
<edge from-layer="969" from-port="0" to-layer="972" to-port="2" />
|
|
<edge from-layer="970" from-port="0" to-layer="972" to-port="3" />
|
|
<edge from-layer="971" from-port="0" to-layer="972" to-port="4" />
|
|
<edge from-layer="972" from-port="5" to-layer="977" to-port="0" />
|
|
<edge from-layer="972" from-port="5" to-layer="1009" to-port="0" />
|
|
<edge from-layer="972" from-port="5" to-layer="993" to-port="0" />
|
|
<edge from-layer="973" from-port="0" to-layer="974" to-port="0" />
|
|
<edge from-layer="974" from-port="1" to-layer="976" to-port="0" />
|
|
<edge from-layer="975" from-port="0" to-layer="976" to-port="1" />
|
|
<edge from-layer="976" from-port="2" to-layer="977" to-port="1" />
|
|
<edge from-layer="977" from-port="2" to-layer="979" to-port="0" />
|
|
<edge from-layer="978" from-port="0" to-layer="979" to-port="1" />
|
|
<edge from-layer="979" from-port="2" to-layer="984" to-port="0" />
|
|
<edge from-layer="980" from-port="0" to-layer="984" to-port="1" />
|
|
<edge from-layer="981" from-port="0" to-layer="984" to-port="2" />
|
|
<edge from-layer="982" from-port="0" to-layer="984" to-port="3" />
|
|
<edge from-layer="983" from-port="0" to-layer="984" to-port="4" />
|
|
<edge from-layer="984" from-port="5" to-layer="986" to-port="0" />
|
|
<edge from-layer="985" from-port="0" to-layer="986" to-port="1" />
|
|
<edge from-layer="986" from-port="2" to-layer="988" to-port="0" />
|
|
<edge from-layer="987" from-port="0" to-layer="988" to-port="1" />
|
|
<edge from-layer="988" from-port="2" to-layer="1016" to-port="0" />
|
|
<edge from-layer="989" from-port="0" to-layer="990" to-port="0" />
|
|
<edge from-layer="990" from-port="1" to-layer="992" to-port="0" />
|
|
<edge from-layer="991" from-port="0" to-layer="992" to-port="1" />
|
|
<edge from-layer="992" from-port="2" to-layer="993" to-port="1" />
|
|
<edge from-layer="993" from-port="2" to-layer="995" to-port="0" />
|
|
<edge from-layer="994" from-port="0" to-layer="995" to-port="1" />
|
|
<edge from-layer="995" from-port="2" to-layer="1000" to-port="0" />
|
|
<edge from-layer="996" from-port="0" to-layer="1000" to-port="1" />
|
|
<edge from-layer="997" from-port="0" to-layer="1000" to-port="2" />
|
|
<edge from-layer="998" from-port="0" to-layer="1000" to-port="3" />
|
|
<edge from-layer="999" from-port="0" to-layer="1000" to-port="4" />
|
|
<edge from-layer="1000" from-port="5" to-layer="1002" to-port="0" />
|
|
<edge from-layer="1001" from-port="0" to-layer="1002" to-port="1" />
|
|
<edge from-layer="1002" from-port="2" to-layer="1004" to-port="0" />
|
|
<edge from-layer="1003" from-port="0" to-layer="1004" to-port="1" />
|
|
<edge from-layer="1004" from-port="2" to-layer="1016" to-port="1" />
|
|
<edge from-layer="1005" from-port="0" to-layer="1006" to-port="0" />
|
|
<edge from-layer="1006" from-port="1" to-layer="1008" to-port="0" />
|
|
<edge from-layer="1007" from-port="0" to-layer="1008" to-port="1" />
|
|
<edge from-layer="1008" from-port="2" to-layer="1009" to-port="1" />
|
|
<edge from-layer="1009" from-port="2" to-layer="1011" to-port="0" />
|
|
<edge from-layer="1010" from-port="0" to-layer="1011" to-port="1" />
|
|
<edge from-layer="1011" from-port="2" to-layer="1013" to-port="0" />
|
|
<edge from-layer="1012" from-port="0" to-layer="1013" to-port="1" />
|
|
<edge from-layer="1013" from-port="2" to-layer="1015" to-port="0" />
|
|
<edge from-layer="1014" from-port="0" to-layer="1015" to-port="1" />
|
|
<edge from-layer="1015" from-port="2" to-layer="1016" to-port="2" />
|
|
<edge from-layer="1016" from-port="4" to-layer="1018" to-port="0" />
|
|
<edge from-layer="1017" from-port="0" to-layer="1018" to-port="1" />
|
|
<edge from-layer="1018" from-port="2" to-layer="1020" to-port="0" />
|
|
<edge from-layer="1019" from-port="0" to-layer="1020" to-port="1" />
|
|
<edge from-layer="1020" from-port="2" to-layer="1022" to-port="0" />
|
|
<edge from-layer="1021" from-port="0" to-layer="1022" to-port="1" />
|
|
<edge from-layer="1022" from-port="2" to-layer="1027" to-port="0" />
|
|
<edge from-layer="1023" from-port="0" to-layer="1027" to-port="1" />
|
|
<edge from-layer="1024" from-port="0" to-layer="1027" to-port="2" />
|
|
<edge from-layer="1025" from-port="0" to-layer="1027" to-port="3" />
|
|
<edge from-layer="1026" from-port="0" to-layer="1027" to-port="4" />
|
|
<edge from-layer="1027" from-port="5" to-layer="1032" to-port="0" />
|
|
<edge from-layer="1028" from-port="0" to-layer="1029" to-port="0" />
|
|
<edge from-layer="1029" from-port="1" to-layer="1031" to-port="0" />
|
|
<edge from-layer="1030" from-port="0" to-layer="1031" to-port="1" />
|
|
<edge from-layer="1031" from-port="2" to-layer="1032" to-port="1" />
|
|
<edge from-layer="1032" from-port="2" to-layer="1034" to-port="0" />
|
|
<edge from-layer="1033" from-port="0" to-layer="1034" to-port="1" />
|
|
<edge from-layer="1034" from-port="2" to-layer="1035" to-port="0" />
|
|
<edge from-layer="1035" from-port="2" to-layer="1037" to-port="0" />
|
|
<edge from-layer="1036" from-port="0" to-layer="1037" to-port="1" />
|
|
<edge from-layer="1037" from-port="2" to-layer="1039" to-port="0" />
|
|
<edge from-layer="1038" from-port="0" to-layer="1039" to-port="1" />
|
|
<edge from-layer="1039" from-port="2" to-layer="1041" to-port="0" />
|
|
<edge from-layer="1040" from-port="0" to-layer="1041" to-port="1" />
|
|
<edge from-layer="1041" from-port="2" to-layer="1071" to-port="1" />
|
|
<edge from-layer="1041" from-port="2" to-layer="1043" to-port="0" />
|
|
<edge from-layer="1042" from-port="0" to-layer="1043" to-port="1" />
|
|
<edge from-layer="1043" from-port="2" to-layer="1048" to-port="0" />
|
|
<edge from-layer="1044" from-port="0" to-layer="1048" to-port="1" />
|
|
<edge from-layer="1045" from-port="0" to-layer="1048" to-port="2" />
|
|
<edge from-layer="1046" from-port="0" to-layer="1048" to-port="3" />
|
|
<edge from-layer="1047" from-port="0" to-layer="1048" to-port="4" />
|
|
<edge from-layer="1048" from-port="5" to-layer="1053" to-port="0" />
|
|
<edge from-layer="1049" from-port="0" to-layer="1050" to-port="0" />
|
|
<edge from-layer="1050" from-port="1" to-layer="1052" to-port="0" />
|
|
<edge from-layer="1051" from-port="0" to-layer="1052" to-port="1" />
|
|
<edge from-layer="1052" from-port="2" to-layer="1053" to-port="1" />
|
|
<edge from-layer="1053" from-port="2" to-layer="1055" to-port="0" />
|
|
<edge from-layer="1054" from-port="0" to-layer="1055" to-port="1" />
|
|
<edge from-layer="1055" from-port="2" to-layer="1056" to-port="0" />
|
|
<edge from-layer="1056" from-port="1" to-layer="1058" to-port="0" />
|
|
<edge from-layer="1057" from-port="0" to-layer="1058" to-port="1" />
|
|
<edge from-layer="1058" from-port="2" to-layer="1063" to-port="0" />
|
|
<edge from-layer="1059" from-port="0" to-layer="1063" to-port="1" />
|
|
<edge from-layer="1060" from-port="0" to-layer="1063" to-port="2" />
|
|
<edge from-layer="1061" from-port="0" to-layer="1063" to-port="3" />
|
|
<edge from-layer="1062" from-port="0" to-layer="1063" to-port="4" />
|
|
<edge from-layer="1063" from-port="5" to-layer="1068" to-port="0" />
|
|
<edge from-layer="1064" from-port="0" to-layer="1065" to-port="0" />
|
|
<edge from-layer="1065" from-port="1" to-layer="1067" to-port="0" />
|
|
<edge from-layer="1066" from-port="0" to-layer="1067" to-port="1" />
|
|
<edge from-layer="1067" from-port="2" to-layer="1068" to-port="1" />
|
|
<edge from-layer="1068" from-port="2" to-layer="1070" to-port="0" />
|
|
<edge from-layer="1069" from-port="0" to-layer="1070" to-port="1" />
|
|
<edge from-layer="1070" from-port="2" to-layer="1071" to-port="0" />
|
|
<edge from-layer="1071" from-port="2" to-layer="1073" to-port="0" />
|
|
<edge from-layer="1072" from-port="0" to-layer="1073" to-port="1" />
|
|
<edge from-layer="1073" from-port="2" to-layer="1075" to-port="0" />
|
|
<edge from-layer="1074" from-port="0" to-layer="1075" to-port="1" />
|
|
<edge from-layer="1075" from-port="2" to-layer="1077" to-port="0" />
|
|
<edge from-layer="1076" from-port="0" to-layer="1077" to-port="1" />
|
|
<edge from-layer="1077" from-port="2" to-layer="1079" to-port="0" />
|
|
<edge from-layer="1077" from-port="2" to-layer="1147" to-port="1" />
|
|
<edge from-layer="1078" from-port="0" to-layer="1079" to-port="1" />
|
|
<edge from-layer="1079" from-port="2" to-layer="1084" to-port="0" />
|
|
<edge from-layer="1080" from-port="0" to-layer="1084" to-port="1" />
|
|
<edge from-layer="1081" from-port="0" to-layer="1084" to-port="2" />
|
|
<edge from-layer="1082" from-port="0" to-layer="1084" to-port="3" />
|
|
<edge from-layer="1083" from-port="0" to-layer="1084" to-port="4" />
|
|
<edge from-layer="1084" from-port="5" to-layer="1089" to-port="0" />
|
|
<edge from-layer="1084" from-port="5" to-layer="1105" to-port="0" />
|
|
<edge from-layer="1084" from-port="5" to-layer="1121" to-port="0" />
|
|
<edge from-layer="1085" from-port="0" to-layer="1086" to-port="0" />
|
|
<edge from-layer="1086" from-port="1" to-layer="1088" to-port="0" />
|
|
<edge from-layer="1087" from-port="0" to-layer="1088" to-port="1" />
|
|
<edge from-layer="1088" from-port="2" to-layer="1089" to-port="1" />
|
|
<edge from-layer="1089" from-port="2" to-layer="1091" to-port="0" />
|
|
<edge from-layer="1090" from-port="0" to-layer="1091" to-port="1" />
|
|
<edge from-layer="1091" from-port="2" to-layer="1096" to-port="0" />
|
|
<edge from-layer="1092" from-port="0" to-layer="1096" to-port="1" />
|
|
<edge from-layer="1093" from-port="0" to-layer="1096" to-port="2" />
|
|
<edge from-layer="1094" from-port="0" to-layer="1096" to-port="3" />
|
|
<edge from-layer="1095" from-port="0" to-layer="1096" to-port="4" />
|
|
<edge from-layer="1096" from-port="5" to-layer="1098" to-port="0" />
|
|
<edge from-layer="1097" from-port="0" to-layer="1098" to-port="1" />
|
|
<edge from-layer="1098" from-port="2" to-layer="1100" to-port="0" />
|
|
<edge from-layer="1099" from-port="0" to-layer="1100" to-port="1" />
|
|
<edge from-layer="1100" from-port="2" to-layer="1128" to-port="0" />
|
|
<edge from-layer="1101" from-port="0" to-layer="1102" to-port="0" />
|
|
<edge from-layer="1102" from-port="1" to-layer="1104" to-port="0" />
|
|
<edge from-layer="1103" from-port="0" to-layer="1104" to-port="1" />
|
|
<edge from-layer="1104" from-port="2" to-layer="1105" to-port="1" />
|
|
<edge from-layer="1105" from-port="2" to-layer="1107" to-port="0" />
|
|
<edge from-layer="1106" from-port="0" to-layer="1107" to-port="1" />
|
|
<edge from-layer="1107" from-port="2" to-layer="1112" to-port="0" />
|
|
<edge from-layer="1108" from-port="0" to-layer="1112" to-port="1" />
|
|
<edge from-layer="1109" from-port="0" to-layer="1112" to-port="2" />
|
|
<edge from-layer="1110" from-port="0" to-layer="1112" to-port="3" />
|
|
<edge from-layer="1111" from-port="0" to-layer="1112" to-port="4" />
|
|
<edge from-layer="1112" from-port="5" to-layer="1114" to-port="0" />
|
|
<edge from-layer="1113" from-port="0" to-layer="1114" to-port="1" />
|
|
<edge from-layer="1114" from-port="2" to-layer="1116" to-port="0" />
|
|
<edge from-layer="1115" from-port="0" to-layer="1116" to-port="1" />
|
|
<edge from-layer="1116" from-port="2" to-layer="1128" to-port="1" />
|
|
<edge from-layer="1117" from-port="0" to-layer="1118" to-port="0" />
|
|
<edge from-layer="1118" from-port="1" to-layer="1120" to-port="0" />
|
|
<edge from-layer="1119" from-port="0" to-layer="1120" to-port="1" />
|
|
<edge from-layer="1120" from-port="2" to-layer="1121" to-port="1" />
|
|
<edge from-layer="1121" from-port="2" to-layer="1123" to-port="0" />
|
|
<edge from-layer="1122" from-port="0" to-layer="1123" to-port="1" />
|
|
<edge from-layer="1123" from-port="2" to-layer="1125" to-port="0" />
|
|
<edge from-layer="1124" from-port="0" to-layer="1125" to-port="1" />
|
|
<edge from-layer="1125" from-port="2" to-layer="1127" to-port="0" />
|
|
<edge from-layer="1126" from-port="0" to-layer="1127" to-port="1" />
|
|
<edge from-layer="1127" from-port="2" to-layer="1128" to-port="2" />
|
|
<edge from-layer="1128" from-port="4" to-layer="1130" to-port="0" />
|
|
<edge from-layer="1129" from-port="0" to-layer="1130" to-port="1" />
|
|
<edge from-layer="1130" from-port="2" to-layer="1132" to-port="0" />
|
|
<edge from-layer="1131" from-port="0" to-layer="1132" to-port="1" />
|
|
<edge from-layer="1132" from-port="2" to-layer="1134" to-port="0" />
|
|
<edge from-layer="1133" from-port="0" to-layer="1134" to-port="1" />
|
|
<edge from-layer="1134" from-port="2" to-layer="1139" to-port="0" />
|
|
<edge from-layer="1135" from-port="0" to-layer="1139" to-port="1" />
|
|
<edge from-layer="1136" from-port="0" to-layer="1139" to-port="2" />
|
|
<edge from-layer="1137" from-port="0" to-layer="1139" to-port="3" />
|
|
<edge from-layer="1138" from-port="0" to-layer="1139" to-port="4" />
|
|
<edge from-layer="1139" from-port="5" to-layer="1144" to-port="0" />
|
|
<edge from-layer="1140" from-port="0" to-layer="1141" to-port="0" />
|
|
<edge from-layer="1141" from-port="1" to-layer="1143" to-port="0" />
|
|
<edge from-layer="1142" from-port="0" to-layer="1143" to-port="1" />
|
|
<edge from-layer="1143" from-port="2" to-layer="1144" to-port="1" />
|
|
<edge from-layer="1144" from-port="2" to-layer="1146" to-port="0" />
|
|
<edge from-layer="1145" from-port="0" to-layer="1146" to-port="1" />
|
|
<edge from-layer="1146" from-port="2" to-layer="1147" to-port="0" />
|
|
<edge from-layer="1147" from-port="2" to-layer="1149" to-port="0" />
|
|
<edge from-layer="1148" from-port="0" to-layer="1149" to-port="1" />
|
|
<edge from-layer="1149" from-port="2" to-layer="1151" to-port="0" />
|
|
<edge from-layer="1150" from-port="0" to-layer="1151" to-port="1" />
|
|
<edge from-layer="1151" from-port="2" to-layer="1153" to-port="0" />
|
|
<edge from-layer="1152" from-port="0" to-layer="1153" to-port="1" />
|
|
<edge from-layer="1153" from-port="2" to-layer="1183" to-port="1" />
|
|
<edge from-layer="1153" from-port="2" to-layer="1155" to-port="0" />
|
|
<edge from-layer="1154" from-port="0" to-layer="1155" to-port="1" />
|
|
<edge from-layer="1155" from-port="2" to-layer="1160" to-port="0" />
|
|
<edge from-layer="1156" from-port="0" to-layer="1160" to-port="1" />
|
|
<edge from-layer="1157" from-port="0" to-layer="1160" to-port="2" />
|
|
<edge from-layer="1158" from-port="0" to-layer="1160" to-port="3" />
|
|
<edge from-layer="1159" from-port="0" to-layer="1160" to-port="4" />
|
|
<edge from-layer="1160" from-port="5" to-layer="1165" to-port="0" />
|
|
<edge from-layer="1161" from-port="0" to-layer="1162" to-port="0" />
|
|
<edge from-layer="1162" from-port="1" to-layer="1164" to-port="0" />
|
|
<edge from-layer="1163" from-port="0" to-layer="1164" to-port="1" />
|
|
<edge from-layer="1164" from-port="2" to-layer="1165" to-port="1" />
|
|
<edge from-layer="1165" from-port="2" to-layer="1167" to-port="0" />
|
|
<edge from-layer="1166" from-port="0" to-layer="1167" to-port="1" />
|
|
<edge from-layer="1167" from-port="2" to-layer="1168" to-port="0" />
|
|
<edge from-layer="1168" from-port="1" to-layer="1170" to-port="0" />
|
|
<edge from-layer="1169" from-port="0" to-layer="1170" to-port="1" />
|
|
<edge from-layer="1170" from-port="2" to-layer="1175" to-port="0" />
|
|
<edge from-layer="1171" from-port="0" to-layer="1175" to-port="1" />
|
|
<edge from-layer="1172" from-port="0" to-layer="1175" to-port="2" />
|
|
<edge from-layer="1173" from-port="0" to-layer="1175" to-port="3" />
|
|
<edge from-layer="1174" from-port="0" to-layer="1175" to-port="4" />
|
|
<edge from-layer="1175" from-port="5" to-layer="1180" to-port="0" />
|
|
<edge from-layer="1176" from-port="0" to-layer="1177" to-port="0" />
|
|
<edge from-layer="1177" from-port="1" to-layer="1179" to-port="0" />
|
|
<edge from-layer="1178" from-port="0" to-layer="1179" to-port="1" />
|
|
<edge from-layer="1179" from-port="2" to-layer="1180" to-port="1" />
|
|
<edge from-layer="1180" from-port="2" to-layer="1182" to-port="0" />
|
|
<edge from-layer="1181" from-port="0" to-layer="1182" to-port="1" />
|
|
<edge from-layer="1182" from-port="2" to-layer="1183" to-port="0" />
|
|
<edge from-layer="1183" from-port="2" to-layer="1185" to-port="0" />
|
|
<edge from-layer="1184" from-port="0" to-layer="1185" to-port="1" />
|
|
<edge from-layer="1185" from-port="2" to-layer="1187" to-port="0" />
|
|
<edge from-layer="1186" from-port="0" to-layer="1187" to-port="1" />
|
|
<edge from-layer="1187" from-port="2" to-layer="1189" to-port="0" />
|
|
<edge from-layer="1188" from-port="0" to-layer="1189" to-port="1" />
|
|
<edge from-layer="1189" from-port="2" to-layer="1191" to-port="0" />
|
|
<edge from-layer="1189" from-port="2" to-layer="1259" to-port="1" />
|
|
<edge from-layer="1190" from-port="0" to-layer="1191" to-port="1" />
|
|
<edge from-layer="1191" from-port="2" to-layer="1196" to-port="0" />
|
|
<edge from-layer="1192" from-port="0" to-layer="1196" to-port="1" />
|
|
<edge from-layer="1193" from-port="0" to-layer="1196" to-port="2" />
|
|
<edge from-layer="1194" from-port="0" to-layer="1196" to-port="3" />
|
|
<edge from-layer="1195" from-port="0" to-layer="1196" to-port="4" />
|
|
<edge from-layer="1196" from-port="5" to-layer="1201" to-port="0" />
|
|
<edge from-layer="1196" from-port="5" to-layer="1217" to-port="0" />
|
|
<edge from-layer="1196" from-port="5" to-layer="1233" to-port="0" />
|
|
<edge from-layer="1197" from-port="0" to-layer="1198" to-port="0" />
|
|
<edge from-layer="1198" from-port="1" to-layer="1200" to-port="0" />
|
|
<edge from-layer="1199" from-port="0" to-layer="1200" to-port="1" />
|
|
<edge from-layer="1200" from-port="2" to-layer="1201" to-port="1" />
|
|
<edge from-layer="1201" from-port="2" to-layer="1203" to-port="0" />
|
|
<edge from-layer="1202" from-port="0" to-layer="1203" to-port="1" />
|
|
<edge from-layer="1203" from-port="2" to-layer="1208" to-port="0" />
|
|
<edge from-layer="1204" from-port="0" to-layer="1208" to-port="1" />
|
|
<edge from-layer="1205" from-port="0" to-layer="1208" to-port="2" />
|
|
<edge from-layer="1206" from-port="0" to-layer="1208" to-port="3" />
|
|
<edge from-layer="1207" from-port="0" to-layer="1208" to-port="4" />
|
|
<edge from-layer="1208" from-port="5" to-layer="1210" to-port="0" />
|
|
<edge from-layer="1209" from-port="0" to-layer="1210" to-port="1" />
|
|
<edge from-layer="1210" from-port="2" to-layer="1212" to-port="0" />
|
|
<edge from-layer="1211" from-port="0" to-layer="1212" to-port="1" />
|
|
<edge from-layer="1212" from-port="2" to-layer="1240" to-port="0" />
|
|
<edge from-layer="1213" from-port="0" to-layer="1214" to-port="0" />
|
|
<edge from-layer="1214" from-port="1" to-layer="1216" to-port="0" />
|
|
<edge from-layer="1215" from-port="0" to-layer="1216" to-port="1" />
|
|
<edge from-layer="1216" from-port="2" to-layer="1217" to-port="1" />
|
|
<edge from-layer="1217" from-port="2" to-layer="1219" to-port="0" />
|
|
<edge from-layer="1218" from-port="0" to-layer="1219" to-port="1" />
|
|
<edge from-layer="1219" from-port="2" to-layer="1224" to-port="0" />
|
|
<edge from-layer="1220" from-port="0" to-layer="1224" to-port="1" />
|
|
<edge from-layer="1221" from-port="0" to-layer="1224" to-port="2" />
|
|
<edge from-layer="1222" from-port="0" to-layer="1224" to-port="3" />
|
|
<edge from-layer="1223" from-port="0" to-layer="1224" to-port="4" />
|
|
<edge from-layer="1224" from-port="5" to-layer="1226" to-port="0" />
|
|
<edge from-layer="1225" from-port="0" to-layer="1226" to-port="1" />
|
|
<edge from-layer="1226" from-port="2" to-layer="1228" to-port="0" />
|
|
<edge from-layer="1227" from-port="0" to-layer="1228" to-port="1" />
|
|
<edge from-layer="1228" from-port="2" to-layer="1240" to-port="1" />
|
|
<edge from-layer="1229" from-port="0" to-layer="1230" to-port="0" />
|
|
<edge from-layer="1230" from-port="1" to-layer="1232" to-port="0" />
|
|
<edge from-layer="1231" from-port="0" to-layer="1232" to-port="1" />
|
|
<edge from-layer="1232" from-port="2" to-layer="1233" to-port="1" />
|
|
<edge from-layer="1233" from-port="2" to-layer="1235" to-port="0" />
|
|
<edge from-layer="1234" from-port="0" to-layer="1235" to-port="1" />
|
|
<edge from-layer="1235" from-port="2" to-layer="1237" to-port="0" />
|
|
<edge from-layer="1236" from-port="0" to-layer="1237" to-port="1" />
|
|
<edge from-layer="1237" from-port="2" to-layer="1239" to-port="0" />
|
|
<edge from-layer="1238" from-port="0" to-layer="1239" to-port="1" />
|
|
<edge from-layer="1239" from-port="2" to-layer="1240" to-port="2" />
|
|
<edge from-layer="1240" from-port="4" to-layer="1242" to-port="0" />
|
|
<edge from-layer="1241" from-port="0" to-layer="1242" to-port="1" />
|
|
<edge from-layer="1242" from-port="2" to-layer="1244" to-port="0" />
|
|
<edge from-layer="1243" from-port="0" to-layer="1244" to-port="1" />
|
|
<edge from-layer="1244" from-port="2" to-layer="1246" to-port="0" />
|
|
<edge from-layer="1245" from-port="0" to-layer="1246" to-port="1" />
|
|
<edge from-layer="1246" from-port="2" to-layer="1251" to-port="0" />
|
|
<edge from-layer="1247" from-port="0" to-layer="1251" to-port="1" />
|
|
<edge from-layer="1248" from-port="0" to-layer="1251" to-port="2" />
|
|
<edge from-layer="1249" from-port="0" to-layer="1251" to-port="3" />
|
|
<edge from-layer="1250" from-port="0" to-layer="1251" to-port="4" />
|
|
<edge from-layer="1251" from-port="5" to-layer="1256" to-port="0" />
|
|
<edge from-layer="1252" from-port="0" to-layer="1253" to-port="0" />
|
|
<edge from-layer="1253" from-port="1" to-layer="1255" to-port="0" />
|
|
<edge from-layer="1254" from-port="0" to-layer="1255" to-port="1" />
|
|
<edge from-layer="1255" from-port="2" to-layer="1256" to-port="1" />
|
|
<edge from-layer="1256" from-port="2" to-layer="1258" to-port="0" />
|
|
<edge from-layer="1257" from-port="0" to-layer="1258" to-port="1" />
|
|
<edge from-layer="1258" from-port="2" to-layer="1259" to-port="0" />
|
|
<edge from-layer="1259" from-port="2" to-layer="1261" to-port="0" />
|
|
<edge from-layer="1260" from-port="0" to-layer="1261" to-port="1" />
|
|
<edge from-layer="1261" from-port="2" to-layer="1263" to-port="0" />
|
|
<edge from-layer="1262" from-port="0" to-layer="1263" to-port="1" />
|
|
<edge from-layer="1263" from-port="2" to-layer="1265" to-port="0" />
|
|
<edge from-layer="1264" from-port="0" to-layer="1265" to-port="1" />
|
|
<edge from-layer="1265" from-port="2" to-layer="1267" to-port="0" />
|
|
<edge from-layer="1265" from-port="2" to-layer="1295" to-port="1" />
|
|
<edge from-layer="1266" from-port="0" to-layer="1267" to-port="1" />
|
|
<edge from-layer="1267" from-port="2" to-layer="1272" to-port="0" />
|
|
<edge from-layer="1268" from-port="0" to-layer="1272" to-port="1" />
|
|
<edge from-layer="1269" from-port="0" to-layer="1272" to-port="2" />
|
|
<edge from-layer="1270" from-port="0" to-layer="1272" to-port="3" />
|
|
<edge from-layer="1271" from-port="0" to-layer="1272" to-port="4" />
|
|
<edge from-layer="1272" from-port="5" to-layer="1277" to-port="0" />
|
|
<edge from-layer="1273" from-port="0" to-layer="1274" to-port="0" />
|
|
<edge from-layer="1274" from-port="1" to-layer="1276" to-port="0" />
|
|
<edge from-layer="1275" from-port="0" to-layer="1276" to-port="1" />
|
|
<edge from-layer="1276" from-port="2" to-layer="1277" to-port="1" />
|
|
<edge from-layer="1277" from-port="2" to-layer="1279" to-port="0" />
|
|
<edge from-layer="1278" from-port="0" to-layer="1279" to-port="1" />
|
|
<edge from-layer="1279" from-port="2" to-layer="1280" to-port="0" />
|
|
<edge from-layer="1280" from-port="1" to-layer="1282" to-port="0" />
|
|
<edge from-layer="1281" from-port="0" to-layer="1282" to-port="1" />
|
|
<edge from-layer="1282" from-port="2" to-layer="1287" to-port="0" />
|
|
<edge from-layer="1283" from-port="0" to-layer="1287" to-port="1" />
|
|
<edge from-layer="1284" from-port="0" to-layer="1287" to-port="2" />
|
|
<edge from-layer="1285" from-port="0" to-layer="1287" to-port="3" />
|
|
<edge from-layer="1286" from-port="0" to-layer="1287" to-port="4" />
|
|
<edge from-layer="1287" from-port="5" to-layer="1292" to-port="0" />
|
|
<edge from-layer="1288" from-port="0" to-layer="1289" to-port="0" />
|
|
<edge from-layer="1289" from-port="1" to-layer="1291" to-port="0" />
|
|
<edge from-layer="1290" from-port="0" to-layer="1291" to-port="1" />
|
|
<edge from-layer="1291" from-port="2" to-layer="1292" to-port="1" />
|
|
<edge from-layer="1292" from-port="2" to-layer="1294" to-port="0" />
|
|
<edge from-layer="1293" from-port="0" to-layer="1294" to-port="1" />
|
|
<edge from-layer="1294" from-port="2" to-layer="1295" to-port="0" />
|
|
<edge from-layer="1295" from-port="2" to-layer="1297" to-port="0" />
|
|
<edge from-layer="1296" from-port="0" to-layer="1297" to-port="1" />
|
|
<edge from-layer="1297" from-port="2" to-layer="1299" to-port="0" />
|
|
<edge from-layer="1298" from-port="0" to-layer="1299" to-port="1" />
|
|
<edge from-layer="1299" from-port="2" to-layer="1301" to-port="0" />
|
|
<edge from-layer="1300" from-port="0" to-layer="1301" to-port="1" />
|
|
<edge from-layer="1301" from-port="2" to-layer="1303" to-port="0" />
|
|
<edge from-layer="1301" from-port="2" to-layer="1371" to-port="1" />
|
|
<edge from-layer="1302" from-port="0" to-layer="1303" to-port="1" />
|
|
<edge from-layer="1303" from-port="2" to-layer="1308" to-port="0" />
|
|
<edge from-layer="1304" from-port="0" to-layer="1308" to-port="1" />
|
|
<edge from-layer="1305" from-port="0" to-layer="1308" to-port="2" />
|
|
<edge from-layer="1306" from-port="0" to-layer="1308" to-port="3" />
|
|
<edge from-layer="1307" from-port="0" to-layer="1308" to-port="4" />
|
|
<edge from-layer="1308" from-port="5" to-layer="1329" to-port="0" />
|
|
<edge from-layer="1308" from-port="5" to-layer="1345" to-port="0" />
|
|
<edge from-layer="1308" from-port="5" to-layer="1313" to-port="0" />
|
|
<edge from-layer="1309" from-port="0" to-layer="1310" to-port="0" />
|
|
<edge from-layer="1310" from-port="1" to-layer="1312" to-port="0" />
|
|
<edge from-layer="1311" from-port="0" to-layer="1312" to-port="1" />
|
|
<edge from-layer="1312" from-port="2" to-layer="1313" to-port="1" />
|
|
<edge from-layer="1313" from-port="2" to-layer="1315" to-port="0" />
|
|
<edge from-layer="1314" from-port="0" to-layer="1315" to-port="1" />
|
|
<edge from-layer="1315" from-port="2" to-layer="1320" to-port="0" />
|
|
<edge from-layer="1316" from-port="0" to-layer="1320" to-port="1" />
|
|
<edge from-layer="1317" from-port="0" to-layer="1320" to-port="2" />
|
|
<edge from-layer="1318" from-port="0" to-layer="1320" to-port="3" />
|
|
<edge from-layer="1319" from-port="0" to-layer="1320" to-port="4" />
|
|
<edge from-layer="1320" from-port="5" to-layer="1322" to-port="0" />
|
|
<edge from-layer="1321" from-port="0" to-layer="1322" to-port="1" />
|
|
<edge from-layer="1322" from-port="2" to-layer="1324" to-port="0" />
|
|
<edge from-layer="1323" from-port="0" to-layer="1324" to-port="1" />
|
|
<edge from-layer="1324" from-port="2" to-layer="1352" to-port="0" />
|
|
<edge from-layer="1325" from-port="0" to-layer="1326" to-port="0" />
|
|
<edge from-layer="1326" from-port="1" to-layer="1328" to-port="0" />
|
|
<edge from-layer="1327" from-port="0" to-layer="1328" to-port="1" />
|
|
<edge from-layer="1328" from-port="2" to-layer="1329" to-port="1" />
|
|
<edge from-layer="1329" from-port="2" to-layer="1331" to-port="0" />
|
|
<edge from-layer="1330" from-port="0" to-layer="1331" to-port="1" />
|
|
<edge from-layer="1331" from-port="2" to-layer="1336" to-port="0" />
|
|
<edge from-layer="1332" from-port="0" to-layer="1336" to-port="1" />
|
|
<edge from-layer="1333" from-port="0" to-layer="1336" to-port="2" />
|
|
<edge from-layer="1334" from-port="0" to-layer="1336" to-port="3" />
|
|
<edge from-layer="1335" from-port="0" to-layer="1336" to-port="4" />
|
|
<edge from-layer="1336" from-port="5" to-layer="1338" to-port="0" />
|
|
<edge from-layer="1337" from-port="0" to-layer="1338" to-port="1" />
|
|
<edge from-layer="1338" from-port="2" to-layer="1340" to-port="0" />
|
|
<edge from-layer="1339" from-port="0" to-layer="1340" to-port="1" />
|
|
<edge from-layer="1340" from-port="2" to-layer="1352" to-port="1" />
|
|
<edge from-layer="1341" from-port="0" to-layer="1342" to-port="0" />
|
|
<edge from-layer="1342" from-port="1" to-layer="1344" to-port="0" />
|
|
<edge from-layer="1343" from-port="0" to-layer="1344" to-port="1" />
|
|
<edge from-layer="1344" from-port="2" to-layer="1345" to-port="1" />
|
|
<edge from-layer="1345" from-port="2" to-layer="1347" to-port="0" />
|
|
<edge from-layer="1346" from-port="0" to-layer="1347" to-port="1" />
|
|
<edge from-layer="1347" from-port="2" to-layer="1349" to-port="0" />
|
|
<edge from-layer="1348" from-port="0" to-layer="1349" to-port="1" />
|
|
<edge from-layer="1349" from-port="2" to-layer="1351" to-port="0" />
|
|
<edge from-layer="1350" from-port="0" to-layer="1351" to-port="1" />
|
|
<edge from-layer="1351" from-port="2" to-layer="1352" to-port="2" />
|
|
<edge from-layer="1352" from-port="4" to-layer="1354" to-port="0" />
|
|
<edge from-layer="1353" from-port="0" to-layer="1354" to-port="1" />
|
|
<edge from-layer="1354" from-port="2" to-layer="1356" to-port="0" />
|
|
<edge from-layer="1355" from-port="0" to-layer="1356" to-port="1" />
|
|
<edge from-layer="1356" from-port="2" to-layer="1358" to-port="0" />
|
|
<edge from-layer="1357" from-port="0" to-layer="1358" to-port="1" />
|
|
<edge from-layer="1358" from-port="2" to-layer="1363" to-port="0" />
|
|
<edge from-layer="1359" from-port="0" to-layer="1363" to-port="1" />
|
|
<edge from-layer="1360" from-port="0" to-layer="1363" to-port="2" />
|
|
<edge from-layer="1361" from-port="0" to-layer="1363" to-port="3" />
|
|
<edge from-layer="1362" from-port="0" to-layer="1363" to-port="4" />
|
|
<edge from-layer="1363" from-port="5" to-layer="1368" to-port="0" />
|
|
<edge from-layer="1364" from-port="0" to-layer="1365" to-port="0" />
|
|
<edge from-layer="1365" from-port="1" to-layer="1367" to-port="0" />
|
|
<edge from-layer="1366" from-port="0" to-layer="1367" to-port="1" />
|
|
<edge from-layer="1367" from-port="2" to-layer="1368" to-port="1" />
|
|
<edge from-layer="1368" from-port="2" to-layer="1370" to-port="0" />
|
|
<edge from-layer="1369" from-port="0" to-layer="1370" to-port="1" />
|
|
<edge from-layer="1370" from-port="2" to-layer="1371" to-port="0" />
|
|
<edge from-layer="1371" from-port="2" to-layer="1373" to-port="0" />
|
|
<edge from-layer="1372" from-port="0" to-layer="1373" to-port="1" />
|
|
<edge from-layer="1373" from-port="2" to-layer="1375" to-port="0" />
|
|
<edge from-layer="1374" from-port="0" to-layer="1375" to-port="1" />
|
|
<edge from-layer="1375" from-port="2" to-layer="1377" to-port="0" />
|
|
<edge from-layer="1376" from-port="0" to-layer="1377" to-port="1" />
|
|
<edge from-layer="1377" from-port="2" to-layer="1407" to-port="1" />
|
|
<edge from-layer="1377" from-port="2" to-layer="1379" to-port="0" />
|
|
<edge from-layer="1378" from-port="0" to-layer="1379" to-port="1" />
|
|
<edge from-layer="1379" from-port="2" to-layer="1384" to-port="0" />
|
|
<edge from-layer="1380" from-port="0" to-layer="1384" to-port="1" />
|
|
<edge from-layer="1381" from-port="0" to-layer="1384" to-port="2" />
|
|
<edge from-layer="1382" from-port="0" to-layer="1384" to-port="3" />
|
|
<edge from-layer="1383" from-port="0" to-layer="1384" to-port="4" />
|
|
<edge from-layer="1384" from-port="5" to-layer="1389" to-port="0" />
|
|
<edge from-layer="1385" from-port="0" to-layer="1386" to-port="0" />
|
|
<edge from-layer="1386" from-port="1" to-layer="1388" to-port="0" />
|
|
<edge from-layer="1387" from-port="0" to-layer="1388" to-port="1" />
|
|
<edge from-layer="1388" from-port="2" to-layer="1389" to-port="1" />
|
|
<edge from-layer="1389" from-port="2" to-layer="1391" to-port="0" />
|
|
<edge from-layer="1390" from-port="0" to-layer="1391" to-port="1" />
|
|
<edge from-layer="1391" from-port="2" to-layer="1392" to-port="0" />
|
|
<edge from-layer="1392" from-port="1" to-layer="1394" to-port="0" />
|
|
<edge from-layer="1393" from-port="0" to-layer="1394" to-port="1" />
|
|
<edge from-layer="1394" from-port="2" to-layer="1399" to-port="0" />
|
|
<edge from-layer="1395" from-port="0" to-layer="1399" to-port="1" />
|
|
<edge from-layer="1396" from-port="0" to-layer="1399" to-port="2" />
|
|
<edge from-layer="1397" from-port="0" to-layer="1399" to-port="3" />
|
|
<edge from-layer="1398" from-port="0" to-layer="1399" to-port="4" />
|
|
<edge from-layer="1399" from-port="5" to-layer="1404" to-port="0" />
|
|
<edge from-layer="1400" from-port="0" to-layer="1401" to-port="0" />
|
|
<edge from-layer="1401" from-port="1" to-layer="1403" to-port="0" />
|
|
<edge from-layer="1402" from-port="0" to-layer="1403" to-port="1" />
|
|
<edge from-layer="1403" from-port="2" to-layer="1404" to-port="1" />
|
|
<edge from-layer="1404" from-port="2" to-layer="1406" to-port="0" />
|
|
<edge from-layer="1405" from-port="0" to-layer="1406" to-port="1" />
|
|
<edge from-layer="1406" from-port="2" to-layer="1407" to-port="0" />
|
|
<edge from-layer="1407" from-port="2" to-layer="1409" to-port="0" />
|
|
<edge from-layer="1408" from-port="0" to-layer="1409" to-port="1" />
|
|
<edge from-layer="1409" from-port="2" to-layer="1411" to-port="0" />
|
|
<edge from-layer="1410" from-port="0" to-layer="1411" to-port="1" />
|
|
<edge from-layer="1411" from-port="2" to-layer="1413" to-port="0" />
|
|
<edge from-layer="1412" from-port="0" to-layer="1413" to-port="1" />
|
|
<edge from-layer="1413" from-port="2" to-layer="1483" to-port="1" />
|
|
<edge from-layer="1413" from-port="2" to-layer="1415" to-port="0" />
|
|
<edge from-layer="1414" from-port="0" to-layer="1415" to-port="1" />
|
|
<edge from-layer="1415" from-port="2" to-layer="1420" to-port="0" />
|
|
<edge from-layer="1416" from-port="0" to-layer="1420" to-port="1" />
|
|
<edge from-layer="1417" from-port="0" to-layer="1420" to-port="2" />
|
|
<edge from-layer="1418" from-port="0" to-layer="1420" to-port="3" />
|
|
<edge from-layer="1419" from-port="0" to-layer="1420" to-port="4" />
|
|
<edge from-layer="1420" from-port="5" to-layer="1425" to-port="0" />
|
|
<edge from-layer="1420" from-port="5" to-layer="1441" to-port="0" />
|
|
<edge from-layer="1420" from-port="5" to-layer="1457" to-port="0" />
|
|
<edge from-layer="1421" from-port="0" to-layer="1422" to-port="0" />
|
|
<edge from-layer="1422" from-port="1" to-layer="1424" to-port="0" />
|
|
<edge from-layer="1423" from-port="0" to-layer="1424" to-port="1" />
|
|
<edge from-layer="1424" from-port="2" to-layer="1425" to-port="1" />
|
|
<edge from-layer="1425" from-port="2" to-layer="1427" to-port="0" />
|
|
<edge from-layer="1426" from-port="0" to-layer="1427" to-port="1" />
|
|
<edge from-layer="1427" from-port="2" to-layer="1432" to-port="0" />
|
|
<edge from-layer="1428" from-port="0" to-layer="1432" to-port="1" />
|
|
<edge from-layer="1429" from-port="0" to-layer="1432" to-port="2" />
|
|
<edge from-layer="1430" from-port="0" to-layer="1432" to-port="3" />
|
|
<edge from-layer="1431" from-port="0" to-layer="1432" to-port="4" />
|
|
<edge from-layer="1432" from-port="5" to-layer="1434" to-port="0" />
|
|
<edge from-layer="1433" from-port="0" to-layer="1434" to-port="1" />
|
|
<edge from-layer="1434" from-port="2" to-layer="1436" to-port="0" />
|
|
<edge from-layer="1435" from-port="0" to-layer="1436" to-port="1" />
|
|
<edge from-layer="1436" from-port="2" to-layer="1464" to-port="0" />
|
|
<edge from-layer="1437" from-port="0" to-layer="1438" to-port="0" />
|
|
<edge from-layer="1438" from-port="1" to-layer="1440" to-port="0" />
|
|
<edge from-layer="1439" from-port="0" to-layer="1440" to-port="1" />
|
|
<edge from-layer="1440" from-port="2" to-layer="1441" to-port="1" />
|
|
<edge from-layer="1441" from-port="2" to-layer="1443" to-port="0" />
|
|
<edge from-layer="1442" from-port="0" to-layer="1443" to-port="1" />
|
|
<edge from-layer="1443" from-port="2" to-layer="1448" to-port="0" />
|
|
<edge from-layer="1444" from-port="0" to-layer="1448" to-port="1" />
|
|
<edge from-layer="1445" from-port="0" to-layer="1448" to-port="2" />
|
|
<edge from-layer="1446" from-port="0" to-layer="1448" to-port="3" />
|
|
<edge from-layer="1447" from-port="0" to-layer="1448" to-port="4" />
|
|
<edge from-layer="1448" from-port="5" to-layer="1450" to-port="0" />
|
|
<edge from-layer="1449" from-port="0" to-layer="1450" to-port="1" />
|
|
<edge from-layer="1450" from-port="2" to-layer="1452" to-port="0" />
|
|
<edge from-layer="1451" from-port="0" to-layer="1452" to-port="1" />
|
|
<edge from-layer="1452" from-port="2" to-layer="1464" to-port="1" />
|
|
<edge from-layer="1453" from-port="0" to-layer="1454" to-port="0" />
|
|
<edge from-layer="1454" from-port="1" to-layer="1456" to-port="0" />
|
|
<edge from-layer="1455" from-port="0" to-layer="1456" to-port="1" />
|
|
<edge from-layer="1456" from-port="2" to-layer="1457" to-port="1" />
|
|
<edge from-layer="1457" from-port="2" to-layer="1459" to-port="0" />
|
|
<edge from-layer="1458" from-port="0" to-layer="1459" to-port="1" />
|
|
<edge from-layer="1459" from-port="2" to-layer="1461" to-port="0" />
|
|
<edge from-layer="1460" from-port="0" to-layer="1461" to-port="1" />
|
|
<edge from-layer="1461" from-port="2" to-layer="1463" to-port="0" />
|
|
<edge from-layer="1462" from-port="0" to-layer="1463" to-port="1" />
|
|
<edge from-layer="1463" from-port="2" to-layer="1464" to-port="2" />
|
|
<edge from-layer="1464" from-port="4" to-layer="1466" to-port="0" />
|
|
<edge from-layer="1465" from-port="0" to-layer="1466" to-port="1" />
|
|
<edge from-layer="1466" from-port="2" to-layer="1468" to-port="0" />
|
|
<edge from-layer="1467" from-port="0" to-layer="1468" to-port="1" />
|
|
<edge from-layer="1468" from-port="2" to-layer="1470" to-port="0" />
|
|
<edge from-layer="1469" from-port="0" to-layer="1470" to-port="1" />
|
|
<edge from-layer="1470" from-port="2" to-layer="1475" to-port="0" />
|
|
<edge from-layer="1471" from-port="0" to-layer="1475" to-port="1" />
|
|
<edge from-layer="1472" from-port="0" to-layer="1475" to-port="2" />
|
|
<edge from-layer="1473" from-port="0" to-layer="1475" to-port="3" />
|
|
<edge from-layer="1474" from-port="0" to-layer="1475" to-port="4" />
|
|
<edge from-layer="1475" from-port="5" to-layer="1480" to-port="0" />
|
|
<edge from-layer="1476" from-port="0" to-layer="1477" to-port="0" />
|
|
<edge from-layer="1477" from-port="1" to-layer="1479" to-port="0" />
|
|
<edge from-layer="1478" from-port="0" to-layer="1479" to-port="1" />
|
|
<edge from-layer="1479" from-port="2" to-layer="1480" to-port="1" />
|
|
<edge from-layer="1480" from-port="2" to-layer="1482" to-port="0" />
|
|
<edge from-layer="1481" from-port="0" to-layer="1482" to-port="1" />
|
|
<edge from-layer="1482" from-port="2" to-layer="1483" to-port="0" />
|
|
<edge from-layer="1483" from-port="2" to-layer="1485" to-port="0" />
|
|
<edge from-layer="1484" from-port="0" to-layer="1485" to-port="1" />
|
|
<edge from-layer="1485" from-port="2" to-layer="1487" to-port="0" />
|
|
<edge from-layer="1486" from-port="0" to-layer="1487" to-port="1" />
|
|
<edge from-layer="1487" from-port="2" to-layer="1489" to-port="0" />
|
|
<edge from-layer="1488" from-port="0" to-layer="1489" to-port="1" />
|
|
<edge from-layer="1489" from-port="2" to-layer="1491" to-port="0" />
|
|
<edge from-layer="1489" from-port="2" to-layer="1519" to-port="1" />
|
|
<edge from-layer="1490" from-port="0" to-layer="1491" to-port="1" />
|
|
<edge from-layer="1491" from-port="2" to-layer="1496" to-port="0" />
|
|
<edge from-layer="1492" from-port="0" to-layer="1496" to-port="1" />
|
|
<edge from-layer="1493" from-port="0" to-layer="1496" to-port="2" />
|
|
<edge from-layer="1494" from-port="0" to-layer="1496" to-port="3" />
|
|
<edge from-layer="1495" from-port="0" to-layer="1496" to-port="4" />
|
|
<edge from-layer="1496" from-port="5" to-layer="1501" to-port="0" />
|
|
<edge from-layer="1497" from-port="0" to-layer="1498" to-port="0" />
|
|
<edge from-layer="1498" from-port="1" to-layer="1500" to-port="0" />
|
|
<edge from-layer="1499" from-port="0" to-layer="1500" to-port="1" />
|
|
<edge from-layer="1500" from-port="2" to-layer="1501" to-port="1" />
|
|
<edge from-layer="1501" from-port="2" to-layer="1503" to-port="0" />
|
|
<edge from-layer="1502" from-port="0" to-layer="1503" to-port="1" />
|
|
<edge from-layer="1503" from-port="2" to-layer="1504" to-port="0" />
|
|
<edge from-layer="1504" from-port="1" to-layer="1506" to-port="0" />
|
|
<edge from-layer="1505" from-port="0" to-layer="1506" to-port="1" />
|
|
<edge from-layer="1506" from-port="2" to-layer="1511" to-port="0" />
|
|
<edge from-layer="1507" from-port="0" to-layer="1511" to-port="1" />
|
|
<edge from-layer="1508" from-port="0" to-layer="1511" to-port="2" />
|
|
<edge from-layer="1509" from-port="0" to-layer="1511" to-port="3" />
|
|
<edge from-layer="1510" from-port="0" to-layer="1511" to-port="4" />
|
|
<edge from-layer="1511" from-port="5" to-layer="1516" to-port="0" />
|
|
<edge from-layer="1512" from-port="0" to-layer="1513" to-port="0" />
|
|
<edge from-layer="1513" from-port="1" to-layer="1515" to-port="0" />
|
|
<edge from-layer="1514" from-port="0" to-layer="1515" to-port="1" />
|
|
<edge from-layer="1515" from-port="2" to-layer="1516" to-port="1" />
|
|
<edge from-layer="1516" from-port="2" to-layer="1518" to-port="0" />
|
|
<edge from-layer="1517" from-port="0" to-layer="1518" to-port="1" />
|
|
<edge from-layer="1518" from-port="2" to-layer="1519" to-port="0" />
|
|
<edge from-layer="1519" from-port="2" to-layer="1521" to-port="0" />
|
|
<edge from-layer="1520" from-port="0" to-layer="1521" to-port="1" />
|
|
<edge from-layer="1521" from-port="2" to-layer="1523" to-port="0" />
|
|
<edge from-layer="1522" from-port="0" to-layer="1523" to-port="1" />
|
|
<edge from-layer="1523" from-port="2" to-layer="1525" to-port="0" />
|
|
<edge from-layer="1524" from-port="0" to-layer="1525" to-port="1" />
|
|
<edge from-layer="1525" from-port="2" to-layer="1527" to-port="0" />
|
|
<edge from-layer="1525" from-port="2" to-layer="1595" to-port="1" />
|
|
<edge from-layer="1526" from-port="0" to-layer="1527" to-port="1" />
|
|
<edge from-layer="1527" from-port="2" to-layer="1532" to-port="0" />
|
|
<edge from-layer="1528" from-port="0" to-layer="1532" to-port="1" />
|
|
<edge from-layer="1529" from-port="0" to-layer="1532" to-port="2" />
|
|
<edge from-layer="1530" from-port="0" to-layer="1532" to-port="3" />
|
|
<edge from-layer="1531" from-port="0" to-layer="1532" to-port="4" />
|
|
<edge from-layer="1532" from-port="5" to-layer="1553" to-port="0" />
|
|
<edge from-layer="1532" from-port="5" to-layer="1569" to-port="0" />
|
|
<edge from-layer="1532" from-port="5" to-layer="1537" to-port="0" />
|
|
<edge from-layer="1533" from-port="0" to-layer="1534" to-port="0" />
|
|
<edge from-layer="1534" from-port="1" to-layer="1536" to-port="0" />
|
|
<edge from-layer="1535" from-port="0" to-layer="1536" to-port="1" />
|
|
<edge from-layer="1536" from-port="2" to-layer="1537" to-port="1" />
|
|
<edge from-layer="1537" from-port="2" to-layer="1539" to-port="0" />
|
|
<edge from-layer="1538" from-port="0" to-layer="1539" to-port="1" />
|
|
<edge from-layer="1539" from-port="2" to-layer="1544" to-port="0" />
|
|
<edge from-layer="1540" from-port="0" to-layer="1544" to-port="1" />
|
|
<edge from-layer="1541" from-port="0" to-layer="1544" to-port="2" />
|
|
<edge from-layer="1542" from-port="0" to-layer="1544" to-port="3" />
|
|
<edge from-layer="1543" from-port="0" to-layer="1544" to-port="4" />
|
|
<edge from-layer="1544" from-port="5" to-layer="1546" to-port="0" />
|
|
<edge from-layer="1545" from-port="0" to-layer="1546" to-port="1" />
|
|
<edge from-layer="1546" from-port="2" to-layer="1548" to-port="0" />
|
|
<edge from-layer="1547" from-port="0" to-layer="1548" to-port="1" />
|
|
<edge from-layer="1548" from-port="2" to-layer="1576" to-port="0" />
|
|
<edge from-layer="1549" from-port="0" to-layer="1550" to-port="0" />
|
|
<edge from-layer="1550" from-port="1" to-layer="1552" to-port="0" />
|
|
<edge from-layer="1551" from-port="0" to-layer="1552" to-port="1" />
|
|
<edge from-layer="1552" from-port="2" to-layer="1553" to-port="1" />
|
|
<edge from-layer="1553" from-port="2" to-layer="1555" to-port="0" />
|
|
<edge from-layer="1554" from-port="0" to-layer="1555" to-port="1" />
|
|
<edge from-layer="1555" from-port="2" to-layer="1560" to-port="0" />
|
|
<edge from-layer="1556" from-port="0" to-layer="1560" to-port="1" />
|
|
<edge from-layer="1557" from-port="0" to-layer="1560" to-port="2" />
|
|
<edge from-layer="1558" from-port="0" to-layer="1560" to-port="3" />
|
|
<edge from-layer="1559" from-port="0" to-layer="1560" to-port="4" />
|
|
<edge from-layer="1560" from-port="5" to-layer="1562" to-port="0" />
|
|
<edge from-layer="1561" from-port="0" to-layer="1562" to-port="1" />
|
|
<edge from-layer="1562" from-port="2" to-layer="1564" to-port="0" />
|
|
<edge from-layer="1563" from-port="0" to-layer="1564" to-port="1" />
|
|
<edge from-layer="1564" from-port="2" to-layer="1576" to-port="1" />
|
|
<edge from-layer="1565" from-port="0" to-layer="1566" to-port="0" />
|
|
<edge from-layer="1566" from-port="1" to-layer="1568" to-port="0" />
|
|
<edge from-layer="1567" from-port="0" to-layer="1568" to-port="1" />
|
|
<edge from-layer="1568" from-port="2" to-layer="1569" to-port="1" />
|
|
<edge from-layer="1569" from-port="2" to-layer="1571" to-port="0" />
|
|
<edge from-layer="1570" from-port="0" to-layer="1571" to-port="1" />
|
|
<edge from-layer="1571" from-port="2" to-layer="1573" to-port="0" />
|
|
<edge from-layer="1572" from-port="0" to-layer="1573" to-port="1" />
|
|
<edge from-layer="1573" from-port="2" to-layer="1575" to-port="0" />
|
|
<edge from-layer="1574" from-port="0" to-layer="1575" to-port="1" />
|
|
<edge from-layer="1575" from-port="2" to-layer="1576" to-port="2" />
|
|
<edge from-layer="1576" from-port="4" to-layer="1578" to-port="0" />
|
|
<edge from-layer="1577" from-port="0" to-layer="1578" to-port="1" />
|
|
<edge from-layer="1578" from-port="2" to-layer="1580" to-port="0" />
|
|
<edge from-layer="1579" from-port="0" to-layer="1580" to-port="1" />
|
|
<edge from-layer="1580" from-port="2" to-layer="1582" to-port="0" />
|
|
<edge from-layer="1581" from-port="0" to-layer="1582" to-port="1" />
|
|
<edge from-layer="1582" from-port="2" to-layer="1587" to-port="0" />
|
|
<edge from-layer="1583" from-port="0" to-layer="1587" to-port="1" />
|
|
<edge from-layer="1584" from-port="0" to-layer="1587" to-port="2" />
|
|
<edge from-layer="1585" from-port="0" to-layer="1587" to-port="3" />
|
|
<edge from-layer="1586" from-port="0" to-layer="1587" to-port="4" />
|
|
<edge from-layer="1587" from-port="5" to-layer="1592" to-port="0" />
|
|
<edge from-layer="1588" from-port="0" to-layer="1589" to-port="0" />
|
|
<edge from-layer="1589" from-port="1" to-layer="1591" to-port="0" />
|
|
<edge from-layer="1590" from-port="0" to-layer="1591" to-port="1" />
|
|
<edge from-layer="1591" from-port="2" to-layer="1592" to-port="1" />
|
|
<edge from-layer="1592" from-port="2" to-layer="1594" to-port="0" />
|
|
<edge from-layer="1593" from-port="0" to-layer="1594" to-port="1" />
|
|
<edge from-layer="1594" from-port="2" to-layer="1595" to-port="0" />
|
|
<edge from-layer="1595" from-port="2" to-layer="1597" to-port="0" />
|
|
<edge from-layer="1596" from-port="0" to-layer="1597" to-port="1" />
|
|
<edge from-layer="1597" from-port="2" to-layer="1599" to-port="0" />
|
|
<edge from-layer="1598" from-port="0" to-layer="1599" to-port="1" />
|
|
<edge from-layer="1599" from-port="2" to-layer="1601" to-port="0" />
|
|
<edge from-layer="1600" from-port="0" to-layer="1601" to-port="1" />
|
|
<edge from-layer="1601" from-port="2" to-layer="1603" to-port="0" />
|
|
<edge from-layer="1601" from-port="2" to-layer="1631" to-port="1" />
|
|
<edge from-layer="1602" from-port="0" to-layer="1603" to-port="1" />
|
|
<edge from-layer="1603" from-port="2" to-layer="1608" to-port="0" />
|
|
<edge from-layer="1604" from-port="0" to-layer="1608" to-port="1" />
|
|
<edge from-layer="1605" from-port="0" to-layer="1608" to-port="2" />
|
|
<edge from-layer="1606" from-port="0" to-layer="1608" to-port="3" />
|
|
<edge from-layer="1607" from-port="0" to-layer="1608" to-port="4" />
|
|
<edge from-layer="1608" from-port="5" to-layer="1613" to-port="0" />
|
|
<edge from-layer="1609" from-port="0" to-layer="1610" to-port="0" />
|
|
<edge from-layer="1610" from-port="1" to-layer="1612" to-port="0" />
|
|
<edge from-layer="1611" from-port="0" to-layer="1612" to-port="1" />
|
|
<edge from-layer="1612" from-port="2" to-layer="1613" to-port="1" />
|
|
<edge from-layer="1613" from-port="2" to-layer="1615" to-port="0" />
|
|
<edge from-layer="1614" from-port="0" to-layer="1615" to-port="1" />
|
|
<edge from-layer="1615" from-port="2" to-layer="1616" to-port="0" />
|
|
<edge from-layer="1616" from-port="1" to-layer="1618" to-port="0" />
|
|
<edge from-layer="1617" from-port="0" to-layer="1618" to-port="1" />
|
|
<edge from-layer="1618" from-port="2" to-layer="1623" to-port="0" />
|
|
<edge from-layer="1619" from-port="0" to-layer="1623" to-port="1" />
|
|
<edge from-layer="1620" from-port="0" to-layer="1623" to-port="2" />
|
|
<edge from-layer="1621" from-port="0" to-layer="1623" to-port="3" />
|
|
<edge from-layer="1622" from-port="0" to-layer="1623" to-port="4" />
|
|
<edge from-layer="1623" from-port="5" to-layer="1628" to-port="0" />
|
|
<edge from-layer="1624" from-port="0" to-layer="1625" to-port="0" />
|
|
<edge from-layer="1625" from-port="1" to-layer="1627" to-port="0" />
|
|
<edge from-layer="1626" from-port="0" to-layer="1627" to-port="1" />
|
|
<edge from-layer="1627" from-port="2" to-layer="1628" to-port="1" />
|
|
<edge from-layer="1628" from-port="2" to-layer="1630" to-port="0" />
|
|
<edge from-layer="1629" from-port="0" to-layer="1630" to-port="1" />
|
|
<edge from-layer="1630" from-port="2" to-layer="1631" to-port="0" />
|
|
<edge from-layer="1631" from-port="2" to-layer="1633" to-port="0" />
|
|
<edge from-layer="1632" from-port="0" to-layer="1633" to-port="1" />
|
|
<edge from-layer="1633" from-port="2" to-layer="1635" to-port="0" />
|
|
<edge from-layer="1634" from-port="0" to-layer="1635" to-port="1" />
|
|
<edge from-layer="1635" from-port="2" to-layer="1637" to-port="0" />
|
|
<edge from-layer="1636" from-port="0" to-layer="1637" to-port="1" />
|
|
<edge from-layer="1637" from-port="2" to-layer="1639" to-port="0" />
|
|
<edge from-layer="1637" from-port="2" to-layer="1707" to-port="1" />
|
|
<edge from-layer="1638" from-port="0" to-layer="1639" to-port="1" />
|
|
<edge from-layer="1639" from-port="2" to-layer="1644" to-port="0" />
|
|
<edge from-layer="1640" from-port="0" to-layer="1644" to-port="1" />
|
|
<edge from-layer="1641" from-port="0" to-layer="1644" to-port="2" />
|
|
<edge from-layer="1642" from-port="0" to-layer="1644" to-port="3" />
|
|
<edge from-layer="1643" from-port="0" to-layer="1644" to-port="4" />
|
|
<edge from-layer="1644" from-port="5" to-layer="1649" to-port="0" />
|
|
<edge from-layer="1644" from-port="5" to-layer="1665" to-port="0" />
|
|
<edge from-layer="1644" from-port="5" to-layer="1681" to-port="0" />
|
|
<edge from-layer="1645" from-port="0" to-layer="1646" to-port="0" />
|
|
<edge from-layer="1646" from-port="1" to-layer="1648" to-port="0" />
|
|
<edge from-layer="1647" from-port="0" to-layer="1648" to-port="1" />
|
|
<edge from-layer="1648" from-port="2" to-layer="1649" to-port="1" />
|
|
<edge from-layer="1649" from-port="2" to-layer="1651" to-port="0" />
|
|
<edge from-layer="1650" from-port="0" to-layer="1651" to-port="1" />
|
|
<edge from-layer="1651" from-port="2" to-layer="1656" to-port="0" />
|
|
<edge from-layer="1652" from-port="0" to-layer="1656" to-port="1" />
|
|
<edge from-layer="1653" from-port="0" to-layer="1656" to-port="2" />
|
|
<edge from-layer="1654" from-port="0" to-layer="1656" to-port="3" />
|
|
<edge from-layer="1655" from-port="0" to-layer="1656" to-port="4" />
|
|
<edge from-layer="1656" from-port="5" to-layer="1658" to-port="0" />
|
|
<edge from-layer="1657" from-port="0" to-layer="1658" to-port="1" />
|
|
<edge from-layer="1658" from-port="2" to-layer="1660" to-port="0" />
|
|
<edge from-layer="1659" from-port="0" to-layer="1660" to-port="1" />
|
|
<edge from-layer="1660" from-port="2" to-layer="1688" to-port="0" />
|
|
<edge from-layer="1661" from-port="0" to-layer="1662" to-port="0" />
|
|
<edge from-layer="1662" from-port="1" to-layer="1664" to-port="0" />
|
|
<edge from-layer="1663" from-port="0" to-layer="1664" to-port="1" />
|
|
<edge from-layer="1664" from-port="2" to-layer="1665" to-port="1" />
|
|
<edge from-layer="1665" from-port="2" to-layer="1667" to-port="0" />
|
|
<edge from-layer="1666" from-port="0" to-layer="1667" to-port="1" />
|
|
<edge from-layer="1667" from-port="2" to-layer="1672" to-port="0" />
|
|
<edge from-layer="1668" from-port="0" to-layer="1672" to-port="1" />
|
|
<edge from-layer="1669" from-port="0" to-layer="1672" to-port="2" />
|
|
<edge from-layer="1670" from-port="0" to-layer="1672" to-port="3" />
|
|
<edge from-layer="1671" from-port="0" to-layer="1672" to-port="4" />
|
|
<edge from-layer="1672" from-port="5" to-layer="1674" to-port="0" />
|
|
<edge from-layer="1673" from-port="0" to-layer="1674" to-port="1" />
|
|
<edge from-layer="1674" from-port="2" to-layer="1676" to-port="0" />
|
|
<edge from-layer="1675" from-port="0" to-layer="1676" to-port="1" />
|
|
<edge from-layer="1676" from-port="2" to-layer="1688" to-port="1" />
|
|
<edge from-layer="1677" from-port="0" to-layer="1678" to-port="0" />
|
|
<edge from-layer="1678" from-port="1" to-layer="1680" to-port="0" />
|
|
<edge from-layer="1679" from-port="0" to-layer="1680" to-port="1" />
|
|
<edge from-layer="1680" from-port="2" to-layer="1681" to-port="1" />
|
|
<edge from-layer="1681" from-port="2" to-layer="1683" to-port="0" />
|
|
<edge from-layer="1682" from-port="0" to-layer="1683" to-port="1" />
|
|
<edge from-layer="1683" from-port="2" to-layer="1685" to-port="0" />
|
|
<edge from-layer="1684" from-port="0" to-layer="1685" to-port="1" />
|
|
<edge from-layer="1685" from-port="2" to-layer="1687" to-port="0" />
|
|
<edge from-layer="1686" from-port="0" to-layer="1687" to-port="1" />
|
|
<edge from-layer="1687" from-port="2" to-layer="1688" to-port="2" />
|
|
<edge from-layer="1688" from-port="4" to-layer="1690" to-port="0" />
|
|
<edge from-layer="1689" from-port="0" to-layer="1690" to-port="1" />
|
|
<edge from-layer="1690" from-port="2" to-layer="1692" to-port="0" />
|
|
<edge from-layer="1691" from-port="0" to-layer="1692" to-port="1" />
|
|
<edge from-layer="1692" from-port="2" to-layer="1694" to-port="0" />
|
|
<edge from-layer="1693" from-port="0" to-layer="1694" to-port="1" />
|
|
<edge from-layer="1694" from-port="2" to-layer="1699" to-port="0" />
|
|
<edge from-layer="1695" from-port="0" to-layer="1699" to-port="1" />
|
|
<edge from-layer="1696" from-port="0" to-layer="1699" to-port="2" />
|
|
<edge from-layer="1697" from-port="0" to-layer="1699" to-port="3" />
|
|
<edge from-layer="1698" from-port="0" to-layer="1699" to-port="4" />
|
|
<edge from-layer="1699" from-port="5" to-layer="1704" to-port="0" />
|
|
<edge from-layer="1700" from-port="0" to-layer="1701" to-port="0" />
|
|
<edge from-layer="1701" from-port="1" to-layer="1703" to-port="0" />
|
|
<edge from-layer="1702" from-port="0" to-layer="1703" to-port="1" />
|
|
<edge from-layer="1703" from-port="2" to-layer="1704" to-port="1" />
|
|
<edge from-layer="1704" from-port="2" to-layer="1706" to-port="0" />
|
|
<edge from-layer="1705" from-port="0" to-layer="1706" to-port="1" />
|
|
<edge from-layer="1706" from-port="2" to-layer="1707" to-port="0" />
|
|
<edge from-layer="1707" from-port="2" to-layer="1709" to-port="0" />
|
|
<edge from-layer="1708" from-port="0" to-layer="1709" to-port="1" />
|
|
<edge from-layer="1709" from-port="2" to-layer="1711" to-port="0" />
|
|
<edge from-layer="1710" from-port="0" to-layer="1711" to-port="1" />
|
|
<edge from-layer="1711" from-port="2" to-layer="1713" to-port="0" />
|
|
<edge from-layer="1712" from-port="0" to-layer="1713" to-port="1" />
|
|
<edge from-layer="1713" from-port="2" to-layer="1715" to-port="0" />
|
|
<edge from-layer="1713" from-port="2" to-layer="1743" to-port="1" />
|
|
<edge from-layer="1714" from-port="0" to-layer="1715" to-port="1" />
|
|
<edge from-layer="1715" from-port="2" to-layer="1720" to-port="0" />
|
|
<edge from-layer="1716" from-port="0" to-layer="1720" to-port="1" />
|
|
<edge from-layer="1717" from-port="0" to-layer="1720" to-port="2" />
|
|
<edge from-layer="1718" from-port="0" to-layer="1720" to-port="3" />
|
|
<edge from-layer="1719" from-port="0" to-layer="1720" to-port="4" />
|
|
<edge from-layer="1720" from-port="5" to-layer="1725" to-port="0" />
|
|
<edge from-layer="1721" from-port="0" to-layer="1722" to-port="0" />
|
|
<edge from-layer="1722" from-port="1" to-layer="1724" to-port="0" />
|
|
<edge from-layer="1723" from-port="0" to-layer="1724" to-port="1" />
|
|
<edge from-layer="1724" from-port="2" to-layer="1725" to-port="1" />
|
|
<edge from-layer="1725" from-port="2" to-layer="1727" to-port="0" />
|
|
<edge from-layer="1726" from-port="0" to-layer="1727" to-port="1" />
|
|
<edge from-layer="1727" from-port="2" to-layer="1728" to-port="0" />
|
|
<edge from-layer="1728" from-port="1" to-layer="1730" to-port="0" />
|
|
<edge from-layer="1729" from-port="0" to-layer="1730" to-port="1" />
|
|
<edge from-layer="1730" from-port="2" to-layer="1735" to-port="0" />
|
|
<edge from-layer="1731" from-port="0" to-layer="1735" to-port="1" />
|
|
<edge from-layer="1732" from-port="0" to-layer="1735" to-port="2" />
|
|
<edge from-layer="1733" from-port="0" to-layer="1735" to-port="3" />
|
|
<edge from-layer="1734" from-port="0" to-layer="1735" to-port="4" />
|
|
<edge from-layer="1735" from-port="5" to-layer="1740" to-port="0" />
|
|
<edge from-layer="1736" from-port="0" to-layer="1737" to-port="0" />
|
|
<edge from-layer="1737" from-port="1" to-layer="1739" to-port="0" />
|
|
<edge from-layer="1738" from-port="0" to-layer="1739" to-port="1" />
|
|
<edge from-layer="1739" from-port="2" to-layer="1740" to-port="1" />
|
|
<edge from-layer="1740" from-port="2" to-layer="1742" to-port="0" />
|
|
<edge from-layer="1741" from-port="0" to-layer="1742" to-port="1" />
|
|
<edge from-layer="1742" from-port="2" to-layer="1743" to-port="0" />
|
|
<edge from-layer="1743" from-port="2" to-layer="1745" to-port="0" />
|
|
<edge from-layer="1744" from-port="0" to-layer="1745" to-port="1" />
|
|
<edge from-layer="1745" from-port="2" to-layer="1747" to-port="0" />
|
|
<edge from-layer="1746" from-port="0" to-layer="1747" to-port="1" />
|
|
<edge from-layer="1747" from-port="2" to-layer="1749" to-port="0" />
|
|
<edge from-layer="1748" from-port="0" to-layer="1749" to-port="1" />
|
|
<edge from-layer="1749" from-port="2" to-layer="1819" to-port="1" />
|
|
<edge from-layer="1749" from-port="2" to-layer="1751" to-port="0" />
|
|
<edge from-layer="1750" from-port="0" to-layer="1751" to-port="1" />
|
|
<edge from-layer="1751" from-port="2" to-layer="1756" to-port="0" />
|
|
<edge from-layer="1752" from-port="0" to-layer="1756" to-port="1" />
|
|
<edge from-layer="1753" from-port="0" to-layer="1756" to-port="2" />
|
|
<edge from-layer="1754" from-port="0" to-layer="1756" to-port="3" />
|
|
<edge from-layer="1755" from-port="0" to-layer="1756" to-port="4" />
|
|
<edge from-layer="1756" from-port="5" to-layer="1777" to-port="0" />
|
|
<edge from-layer="1756" from-port="5" to-layer="1761" to-port="0" />
|
|
<edge from-layer="1756" from-port="5" to-layer="1793" to-port="0" />
|
|
<edge from-layer="1757" from-port="0" to-layer="1758" to-port="0" />
|
|
<edge from-layer="1758" from-port="1" to-layer="1760" to-port="0" />
|
|
<edge from-layer="1759" from-port="0" to-layer="1760" to-port="1" />
|
|
<edge from-layer="1760" from-port="2" to-layer="1761" to-port="1" />
|
|
<edge from-layer="1761" from-port="2" to-layer="1763" to-port="0" />
|
|
<edge from-layer="1762" from-port="0" to-layer="1763" to-port="1" />
|
|
<edge from-layer="1763" from-port="2" to-layer="1768" to-port="0" />
|
|
<edge from-layer="1764" from-port="0" to-layer="1768" to-port="1" />
|
|
<edge from-layer="1765" from-port="0" to-layer="1768" to-port="2" />
|
|
<edge from-layer="1766" from-port="0" to-layer="1768" to-port="3" />
|
|
<edge from-layer="1767" from-port="0" to-layer="1768" to-port="4" />
|
|
<edge from-layer="1768" from-port="5" to-layer="1770" to-port="0" />
|
|
<edge from-layer="1769" from-port="0" to-layer="1770" to-port="1" />
|
|
<edge from-layer="1770" from-port="2" to-layer="1772" to-port="0" />
|
|
<edge from-layer="1771" from-port="0" to-layer="1772" to-port="1" />
|
|
<edge from-layer="1772" from-port="2" to-layer="1800" to-port="0" />
|
|
<edge from-layer="1773" from-port="0" to-layer="1774" to-port="0" />
|
|
<edge from-layer="1774" from-port="1" to-layer="1776" to-port="0" />
|
|
<edge from-layer="1775" from-port="0" to-layer="1776" to-port="1" />
|
|
<edge from-layer="1776" from-port="2" to-layer="1777" to-port="1" />
|
|
<edge from-layer="1777" from-port="2" to-layer="1779" to-port="0" />
|
|
<edge from-layer="1778" from-port="0" to-layer="1779" to-port="1" />
|
|
<edge from-layer="1779" from-port="2" to-layer="1784" to-port="0" />
|
|
<edge from-layer="1780" from-port="0" to-layer="1784" to-port="1" />
|
|
<edge from-layer="1781" from-port="0" to-layer="1784" to-port="2" />
|
|
<edge from-layer="1782" from-port="0" to-layer="1784" to-port="3" />
|
|
<edge from-layer="1783" from-port="0" to-layer="1784" to-port="4" />
|
|
<edge from-layer="1784" from-port="5" to-layer="1786" to-port="0" />
|
|
<edge from-layer="1785" from-port="0" to-layer="1786" to-port="1" />
|
|
<edge from-layer="1786" from-port="2" to-layer="1788" to-port="0" />
|
|
<edge from-layer="1787" from-port="0" to-layer="1788" to-port="1" />
|
|
<edge from-layer="1788" from-port="2" to-layer="1800" to-port="1" />
|
|
<edge from-layer="1789" from-port="0" to-layer="1790" to-port="0" />
|
|
<edge from-layer="1790" from-port="1" to-layer="1792" to-port="0" />
|
|
<edge from-layer="1791" from-port="0" to-layer="1792" to-port="1" />
|
|
<edge from-layer="1792" from-port="2" to-layer="1793" to-port="1" />
|
|
<edge from-layer="1793" from-port="2" to-layer="1795" to-port="0" />
|
|
<edge from-layer="1794" from-port="0" to-layer="1795" to-port="1" />
|
|
<edge from-layer="1795" from-port="2" to-layer="1797" to-port="0" />
|
|
<edge from-layer="1796" from-port="0" to-layer="1797" to-port="1" />
|
|
<edge from-layer="1797" from-port="2" to-layer="1799" to-port="0" />
|
|
<edge from-layer="1798" from-port="0" to-layer="1799" to-port="1" />
|
|
<edge from-layer="1799" from-port="2" to-layer="1800" to-port="2" />
|
|
<edge from-layer="1800" from-port="4" to-layer="1802" to-port="0" />
|
|
<edge from-layer="1801" from-port="0" to-layer="1802" to-port="1" />
|
|
<edge from-layer="1802" from-port="2" to-layer="1804" to-port="0" />
|
|
<edge from-layer="1803" from-port="0" to-layer="1804" to-port="1" />
|
|
<edge from-layer="1804" from-port="2" to-layer="1806" to-port="0" />
|
|
<edge from-layer="1805" from-port="0" to-layer="1806" to-port="1" />
|
|
<edge from-layer="1806" from-port="2" to-layer="1811" to-port="0" />
|
|
<edge from-layer="1807" from-port="0" to-layer="1811" to-port="1" />
|
|
<edge from-layer="1808" from-port="0" to-layer="1811" to-port="2" />
|
|
<edge from-layer="1809" from-port="0" to-layer="1811" to-port="3" />
|
|
<edge from-layer="1810" from-port="0" to-layer="1811" to-port="4" />
|
|
<edge from-layer="1811" from-port="5" to-layer="1816" to-port="0" />
|
|
<edge from-layer="1812" from-port="0" to-layer="1813" to-port="0" />
|
|
<edge from-layer="1813" from-port="1" to-layer="1815" to-port="0" />
|
|
<edge from-layer="1814" from-port="0" to-layer="1815" to-port="1" />
|
|
<edge from-layer="1815" from-port="2" to-layer="1816" to-port="1" />
|
|
<edge from-layer="1816" from-port="2" to-layer="1818" to-port="0" />
|
|
<edge from-layer="1817" from-port="0" to-layer="1818" to-port="1" />
|
|
<edge from-layer="1818" from-port="2" to-layer="1819" to-port="0" />
|
|
<edge from-layer="1819" from-port="2" to-layer="1821" to-port="0" />
|
|
<edge from-layer="1820" from-port="0" to-layer="1821" to-port="1" />
|
|
<edge from-layer="1821" from-port="2" to-layer="1823" to-port="0" />
|
|
<edge from-layer="1822" from-port="0" to-layer="1823" to-port="1" />
|
|
<edge from-layer="1823" from-port="2" to-layer="1825" to-port="0" />
|
|
<edge from-layer="1824" from-port="0" to-layer="1825" to-port="1" />
|
|
<edge from-layer="1825" from-port="2" to-layer="1827" to-port="0" />
|
|
<edge from-layer="1825" from-port="2" to-layer="1855" to-port="1" />
|
|
<edge from-layer="1826" from-port="0" to-layer="1827" to-port="1" />
|
|
<edge from-layer="1827" from-port="2" to-layer="1832" to-port="0" />
|
|
<edge from-layer="1828" from-port="0" to-layer="1832" to-port="1" />
|
|
<edge from-layer="1829" from-port="0" to-layer="1832" to-port="2" />
|
|
<edge from-layer="1830" from-port="0" to-layer="1832" to-port="3" />
|
|
<edge from-layer="1831" from-port="0" to-layer="1832" to-port="4" />
|
|
<edge from-layer="1832" from-port="5" to-layer="1837" to-port="0" />
|
|
<edge from-layer="1833" from-port="0" to-layer="1834" to-port="0" />
|
|
<edge from-layer="1834" from-port="1" to-layer="1836" to-port="0" />
|
|
<edge from-layer="1835" from-port="0" to-layer="1836" to-port="1" />
|
|
<edge from-layer="1836" from-port="2" to-layer="1837" to-port="1" />
|
|
<edge from-layer="1837" from-port="2" to-layer="1839" to-port="0" />
|
|
<edge from-layer="1838" from-port="0" to-layer="1839" to-port="1" />
|
|
<edge from-layer="1839" from-port="2" to-layer="1840" to-port="0" />
|
|
<edge from-layer="1840" from-port="1" to-layer="1842" to-port="0" />
|
|
<edge from-layer="1841" from-port="0" to-layer="1842" to-port="1" />
|
|
<edge from-layer="1842" from-port="2" to-layer="1847" to-port="0" />
|
|
<edge from-layer="1843" from-port="0" to-layer="1847" to-port="1" />
|
|
<edge from-layer="1844" from-port="0" to-layer="1847" to-port="2" />
|
|
<edge from-layer="1845" from-port="0" to-layer="1847" to-port="3" />
|
|
<edge from-layer="1846" from-port="0" to-layer="1847" to-port="4" />
|
|
<edge from-layer="1847" from-port="5" to-layer="1852" to-port="0" />
|
|
<edge from-layer="1848" from-port="0" to-layer="1849" to-port="0" />
|
|
<edge from-layer="1849" from-port="1" to-layer="1851" to-port="0" />
|
|
<edge from-layer="1850" from-port="0" to-layer="1851" to-port="1" />
|
|
<edge from-layer="1851" from-port="2" to-layer="1852" to-port="1" />
|
|
<edge from-layer="1852" from-port="2" to-layer="1854" to-port="0" />
|
|
<edge from-layer="1853" from-port="0" to-layer="1854" to-port="1" />
|
|
<edge from-layer="1854" from-port="2" to-layer="1855" to-port="0" />
|
|
<edge from-layer="1855" from-port="2" to-layer="1857" to-port="0" />
|
|
<edge from-layer="1856" from-port="0" to-layer="1857" to-port="1" />
|
|
<edge from-layer="1857" from-port="2" to-layer="1859" to-port="0" />
|
|
<edge from-layer="1858" from-port="0" to-layer="1859" to-port="1" />
|
|
<edge from-layer="1859" from-port="2" to-layer="1861" to-port="0" />
|
|
<edge from-layer="1860" from-port="0" to-layer="1861" to-port="1" />
|
|
<edge from-layer="1861" from-port="2" to-layer="1863" to-port="0" />
|
|
<edge from-layer="1861" from-port="2" to-layer="1931" to-port="1" />
|
|
<edge from-layer="1862" from-port="0" to-layer="1863" to-port="1" />
|
|
<edge from-layer="1863" from-port="2" to-layer="1868" to-port="0" />
|
|
<edge from-layer="1864" from-port="0" to-layer="1868" to-port="1" />
|
|
<edge from-layer="1865" from-port="0" to-layer="1868" to-port="2" />
|
|
<edge from-layer="1866" from-port="0" to-layer="1868" to-port="3" />
|
|
<edge from-layer="1867" from-port="0" to-layer="1868" to-port="4" />
|
|
<edge from-layer="1868" from-port="5" to-layer="1873" to-port="0" />
|
|
<edge from-layer="1868" from-port="5" to-layer="1889" to-port="0" />
|
|
<edge from-layer="1868" from-port="5" to-layer="1905" to-port="0" />
|
|
<edge from-layer="1869" from-port="0" to-layer="1870" to-port="0" />
|
|
<edge from-layer="1870" from-port="1" to-layer="1872" to-port="0" />
|
|
<edge from-layer="1871" from-port="0" to-layer="1872" to-port="1" />
|
|
<edge from-layer="1872" from-port="2" to-layer="1873" to-port="1" />
|
|
<edge from-layer="1873" from-port="2" to-layer="1875" to-port="0" />
|
|
<edge from-layer="1874" from-port="0" to-layer="1875" to-port="1" />
|
|
<edge from-layer="1875" from-port="2" to-layer="1880" to-port="0" />
|
|
<edge from-layer="1876" from-port="0" to-layer="1880" to-port="1" />
|
|
<edge from-layer="1877" from-port="0" to-layer="1880" to-port="2" />
|
|
<edge from-layer="1878" from-port="0" to-layer="1880" to-port="3" />
|
|
<edge from-layer="1879" from-port="0" to-layer="1880" to-port="4" />
|
|
<edge from-layer="1880" from-port="5" to-layer="1882" to-port="0" />
|
|
<edge from-layer="1881" from-port="0" to-layer="1882" to-port="1" />
|
|
<edge from-layer="1882" from-port="2" to-layer="1884" to-port="0" />
|
|
<edge from-layer="1883" from-port="0" to-layer="1884" to-port="1" />
|
|
<edge from-layer="1884" from-port="2" to-layer="1912" to-port="0" />
|
|
<edge from-layer="1885" from-port="0" to-layer="1886" to-port="0" />
|
|
<edge from-layer="1886" from-port="1" to-layer="1888" to-port="0" />
|
|
<edge from-layer="1887" from-port="0" to-layer="1888" to-port="1" />
|
|
<edge from-layer="1888" from-port="2" to-layer="1889" to-port="1" />
|
|
<edge from-layer="1889" from-port="2" to-layer="1891" to-port="0" />
|
|
<edge from-layer="1890" from-port="0" to-layer="1891" to-port="1" />
|
|
<edge from-layer="1891" from-port="2" to-layer="1896" to-port="0" />
|
|
<edge from-layer="1892" from-port="0" to-layer="1896" to-port="1" />
|
|
<edge from-layer="1893" from-port="0" to-layer="1896" to-port="2" />
|
|
<edge from-layer="1894" from-port="0" to-layer="1896" to-port="3" />
|
|
<edge from-layer="1895" from-port="0" to-layer="1896" to-port="4" />
|
|
<edge from-layer="1896" from-port="5" to-layer="1898" to-port="0" />
|
|
<edge from-layer="1897" from-port="0" to-layer="1898" to-port="1" />
|
|
<edge from-layer="1898" from-port="2" to-layer="1900" to-port="0" />
|
|
<edge from-layer="1899" from-port="0" to-layer="1900" to-port="1" />
|
|
<edge from-layer="1900" from-port="2" to-layer="1912" to-port="1" />
|
|
<edge from-layer="1901" from-port="0" to-layer="1902" to-port="0" />
|
|
<edge from-layer="1902" from-port="1" to-layer="1904" to-port="0" />
|
|
<edge from-layer="1903" from-port="0" to-layer="1904" to-port="1" />
|
|
<edge from-layer="1904" from-port="2" to-layer="1905" to-port="1" />
|
|
<edge from-layer="1905" from-port="2" to-layer="1907" to-port="0" />
|
|
<edge from-layer="1906" from-port="0" to-layer="1907" to-port="1" />
|
|
<edge from-layer="1907" from-port="2" to-layer="1909" to-port="0" />
|
|
<edge from-layer="1908" from-port="0" to-layer="1909" to-port="1" />
|
|
<edge from-layer="1909" from-port="2" to-layer="1911" to-port="0" />
|
|
<edge from-layer="1910" from-port="0" to-layer="1911" to-port="1" />
|
|
<edge from-layer="1911" from-port="2" to-layer="1912" to-port="2" />
|
|
<edge from-layer="1912" from-port="4" to-layer="1914" to-port="0" />
|
|
<edge from-layer="1913" from-port="0" to-layer="1914" to-port="1" />
|
|
<edge from-layer="1914" from-port="2" to-layer="1916" to-port="0" />
|
|
<edge from-layer="1915" from-port="0" to-layer="1916" to-port="1" />
|
|
<edge from-layer="1916" from-port="2" to-layer="1918" to-port="0" />
|
|
<edge from-layer="1917" from-port="0" to-layer="1918" to-port="1" />
|
|
<edge from-layer="1918" from-port="2" to-layer="1923" to-port="0" />
|
|
<edge from-layer="1919" from-port="0" to-layer="1923" to-port="1" />
|
|
<edge from-layer="1920" from-port="0" to-layer="1923" to-port="2" />
|
|
<edge from-layer="1921" from-port="0" to-layer="1923" to-port="3" />
|
|
<edge from-layer="1922" from-port="0" to-layer="1923" to-port="4" />
|
|
<edge from-layer="1923" from-port="5" to-layer="1928" to-port="0" />
|
|
<edge from-layer="1924" from-port="0" to-layer="1925" to-port="0" />
|
|
<edge from-layer="1925" from-port="1" to-layer="1927" to-port="0" />
|
|
<edge from-layer="1926" from-port="0" to-layer="1927" to-port="1" />
|
|
<edge from-layer="1927" from-port="2" to-layer="1928" to-port="1" />
|
|
<edge from-layer="1928" from-port="2" to-layer="1930" to-port="0" />
|
|
<edge from-layer="1929" from-port="0" to-layer="1930" to-port="1" />
|
|
<edge from-layer="1930" from-port="2" to-layer="1931" to-port="0" />
|
|
<edge from-layer="1931" from-port="2" to-layer="1933" to-port="0" />
|
|
<edge from-layer="1932" from-port="0" to-layer="1933" to-port="1" />
|
|
<edge from-layer="1933" from-port="2" to-layer="1935" to-port="0" />
|
|
<edge from-layer="1934" from-port="0" to-layer="1935" to-port="1" />
|
|
<edge from-layer="1935" from-port="2" to-layer="1937" to-port="0" />
|
|
<edge from-layer="1936" from-port="0" to-layer="1937" to-port="1" />
|
|
<edge from-layer="1937" from-port="2" to-layer="1967" to-port="1" />
|
|
<edge from-layer="1937" from-port="2" to-layer="1939" to-port="0" />
|
|
<edge from-layer="1938" from-port="0" to-layer="1939" to-port="1" />
|
|
<edge from-layer="1939" from-port="2" to-layer="1944" to-port="0" />
|
|
<edge from-layer="1940" from-port="0" to-layer="1944" to-port="1" />
|
|
<edge from-layer="1941" from-port="0" to-layer="1944" to-port="2" />
|
|
<edge from-layer="1942" from-port="0" to-layer="1944" to-port="3" />
|
|
<edge from-layer="1943" from-port="0" to-layer="1944" to-port="4" />
|
|
<edge from-layer="1944" from-port="5" to-layer="1949" to-port="0" />
|
|
<edge from-layer="1945" from-port="0" to-layer="1946" to-port="0" />
|
|
<edge from-layer="1946" from-port="1" to-layer="1948" to-port="0" />
|
|
<edge from-layer="1947" from-port="0" to-layer="1948" to-port="1" />
|
|
<edge from-layer="1948" from-port="2" to-layer="1949" to-port="1" />
|
|
<edge from-layer="1949" from-port="2" to-layer="1951" to-port="0" />
|
|
<edge from-layer="1950" from-port="0" to-layer="1951" to-port="1" />
|
|
<edge from-layer="1951" from-port="2" to-layer="1952" to-port="0" />
|
|
<edge from-layer="1952" from-port="1" to-layer="1954" to-port="0" />
|
|
<edge from-layer="1953" from-port="0" to-layer="1954" to-port="1" />
|
|
<edge from-layer="1954" from-port="2" to-layer="1959" to-port="0" />
|
|
<edge from-layer="1955" from-port="0" to-layer="1959" to-port="1" />
|
|
<edge from-layer="1956" from-port="0" to-layer="1959" to-port="2" />
|
|
<edge from-layer="1957" from-port="0" to-layer="1959" to-port="3" />
|
|
<edge from-layer="1958" from-port="0" to-layer="1959" to-port="4" />
|
|
<edge from-layer="1959" from-port="5" to-layer="1964" to-port="0" />
|
|
<edge from-layer="1960" from-port="0" to-layer="1961" to-port="0" />
|
|
<edge from-layer="1961" from-port="1" to-layer="1963" to-port="0" />
|
|
<edge from-layer="1962" from-port="0" to-layer="1963" to-port="1" />
|
|
<edge from-layer="1963" from-port="2" to-layer="1964" to-port="1" />
|
|
<edge from-layer="1964" from-port="2" to-layer="1966" to-port="0" />
|
|
<edge from-layer="1965" from-port="0" to-layer="1966" to-port="1" />
|
|
<edge from-layer="1966" from-port="2" to-layer="1967" to-port="0" />
|
|
<edge from-layer="1967" from-port="2" to-layer="1969" to-port="0" />
|
|
<edge from-layer="1968" from-port="0" to-layer="1969" to-port="1" />
|
|
<edge from-layer="1969" from-port="2" to-layer="1971" to-port="0" />
|
|
<edge from-layer="1970" from-port="0" to-layer="1971" to-port="1" />
|
|
<edge from-layer="1971" from-port="2" to-layer="1973" to-port="0" />
|
|
<edge from-layer="1972" from-port="0" to-layer="1973" to-port="1" />
|
|
<edge from-layer="1973" from-port="2" to-layer="1975" to-port="0" />
|
|
<edge from-layer="1973" from-port="2" to-layer="2043" to-port="1" />
|
|
<edge from-layer="1974" from-port="0" to-layer="1975" to-port="1" />
|
|
<edge from-layer="1975" from-port="2" to-layer="1980" to-port="0" />
|
|
<edge from-layer="1976" from-port="0" to-layer="1980" to-port="1" />
|
|
<edge from-layer="1977" from-port="0" to-layer="1980" to-port="2" />
|
|
<edge from-layer="1978" from-port="0" to-layer="1980" to-port="3" />
|
|
<edge from-layer="1979" from-port="0" to-layer="1980" to-port="4" />
|
|
<edge from-layer="1980" from-port="5" to-layer="2001" to-port="0" />
|
|
<edge from-layer="1980" from-port="5" to-layer="2017" to-port="0" />
|
|
<edge from-layer="1980" from-port="5" to-layer="1985" to-port="0" />
|
|
<edge from-layer="1981" from-port="0" to-layer="1982" to-port="0" />
|
|
<edge from-layer="1982" from-port="1" to-layer="1984" to-port="0" />
|
|
<edge from-layer="1983" from-port="0" to-layer="1984" to-port="1" />
|
|
<edge from-layer="1984" from-port="2" to-layer="1985" to-port="1" />
|
|
<edge from-layer="1985" from-port="2" to-layer="1987" to-port="0" />
|
|
<edge from-layer="1986" from-port="0" to-layer="1987" to-port="1" />
|
|
<edge from-layer="1987" from-port="2" to-layer="1992" to-port="0" />
|
|
<edge from-layer="1988" from-port="0" to-layer="1992" to-port="1" />
|
|
<edge from-layer="1989" from-port="0" to-layer="1992" to-port="2" />
|
|
<edge from-layer="1990" from-port="0" to-layer="1992" to-port="3" />
|
|
<edge from-layer="1991" from-port="0" to-layer="1992" to-port="4" />
|
|
<edge from-layer="1992" from-port="5" to-layer="1994" to-port="0" />
|
|
<edge from-layer="1993" from-port="0" to-layer="1994" to-port="1" />
|
|
<edge from-layer="1994" from-port="2" to-layer="1996" to-port="0" />
|
|
<edge from-layer="1995" from-port="0" to-layer="1996" to-port="1" />
|
|
<edge from-layer="1996" from-port="2" to-layer="2024" to-port="0" />
|
|
<edge from-layer="1997" from-port="0" to-layer="1998" to-port="0" />
|
|
<edge from-layer="1998" from-port="1" to-layer="2000" to-port="0" />
|
|
<edge from-layer="1999" from-port="0" to-layer="2000" to-port="1" />
|
|
<edge from-layer="2000" from-port="2" to-layer="2001" to-port="1" />
|
|
<edge from-layer="2001" from-port="2" to-layer="2003" to-port="0" />
|
|
<edge from-layer="2002" from-port="0" to-layer="2003" to-port="1" />
|
|
<edge from-layer="2003" from-port="2" to-layer="2008" to-port="0" />
|
|
<edge from-layer="2004" from-port="0" to-layer="2008" to-port="1" />
|
|
<edge from-layer="2005" from-port="0" to-layer="2008" to-port="2" />
|
|
<edge from-layer="2006" from-port="0" to-layer="2008" to-port="3" />
|
|
<edge from-layer="2007" from-port="0" to-layer="2008" to-port="4" />
|
|
<edge from-layer="2008" from-port="5" to-layer="2010" to-port="0" />
|
|
<edge from-layer="2009" from-port="0" to-layer="2010" to-port="1" />
|
|
<edge from-layer="2010" from-port="2" to-layer="2012" to-port="0" />
|
|
<edge from-layer="2011" from-port="0" to-layer="2012" to-port="1" />
|
|
<edge from-layer="2012" from-port="2" to-layer="2024" to-port="1" />
|
|
<edge from-layer="2013" from-port="0" to-layer="2014" to-port="0" />
|
|
<edge from-layer="2014" from-port="1" to-layer="2016" to-port="0" />
|
|
<edge from-layer="2015" from-port="0" to-layer="2016" to-port="1" />
|
|
<edge from-layer="2016" from-port="2" to-layer="2017" to-port="1" />
|
|
<edge from-layer="2017" from-port="2" to-layer="2019" to-port="0" />
|
|
<edge from-layer="2018" from-port="0" to-layer="2019" to-port="1" />
|
|
<edge from-layer="2019" from-port="2" to-layer="2021" to-port="0" />
|
|
<edge from-layer="2020" from-port="0" to-layer="2021" to-port="1" />
|
|
<edge from-layer="2021" from-port="2" to-layer="2023" to-port="0" />
|
|
<edge from-layer="2022" from-port="0" to-layer="2023" to-port="1" />
|
|
<edge from-layer="2023" from-port="2" to-layer="2024" to-port="2" />
|
|
<edge from-layer="2024" from-port="4" to-layer="2026" to-port="0" />
|
|
<edge from-layer="2025" from-port="0" to-layer="2026" to-port="1" />
|
|
<edge from-layer="2026" from-port="2" to-layer="2028" to-port="0" />
|
|
<edge from-layer="2027" from-port="0" to-layer="2028" to-port="1" />
|
|
<edge from-layer="2028" from-port="2" to-layer="2030" to-port="0" />
|
|
<edge from-layer="2029" from-port="0" to-layer="2030" to-port="1" />
|
|
<edge from-layer="2030" from-port="2" to-layer="2035" to-port="0" />
|
|
<edge from-layer="2031" from-port="0" to-layer="2035" to-port="1" />
|
|
<edge from-layer="2032" from-port="0" to-layer="2035" to-port="2" />
|
|
<edge from-layer="2033" from-port="0" to-layer="2035" to-port="3" />
|
|
<edge from-layer="2034" from-port="0" to-layer="2035" to-port="4" />
|
|
<edge from-layer="2035" from-port="5" to-layer="2040" to-port="0" />
|
|
<edge from-layer="2036" from-port="0" to-layer="2037" to-port="0" />
|
|
<edge from-layer="2037" from-port="1" to-layer="2039" to-port="0" />
|
|
<edge from-layer="2038" from-port="0" to-layer="2039" to-port="1" />
|
|
<edge from-layer="2039" from-port="2" to-layer="2040" to-port="1" />
|
|
<edge from-layer="2040" from-port="2" to-layer="2042" to-port="0" />
|
|
<edge from-layer="2041" from-port="0" to-layer="2042" to-port="1" />
|
|
<edge from-layer="2042" from-port="2" to-layer="2043" to-port="0" />
|
|
<edge from-layer="2043" from-port="2" to-layer="2045" to-port="0" />
|
|
<edge from-layer="2044" from-port="0" to-layer="2045" to-port="1" />
|
|
<edge from-layer="2045" from-port="2" to-layer="2047" to-port="0" />
|
|
<edge from-layer="2046" from-port="0" to-layer="2047" to-port="1" />
|
|
<edge from-layer="2047" from-port="2" to-layer="2049" to-port="0" />
|
|
<edge from-layer="2048" from-port="0" to-layer="2049" to-port="1" />
|
|
<edge from-layer="2049" from-port="2" to-layer="2079" to-port="1" />
|
|
<edge from-layer="2049" from-port="2" to-layer="2051" to-port="0" />
|
|
<edge from-layer="2050" from-port="0" to-layer="2051" to-port="1" />
|
|
<edge from-layer="2051" from-port="2" to-layer="2056" to-port="0" />
|
|
<edge from-layer="2052" from-port="0" to-layer="2056" to-port="1" />
|
|
<edge from-layer="2053" from-port="0" to-layer="2056" to-port="2" />
|
|
<edge from-layer="2054" from-port="0" to-layer="2056" to-port="3" />
|
|
<edge from-layer="2055" from-port="0" to-layer="2056" to-port="4" />
|
|
<edge from-layer="2056" from-port="5" to-layer="2061" to-port="0" />
|
|
<edge from-layer="2057" from-port="0" to-layer="2058" to-port="0" />
|
|
<edge from-layer="2058" from-port="1" to-layer="2060" to-port="0" />
|
|
<edge from-layer="2059" from-port="0" to-layer="2060" to-port="1" />
|
|
<edge from-layer="2060" from-port="2" to-layer="2061" to-port="1" />
|
|
<edge from-layer="2061" from-port="2" to-layer="2063" to-port="0" />
|
|
<edge from-layer="2062" from-port="0" to-layer="2063" to-port="1" />
|
|
<edge from-layer="2063" from-port="2" to-layer="2064" to-port="0" />
|
|
<edge from-layer="2064" from-port="1" to-layer="2066" to-port="0" />
|
|
<edge from-layer="2065" from-port="0" to-layer="2066" to-port="1" />
|
|
<edge from-layer="2066" from-port="2" to-layer="2071" to-port="0" />
|
|
<edge from-layer="2067" from-port="0" to-layer="2071" to-port="1" />
|
|
<edge from-layer="2068" from-port="0" to-layer="2071" to-port="2" />
|
|
<edge from-layer="2069" from-port="0" to-layer="2071" to-port="3" />
|
|
<edge from-layer="2070" from-port="0" to-layer="2071" to-port="4" />
|
|
<edge from-layer="2071" from-port="5" to-layer="2076" to-port="0" />
|
|
<edge from-layer="2072" from-port="0" to-layer="2073" to-port="0" />
|
|
<edge from-layer="2073" from-port="1" to-layer="2075" to-port="0" />
|
|
<edge from-layer="2074" from-port="0" to-layer="2075" to-port="1" />
|
|
<edge from-layer="2075" from-port="2" to-layer="2076" to-port="1" />
|
|
<edge from-layer="2076" from-port="2" to-layer="2078" to-port="0" />
|
|
<edge from-layer="2077" from-port="0" to-layer="2078" to-port="1" />
|
|
<edge from-layer="2078" from-port="2" to-layer="2079" to-port="0" />
|
|
<edge from-layer="2079" from-port="2" to-layer="2081" to-port="0" />
|
|
<edge from-layer="2080" from-port="0" to-layer="2081" to-port="1" />
|
|
<edge from-layer="2081" from-port="2" to-layer="2083" to-port="0" />
|
|
<edge from-layer="2082" from-port="0" to-layer="2083" to-port="1" />
|
|
<edge from-layer="2083" from-port="2" to-layer="2085" to-port="0" />
|
|
<edge from-layer="2084" from-port="0" to-layer="2085" to-port="1" />
|
|
<edge from-layer="2085" from-port="2" to-layer="2155" to-port="1" />
|
|
<edge from-layer="2085" from-port="2" to-layer="2087" to-port="0" />
|
|
<edge from-layer="2086" from-port="0" to-layer="2087" to-port="1" />
|
|
<edge from-layer="2087" from-port="2" to-layer="2092" to-port="0" />
|
|
<edge from-layer="2088" from-port="0" to-layer="2092" to-port="1" />
|
|
<edge from-layer="2089" from-port="0" to-layer="2092" to-port="2" />
|
|
<edge from-layer="2090" from-port="0" to-layer="2092" to-port="3" />
|
|
<edge from-layer="2091" from-port="0" to-layer="2092" to-port="4" />
|
|
<edge from-layer="2092" from-port="5" to-layer="2113" to-port="0" />
|
|
<edge from-layer="2092" from-port="5" to-layer="2129" to-port="0" />
|
|
<edge from-layer="2092" from-port="5" to-layer="2097" to-port="0" />
|
|
<edge from-layer="2093" from-port="0" to-layer="2094" to-port="0" />
|
|
<edge from-layer="2094" from-port="1" to-layer="2096" to-port="0" />
|
|
<edge from-layer="2095" from-port="0" to-layer="2096" to-port="1" />
|
|
<edge from-layer="2096" from-port="2" to-layer="2097" to-port="1" />
|
|
<edge from-layer="2097" from-port="2" to-layer="2099" to-port="0" />
|
|
<edge from-layer="2098" from-port="0" to-layer="2099" to-port="1" />
|
|
<edge from-layer="2099" from-port="2" to-layer="2104" to-port="0" />
|
|
<edge from-layer="2100" from-port="0" to-layer="2104" to-port="1" />
|
|
<edge from-layer="2101" from-port="0" to-layer="2104" to-port="2" />
|
|
<edge from-layer="2102" from-port="0" to-layer="2104" to-port="3" />
|
|
<edge from-layer="2103" from-port="0" to-layer="2104" to-port="4" />
|
|
<edge from-layer="2104" from-port="5" to-layer="2106" to-port="0" />
|
|
<edge from-layer="2105" from-port="0" to-layer="2106" to-port="1" />
|
|
<edge from-layer="2106" from-port="2" to-layer="2108" to-port="0" />
|
|
<edge from-layer="2107" from-port="0" to-layer="2108" to-port="1" />
|
|
<edge from-layer="2108" from-port="2" to-layer="2136" to-port="0" />
|
|
<edge from-layer="2109" from-port="0" to-layer="2110" to-port="0" />
|
|
<edge from-layer="2110" from-port="1" to-layer="2112" to-port="0" />
|
|
<edge from-layer="2111" from-port="0" to-layer="2112" to-port="1" />
|
|
<edge from-layer="2112" from-port="2" to-layer="2113" to-port="1" />
|
|
<edge from-layer="2113" from-port="2" to-layer="2115" to-port="0" />
|
|
<edge from-layer="2114" from-port="0" to-layer="2115" to-port="1" />
|
|
<edge from-layer="2115" from-port="2" to-layer="2120" to-port="0" />
|
|
<edge from-layer="2116" from-port="0" to-layer="2120" to-port="1" />
|
|
<edge from-layer="2117" from-port="0" to-layer="2120" to-port="2" />
|
|
<edge from-layer="2118" from-port="0" to-layer="2120" to-port="3" />
|
|
<edge from-layer="2119" from-port="0" to-layer="2120" to-port="4" />
|
|
<edge from-layer="2120" from-port="5" to-layer="2122" to-port="0" />
|
|
<edge from-layer="2121" from-port="0" to-layer="2122" to-port="1" />
|
|
<edge from-layer="2122" from-port="2" to-layer="2124" to-port="0" />
|
|
<edge from-layer="2123" from-port="0" to-layer="2124" to-port="1" />
|
|
<edge from-layer="2124" from-port="2" to-layer="2136" to-port="1" />
|
|
<edge from-layer="2125" from-port="0" to-layer="2126" to-port="0" />
|
|
<edge from-layer="2126" from-port="1" to-layer="2128" to-port="0" />
|
|
<edge from-layer="2127" from-port="0" to-layer="2128" to-port="1" />
|
|
<edge from-layer="2128" from-port="2" to-layer="2129" to-port="1" />
|
|
<edge from-layer="2129" from-port="2" to-layer="2131" to-port="0" />
|
|
<edge from-layer="2130" from-port="0" to-layer="2131" to-port="1" />
|
|
<edge from-layer="2131" from-port="2" to-layer="2133" to-port="0" />
|
|
<edge from-layer="2132" from-port="0" to-layer="2133" to-port="1" />
|
|
<edge from-layer="2133" from-port="2" to-layer="2135" to-port="0" />
|
|
<edge from-layer="2134" from-port="0" to-layer="2135" to-port="1" />
|
|
<edge from-layer="2135" from-port="2" to-layer="2136" to-port="2" />
|
|
<edge from-layer="2136" from-port="4" to-layer="2138" to-port="0" />
|
|
<edge from-layer="2137" from-port="0" to-layer="2138" to-port="1" />
|
|
<edge from-layer="2138" from-port="2" to-layer="2140" to-port="0" />
|
|
<edge from-layer="2139" from-port="0" to-layer="2140" to-port="1" />
|
|
<edge from-layer="2140" from-port="2" to-layer="2142" to-port="0" />
|
|
<edge from-layer="2141" from-port="0" to-layer="2142" to-port="1" />
|
|
<edge from-layer="2142" from-port="2" to-layer="2147" to-port="0" />
|
|
<edge from-layer="2143" from-port="0" to-layer="2147" to-port="1" />
|
|
<edge from-layer="2144" from-port="0" to-layer="2147" to-port="2" />
|
|
<edge from-layer="2145" from-port="0" to-layer="2147" to-port="3" />
|
|
<edge from-layer="2146" from-port="0" to-layer="2147" to-port="4" />
|
|
<edge from-layer="2147" from-port="5" to-layer="2152" to-port="0" />
|
|
<edge from-layer="2148" from-port="0" to-layer="2149" to-port="0" />
|
|
<edge from-layer="2149" from-port="1" to-layer="2151" to-port="0" />
|
|
<edge from-layer="2150" from-port="0" to-layer="2151" to-port="1" />
|
|
<edge from-layer="2151" from-port="2" to-layer="2152" to-port="1" />
|
|
<edge from-layer="2152" from-port="2" to-layer="2154" to-port="0" />
|
|
<edge from-layer="2153" from-port="0" to-layer="2154" to-port="1" />
|
|
<edge from-layer="2154" from-port="2" to-layer="2155" to-port="0" />
|
|
<edge from-layer="2155" from-port="2" to-layer="2157" to-port="0" />
|
|
<edge from-layer="2156" from-port="0" to-layer="2157" to-port="1" />
|
|
<edge from-layer="2157" from-port="2" to-layer="2159" to-port="0" />
|
|
<edge from-layer="2158" from-port="0" to-layer="2159" to-port="1" />
|
|
<edge from-layer="2159" from-port="2" to-layer="2161" to-port="0" />
|
|
<edge from-layer="2160" from-port="0" to-layer="2161" to-port="1" />
|
|
<edge from-layer="2161" from-port="2" to-layer="2163" to-port="0" />
|
|
<edge from-layer="2161" from-port="2" to-layer="2191" to-port="1" />
|
|
<edge from-layer="2162" from-port="0" to-layer="2163" to-port="1" />
|
|
<edge from-layer="2163" from-port="2" to-layer="2168" to-port="0" />
|
|
<edge from-layer="2164" from-port="0" to-layer="2168" to-port="1" />
|
|
<edge from-layer="2165" from-port="0" to-layer="2168" to-port="2" />
|
|
<edge from-layer="2166" from-port="0" to-layer="2168" to-port="3" />
|
|
<edge from-layer="2167" from-port="0" to-layer="2168" to-port="4" />
|
|
<edge from-layer="2168" from-port="5" to-layer="2173" to-port="0" />
|
|
<edge from-layer="2169" from-port="0" to-layer="2170" to-port="0" />
|
|
<edge from-layer="2170" from-port="1" to-layer="2172" to-port="0" />
|
|
<edge from-layer="2171" from-port="0" to-layer="2172" to-port="1" />
|
|
<edge from-layer="2172" from-port="2" to-layer="2173" to-port="1" />
|
|
<edge from-layer="2173" from-port="2" to-layer="2175" to-port="0" />
|
|
<edge from-layer="2174" from-port="0" to-layer="2175" to-port="1" />
|
|
<edge from-layer="2175" from-port="2" to-layer="2176" to-port="0" />
|
|
<edge from-layer="2176" from-port="1" to-layer="2178" to-port="0" />
|
|
<edge from-layer="2177" from-port="0" to-layer="2178" to-port="1" />
|
|
<edge from-layer="2178" from-port="2" to-layer="2183" to-port="0" />
|
|
<edge from-layer="2179" from-port="0" to-layer="2183" to-port="1" />
|
|
<edge from-layer="2180" from-port="0" to-layer="2183" to-port="2" />
|
|
<edge from-layer="2181" from-port="0" to-layer="2183" to-port="3" />
|
|
<edge from-layer="2182" from-port="0" to-layer="2183" to-port="4" />
|
|
<edge from-layer="2183" from-port="5" to-layer="2188" to-port="0" />
|
|
<edge from-layer="2184" from-port="0" to-layer="2185" to-port="0" />
|
|
<edge from-layer="2185" from-port="1" to-layer="2187" to-port="0" />
|
|
<edge from-layer="2186" from-port="0" to-layer="2187" to-port="1" />
|
|
<edge from-layer="2187" from-port="2" to-layer="2188" to-port="1" />
|
|
<edge from-layer="2188" from-port="2" to-layer="2190" to-port="0" />
|
|
<edge from-layer="2189" from-port="0" to-layer="2190" to-port="1" />
|
|
<edge from-layer="2190" from-port="2" to-layer="2191" to-port="0" />
|
|
<edge from-layer="2191" from-port="2" to-layer="2193" to-port="0" />
|
|
<edge from-layer="2192" from-port="0" to-layer="2193" to-port="1" />
|
|
<edge from-layer="2193" from-port="2" to-layer="2195" to-port="0" />
|
|
<edge from-layer="2194" from-port="0" to-layer="2195" to-port="1" />
|
|
<edge from-layer="2195" from-port="2" to-layer="2197" to-port="0" />
|
|
<edge from-layer="2196" from-port="0" to-layer="2197" to-port="1" />
|
|
<edge from-layer="2197" from-port="2" to-layer="2199" to-port="0" />
|
|
<edge from-layer="2197" from-port="2" to-layer="2267" to-port="1" />
|
|
<edge from-layer="2198" from-port="0" to-layer="2199" to-port="1" />
|
|
<edge from-layer="2199" from-port="2" to-layer="2204" to-port="0" />
|
|
<edge from-layer="2200" from-port="0" to-layer="2204" to-port="1" />
|
|
<edge from-layer="2201" from-port="0" to-layer="2204" to-port="2" />
|
|
<edge from-layer="2202" from-port="0" to-layer="2204" to-port="3" />
|
|
<edge from-layer="2203" from-port="0" to-layer="2204" to-port="4" />
|
|
<edge from-layer="2204" from-port="5" to-layer="2209" to-port="0" />
|
|
<edge from-layer="2204" from-port="5" to-layer="2241" to-port="0" />
|
|
<edge from-layer="2204" from-port="5" to-layer="2225" to-port="0" />
|
|
<edge from-layer="2205" from-port="0" to-layer="2206" to-port="0" />
|
|
<edge from-layer="2206" from-port="1" to-layer="2208" to-port="0" />
|
|
<edge from-layer="2207" from-port="0" to-layer="2208" to-port="1" />
|
|
<edge from-layer="2208" from-port="2" to-layer="2209" to-port="1" />
|
|
<edge from-layer="2209" from-port="2" to-layer="2211" to-port="0" />
|
|
<edge from-layer="2210" from-port="0" to-layer="2211" to-port="1" />
|
|
<edge from-layer="2211" from-port="2" to-layer="2216" to-port="0" />
|
|
<edge from-layer="2212" from-port="0" to-layer="2216" to-port="1" />
|
|
<edge from-layer="2213" from-port="0" to-layer="2216" to-port="2" />
|
|
<edge from-layer="2214" from-port="0" to-layer="2216" to-port="3" />
|
|
<edge from-layer="2215" from-port="0" to-layer="2216" to-port="4" />
|
|
<edge from-layer="2216" from-port="5" to-layer="2218" to-port="0" />
|
|
<edge from-layer="2217" from-port="0" to-layer="2218" to-port="1" />
|
|
<edge from-layer="2218" from-port="2" to-layer="2220" to-port="0" />
|
|
<edge from-layer="2219" from-port="0" to-layer="2220" to-port="1" />
|
|
<edge from-layer="2220" from-port="2" to-layer="2248" to-port="0" />
|
|
<edge from-layer="2221" from-port="0" to-layer="2222" to-port="0" />
|
|
<edge from-layer="2222" from-port="1" to-layer="2224" to-port="0" />
|
|
<edge from-layer="2223" from-port="0" to-layer="2224" to-port="1" />
|
|
<edge from-layer="2224" from-port="2" to-layer="2225" to-port="1" />
|
|
<edge from-layer="2225" from-port="2" to-layer="2227" to-port="0" />
|
|
<edge from-layer="2226" from-port="0" to-layer="2227" to-port="1" />
|
|
<edge from-layer="2227" from-port="2" to-layer="2232" to-port="0" />
|
|
<edge from-layer="2228" from-port="0" to-layer="2232" to-port="1" />
|
|
<edge from-layer="2229" from-port="0" to-layer="2232" to-port="2" />
|
|
<edge from-layer="2230" from-port="0" to-layer="2232" to-port="3" />
|
|
<edge from-layer="2231" from-port="0" to-layer="2232" to-port="4" />
|
|
<edge from-layer="2232" from-port="5" to-layer="2234" to-port="0" />
|
|
<edge from-layer="2233" from-port="0" to-layer="2234" to-port="1" />
|
|
<edge from-layer="2234" from-port="2" to-layer="2236" to-port="0" />
|
|
<edge from-layer="2235" from-port="0" to-layer="2236" to-port="1" />
|
|
<edge from-layer="2236" from-port="2" to-layer="2248" to-port="1" />
|
|
<edge from-layer="2237" from-port="0" to-layer="2238" to-port="0" />
|
|
<edge from-layer="2238" from-port="1" to-layer="2240" to-port="0" />
|
|
<edge from-layer="2239" from-port="0" to-layer="2240" to-port="1" />
|
|
<edge from-layer="2240" from-port="2" to-layer="2241" to-port="1" />
|
|
<edge from-layer="2241" from-port="2" to-layer="2243" to-port="0" />
|
|
<edge from-layer="2242" from-port="0" to-layer="2243" to-port="1" />
|
|
<edge from-layer="2243" from-port="2" to-layer="2245" to-port="0" />
|
|
<edge from-layer="2244" from-port="0" to-layer="2245" to-port="1" />
|
|
<edge from-layer="2245" from-port="2" to-layer="2247" to-port="0" />
|
|
<edge from-layer="2246" from-port="0" to-layer="2247" to-port="1" />
|
|
<edge from-layer="2247" from-port="2" to-layer="2248" to-port="2" />
|
|
<edge from-layer="2248" from-port="4" to-layer="2250" to-port="0" />
|
|
<edge from-layer="2249" from-port="0" to-layer="2250" to-port="1" />
|
|
<edge from-layer="2250" from-port="2" to-layer="2252" to-port="0" />
|
|
<edge from-layer="2251" from-port="0" to-layer="2252" to-port="1" />
|
|
<edge from-layer="2252" from-port="2" to-layer="2254" to-port="0" />
|
|
<edge from-layer="2253" from-port="0" to-layer="2254" to-port="1" />
|
|
<edge from-layer="2254" from-port="2" to-layer="2259" to-port="0" />
|
|
<edge from-layer="2255" from-port="0" to-layer="2259" to-port="1" />
|
|
<edge from-layer="2256" from-port="0" to-layer="2259" to-port="2" />
|
|
<edge from-layer="2257" from-port="0" to-layer="2259" to-port="3" />
|
|
<edge from-layer="2258" from-port="0" to-layer="2259" to-port="4" />
|
|
<edge from-layer="2259" from-port="5" to-layer="2264" to-port="0" />
|
|
<edge from-layer="2260" from-port="0" to-layer="2261" to-port="0" />
|
|
<edge from-layer="2261" from-port="1" to-layer="2263" to-port="0" />
|
|
<edge from-layer="2262" from-port="0" to-layer="2263" to-port="1" />
|
|
<edge from-layer="2263" from-port="2" to-layer="2264" to-port="1" />
|
|
<edge from-layer="2264" from-port="2" to-layer="2266" to-port="0" />
|
|
<edge from-layer="2265" from-port="0" to-layer="2266" to-port="1" />
|
|
<edge from-layer="2266" from-port="2" to-layer="2267" to-port="0" />
|
|
<edge from-layer="2267" from-port="2" to-layer="2269" to-port="0" />
|
|
<edge from-layer="2268" from-port="0" to-layer="2269" to-port="1" />
|
|
<edge from-layer="2269" from-port="2" to-layer="2271" to-port="0" />
|
|
<edge from-layer="2270" from-port="0" to-layer="2271" to-port="1" />
|
|
<edge from-layer="2271" from-port="2" to-layer="2273" to-port="0" />
|
|
<edge from-layer="2272" from-port="0" to-layer="2273" to-port="1" />
|
|
<edge from-layer="2273" from-port="2" to-layer="2303" to-port="1" />
|
|
<edge from-layer="2273" from-port="2" to-layer="2275" to-port="0" />
|
|
<edge from-layer="2274" from-port="0" to-layer="2275" to-port="1" />
|
|
<edge from-layer="2275" from-port="2" to-layer="2280" to-port="0" />
|
|
<edge from-layer="2276" from-port="0" to-layer="2280" to-port="1" />
|
|
<edge from-layer="2277" from-port="0" to-layer="2280" to-port="2" />
|
|
<edge from-layer="2278" from-port="0" to-layer="2280" to-port="3" />
|
|
<edge from-layer="2279" from-port="0" to-layer="2280" to-port="4" />
|
|
<edge from-layer="2280" from-port="5" to-layer="2285" to-port="0" />
|
|
<edge from-layer="2281" from-port="0" to-layer="2282" to-port="0" />
|
|
<edge from-layer="2282" from-port="1" to-layer="2284" to-port="0" />
|
|
<edge from-layer="2283" from-port="0" to-layer="2284" to-port="1" />
|
|
<edge from-layer="2284" from-port="2" to-layer="2285" to-port="1" />
|
|
<edge from-layer="2285" from-port="2" to-layer="2287" to-port="0" />
|
|
<edge from-layer="2286" from-port="0" to-layer="2287" to-port="1" />
|
|
<edge from-layer="2287" from-port="2" to-layer="2288" to-port="0" />
|
|
<edge from-layer="2288" from-port="1" to-layer="2290" to-port="0" />
|
|
<edge from-layer="2289" from-port="0" to-layer="2290" to-port="1" />
|
|
<edge from-layer="2290" from-port="2" to-layer="2295" to-port="0" />
|
|
<edge from-layer="2291" from-port="0" to-layer="2295" to-port="1" />
|
|
<edge from-layer="2292" from-port="0" to-layer="2295" to-port="2" />
|
|
<edge from-layer="2293" from-port="0" to-layer="2295" to-port="3" />
|
|
<edge from-layer="2294" from-port="0" to-layer="2295" to-port="4" />
|
|
<edge from-layer="2295" from-port="5" to-layer="2300" to-port="0" />
|
|
<edge from-layer="2296" from-port="0" to-layer="2297" to-port="0" />
|
|
<edge from-layer="2297" from-port="1" to-layer="2299" to-port="0" />
|
|
<edge from-layer="2298" from-port="0" to-layer="2299" to-port="1" />
|
|
<edge from-layer="2299" from-port="2" to-layer="2300" to-port="1" />
|
|
<edge from-layer="2300" from-port="2" to-layer="2302" to-port="0" />
|
|
<edge from-layer="2301" from-port="0" to-layer="2302" to-port="1" />
|
|
<edge from-layer="2302" from-port="2" to-layer="2303" to-port="0" />
|
|
<edge from-layer="2303" from-port="2" to-layer="2305" to-port="0" />
|
|
<edge from-layer="2304" from-port="0" to-layer="2305" to-port="1" />
|
|
<edge from-layer="2305" from-port="2" to-layer="2307" to-port="0" />
|
|
<edge from-layer="2306" from-port="0" to-layer="2307" to-port="1" />
|
|
<edge from-layer="2307" from-port="2" to-layer="2309" to-port="0" />
|
|
<edge from-layer="2308" from-port="0" to-layer="2309" to-port="1" />
|
|
<edge from-layer="2309" from-port="2" to-layer="2311" to-port="0" />
|
|
<edge from-layer="2309" from-port="2" to-layer="2379" to-port="1" />
|
|
<edge from-layer="2310" from-port="0" to-layer="2311" to-port="1" />
|
|
<edge from-layer="2311" from-port="2" to-layer="2316" to-port="0" />
|
|
<edge from-layer="2312" from-port="0" to-layer="2316" to-port="1" />
|
|
<edge from-layer="2313" from-port="0" to-layer="2316" to-port="2" />
|
|
<edge from-layer="2314" from-port="0" to-layer="2316" to-port="3" />
|
|
<edge from-layer="2315" from-port="0" to-layer="2316" to-port="4" />
|
|
<edge from-layer="2316" from-port="5" to-layer="2321" to-port="0" />
|
|
<edge from-layer="2316" from-port="5" to-layer="2337" to-port="0" />
|
|
<edge from-layer="2316" from-port="5" to-layer="2353" to-port="0" />
|
|
<edge from-layer="2317" from-port="0" to-layer="2318" to-port="0" />
|
|
<edge from-layer="2318" from-port="1" to-layer="2320" to-port="0" />
|
|
<edge from-layer="2319" from-port="0" to-layer="2320" to-port="1" />
|
|
<edge from-layer="2320" from-port="2" to-layer="2321" to-port="1" />
|
|
<edge from-layer="2321" from-port="2" to-layer="2323" to-port="0" />
|
|
<edge from-layer="2322" from-port="0" to-layer="2323" to-port="1" />
|
|
<edge from-layer="2323" from-port="2" to-layer="2328" to-port="0" />
|
|
<edge from-layer="2324" from-port="0" to-layer="2328" to-port="1" />
|
|
<edge from-layer="2325" from-port="0" to-layer="2328" to-port="2" />
|
|
<edge from-layer="2326" from-port="0" to-layer="2328" to-port="3" />
|
|
<edge from-layer="2327" from-port="0" to-layer="2328" to-port="4" />
|
|
<edge from-layer="2328" from-port="5" to-layer="2330" to-port="0" />
|
|
<edge from-layer="2329" from-port="0" to-layer="2330" to-port="1" />
|
|
<edge from-layer="2330" from-port="2" to-layer="2332" to-port="0" />
|
|
<edge from-layer="2331" from-port="0" to-layer="2332" to-port="1" />
|
|
<edge from-layer="2332" from-port="2" to-layer="2360" to-port="0" />
|
|
<edge from-layer="2333" from-port="0" to-layer="2334" to-port="0" />
|
|
<edge from-layer="2334" from-port="1" to-layer="2336" to-port="0" />
|
|
<edge from-layer="2335" from-port="0" to-layer="2336" to-port="1" />
|
|
<edge from-layer="2336" from-port="2" to-layer="2337" to-port="1" />
|
|
<edge from-layer="2337" from-port="2" to-layer="2339" to-port="0" />
|
|
<edge from-layer="2338" from-port="0" to-layer="2339" to-port="1" />
|
|
<edge from-layer="2339" from-port="2" to-layer="2344" to-port="0" />
|
|
<edge from-layer="2340" from-port="0" to-layer="2344" to-port="1" />
|
|
<edge from-layer="2341" from-port="0" to-layer="2344" to-port="2" />
|
|
<edge from-layer="2342" from-port="0" to-layer="2344" to-port="3" />
|
|
<edge from-layer="2343" from-port="0" to-layer="2344" to-port="4" />
|
|
<edge from-layer="2344" from-port="5" to-layer="2346" to-port="0" />
|
|
<edge from-layer="2345" from-port="0" to-layer="2346" to-port="1" />
|
|
<edge from-layer="2346" from-port="2" to-layer="2348" to-port="0" />
|
|
<edge from-layer="2347" from-port="0" to-layer="2348" to-port="1" />
|
|
<edge from-layer="2348" from-port="2" to-layer="2360" to-port="1" />
|
|
<edge from-layer="2349" from-port="0" to-layer="2350" to-port="0" />
|
|
<edge from-layer="2350" from-port="1" to-layer="2352" to-port="0" />
|
|
<edge from-layer="2351" from-port="0" to-layer="2352" to-port="1" />
|
|
<edge from-layer="2352" from-port="2" to-layer="2353" to-port="1" />
|
|
<edge from-layer="2353" from-port="2" to-layer="2355" to-port="0" />
|
|
<edge from-layer="2354" from-port="0" to-layer="2355" to-port="1" />
|
|
<edge from-layer="2355" from-port="2" to-layer="2357" to-port="0" />
|
|
<edge from-layer="2356" from-port="0" to-layer="2357" to-port="1" />
|
|
<edge from-layer="2357" from-port="2" to-layer="2359" to-port="0" />
|
|
<edge from-layer="2358" from-port="0" to-layer="2359" to-port="1" />
|
|
<edge from-layer="2359" from-port="2" to-layer="2360" to-port="2" />
|
|
<edge from-layer="2360" from-port="4" to-layer="2362" to-port="0" />
|
|
<edge from-layer="2361" from-port="0" to-layer="2362" to-port="1" />
|
|
<edge from-layer="2362" from-port="2" to-layer="2364" to-port="0" />
|
|
<edge from-layer="2363" from-port="0" to-layer="2364" to-port="1" />
|
|
<edge from-layer="2364" from-port="2" to-layer="2366" to-port="0" />
|
|
<edge from-layer="2365" from-port="0" to-layer="2366" to-port="1" />
|
|
<edge from-layer="2366" from-port="2" to-layer="2371" to-port="0" />
|
|
<edge from-layer="2367" from-port="0" to-layer="2371" to-port="1" />
|
|
<edge from-layer="2368" from-port="0" to-layer="2371" to-port="2" />
|
|
<edge from-layer="2369" from-port="0" to-layer="2371" to-port="3" />
|
|
<edge from-layer="2370" from-port="0" to-layer="2371" to-port="4" />
|
|
<edge from-layer="2371" from-port="5" to-layer="2376" to-port="0" />
|
|
<edge from-layer="2372" from-port="0" to-layer="2373" to-port="0" />
|
|
<edge from-layer="2373" from-port="1" to-layer="2375" to-port="0" />
|
|
<edge from-layer="2374" from-port="0" to-layer="2375" to-port="1" />
|
|
<edge from-layer="2375" from-port="2" to-layer="2376" to-port="1" />
|
|
<edge from-layer="2376" from-port="2" to-layer="2378" to-port="0" />
|
|
<edge from-layer="2377" from-port="0" to-layer="2378" to-port="1" />
|
|
<edge from-layer="2378" from-port="2" to-layer="2379" to-port="0" />
|
|
<edge from-layer="2379" from-port="2" to-layer="2381" to-port="0" />
|
|
<edge from-layer="2380" from-port="0" to-layer="2381" to-port="1" />
|
|
<edge from-layer="2381" from-port="2" to-layer="2383" to-port="0" />
|
|
<edge from-layer="2382" from-port="0" to-layer="2383" to-port="1" />
|
|
<edge from-layer="2383" from-port="2" to-layer="2385" to-port="0" />
|
|
<edge from-layer="2384" from-port="0" to-layer="2385" to-port="1" />
|
|
<edge from-layer="2385" from-port="2" to-layer="2387" to-port="0" />
|
|
<edge from-layer="2385" from-port="2" to-layer="2415" to-port="1" />
|
|
<edge from-layer="2386" from-port="0" to-layer="2387" to-port="1" />
|
|
<edge from-layer="2387" from-port="2" to-layer="2392" to-port="0" />
|
|
<edge from-layer="2388" from-port="0" to-layer="2392" to-port="1" />
|
|
<edge from-layer="2389" from-port="0" to-layer="2392" to-port="2" />
|
|
<edge from-layer="2390" from-port="0" to-layer="2392" to-port="3" />
|
|
<edge from-layer="2391" from-port="0" to-layer="2392" to-port="4" />
|
|
<edge from-layer="2392" from-port="5" to-layer="2397" to-port="0" />
|
|
<edge from-layer="2393" from-port="0" to-layer="2394" to-port="0" />
|
|
<edge from-layer="2394" from-port="1" to-layer="2396" to-port="0" />
|
|
<edge from-layer="2395" from-port="0" to-layer="2396" to-port="1" />
|
|
<edge from-layer="2396" from-port="2" to-layer="2397" to-port="1" />
|
|
<edge from-layer="2397" from-port="2" to-layer="2399" to-port="0" />
|
|
<edge from-layer="2398" from-port="0" to-layer="2399" to-port="1" />
|
|
<edge from-layer="2399" from-port="2" to-layer="2400" to-port="0" />
|
|
<edge from-layer="2400" from-port="1" to-layer="2402" to-port="0" />
|
|
<edge from-layer="2401" from-port="0" to-layer="2402" to-port="1" />
|
|
<edge from-layer="2402" from-port="2" to-layer="2407" to-port="0" />
|
|
<edge from-layer="2403" from-port="0" to-layer="2407" to-port="1" />
|
|
<edge from-layer="2404" from-port="0" to-layer="2407" to-port="2" />
|
|
<edge from-layer="2405" from-port="0" to-layer="2407" to-port="3" />
|
|
<edge from-layer="2406" from-port="0" to-layer="2407" to-port="4" />
|
|
<edge from-layer="2407" from-port="5" to-layer="2412" to-port="0" />
|
|
<edge from-layer="2408" from-port="0" to-layer="2409" to-port="0" />
|
|
<edge from-layer="2409" from-port="1" to-layer="2411" to-port="0" />
|
|
<edge from-layer="2410" from-port="0" to-layer="2411" to-port="1" />
|
|
<edge from-layer="2411" from-port="2" to-layer="2412" to-port="1" />
|
|
<edge from-layer="2412" from-port="2" to-layer="2414" to-port="0" />
|
|
<edge from-layer="2413" from-port="0" to-layer="2414" to-port="1" />
|
|
<edge from-layer="2414" from-port="2" to-layer="2415" to-port="0" />
|
|
<edge from-layer="2415" from-port="2" to-layer="2417" to-port="0" />
|
|
<edge from-layer="2416" from-port="0" to-layer="2417" to-port="1" />
|
|
<edge from-layer="2417" from-port="2" to-layer="2419" to-port="0" />
|
|
<edge from-layer="2418" from-port="0" to-layer="2419" to-port="1" />
|
|
<edge from-layer="2419" from-port="2" to-layer="2421" to-port="0" />
|
|
<edge from-layer="2420" from-port="0" to-layer="2421" to-port="1" />
|
|
<edge from-layer="2421" from-port="2" to-layer="2423" to-port="0" />
|
|
<edge from-layer="2421" from-port="2" to-layer="2491" to-port="1" />
|
|
<edge from-layer="2422" from-port="0" to-layer="2423" to-port="1" />
|
|
<edge from-layer="2423" from-port="2" to-layer="2428" to-port="0" />
|
|
<edge from-layer="2424" from-port="0" to-layer="2428" to-port="1" />
|
|
<edge from-layer="2425" from-port="0" to-layer="2428" to-port="2" />
|
|
<edge from-layer="2426" from-port="0" to-layer="2428" to-port="3" />
|
|
<edge from-layer="2427" from-port="0" to-layer="2428" to-port="4" />
|
|
<edge from-layer="2428" from-port="5" to-layer="2433" to-port="0" />
|
|
<edge from-layer="2428" from-port="5" to-layer="2449" to-port="0" />
|
|
<edge from-layer="2428" from-port="5" to-layer="2465" to-port="0" />
|
|
<edge from-layer="2429" from-port="0" to-layer="2430" to-port="0" />
|
|
<edge from-layer="2430" from-port="1" to-layer="2432" to-port="0" />
|
|
<edge from-layer="2431" from-port="0" to-layer="2432" to-port="1" />
|
|
<edge from-layer="2432" from-port="2" to-layer="2433" to-port="1" />
|
|
<edge from-layer="2433" from-port="2" to-layer="2435" to-port="0" />
|
|
<edge from-layer="2434" from-port="0" to-layer="2435" to-port="1" />
|
|
<edge from-layer="2435" from-port="2" to-layer="2440" to-port="0" />
|
|
<edge from-layer="2436" from-port="0" to-layer="2440" to-port="1" />
|
|
<edge from-layer="2437" from-port="0" to-layer="2440" to-port="2" />
|
|
<edge from-layer="2438" from-port="0" to-layer="2440" to-port="3" />
|
|
<edge from-layer="2439" from-port="0" to-layer="2440" to-port="4" />
|
|
<edge from-layer="2440" from-port="5" to-layer="2442" to-port="0" />
|
|
<edge from-layer="2441" from-port="0" to-layer="2442" to-port="1" />
|
|
<edge from-layer="2442" from-port="2" to-layer="2444" to-port="0" />
|
|
<edge from-layer="2443" from-port="0" to-layer="2444" to-port="1" />
|
|
<edge from-layer="2444" from-port="2" to-layer="2472" to-port="0" />
|
|
<edge from-layer="2445" from-port="0" to-layer="2446" to-port="0" />
|
|
<edge from-layer="2446" from-port="1" to-layer="2448" to-port="0" />
|
|
<edge from-layer="2447" from-port="0" to-layer="2448" to-port="1" />
|
|
<edge from-layer="2448" from-port="2" to-layer="2449" to-port="1" />
|
|
<edge from-layer="2449" from-port="2" to-layer="2451" to-port="0" />
|
|
<edge from-layer="2450" from-port="0" to-layer="2451" to-port="1" />
|
|
<edge from-layer="2451" from-port="2" to-layer="2456" to-port="0" />
|
|
<edge from-layer="2452" from-port="0" to-layer="2456" to-port="1" />
|
|
<edge from-layer="2453" from-port="0" to-layer="2456" to-port="2" />
|
|
<edge from-layer="2454" from-port="0" to-layer="2456" to-port="3" />
|
|
<edge from-layer="2455" from-port="0" to-layer="2456" to-port="4" />
|
|
<edge from-layer="2456" from-port="5" to-layer="2458" to-port="0" />
|
|
<edge from-layer="2457" from-port="0" to-layer="2458" to-port="1" />
|
|
<edge from-layer="2458" from-port="2" to-layer="2460" to-port="0" />
|
|
<edge from-layer="2459" from-port="0" to-layer="2460" to-port="1" />
|
|
<edge from-layer="2460" from-port="2" to-layer="2472" to-port="1" />
|
|
<edge from-layer="2461" from-port="0" to-layer="2462" to-port="0" />
|
|
<edge from-layer="2462" from-port="1" to-layer="2464" to-port="0" />
|
|
<edge from-layer="2463" from-port="0" to-layer="2464" to-port="1" />
|
|
<edge from-layer="2464" from-port="2" to-layer="2465" to-port="1" />
|
|
<edge from-layer="2465" from-port="2" to-layer="2467" to-port="0" />
|
|
<edge from-layer="2466" from-port="0" to-layer="2467" to-port="1" />
|
|
<edge from-layer="2467" from-port="2" to-layer="2469" to-port="0" />
|
|
<edge from-layer="2468" from-port="0" to-layer="2469" to-port="1" />
|
|
<edge from-layer="2469" from-port="2" to-layer="2471" to-port="0" />
|
|
<edge from-layer="2470" from-port="0" to-layer="2471" to-port="1" />
|
|
<edge from-layer="2471" from-port="2" to-layer="2472" to-port="2" />
|
|
<edge from-layer="2472" from-port="4" to-layer="2474" to-port="0" />
|
|
<edge from-layer="2473" from-port="0" to-layer="2474" to-port="1" />
|
|
<edge from-layer="2474" from-port="2" to-layer="2476" to-port="0" />
|
|
<edge from-layer="2475" from-port="0" to-layer="2476" to-port="1" />
|
|
<edge from-layer="2476" from-port="2" to-layer="2478" to-port="0" />
|
|
<edge from-layer="2477" from-port="0" to-layer="2478" to-port="1" />
|
|
<edge from-layer="2478" from-port="2" to-layer="2483" to-port="0" />
|
|
<edge from-layer="2479" from-port="0" to-layer="2483" to-port="1" />
|
|
<edge from-layer="2480" from-port="0" to-layer="2483" to-port="2" />
|
|
<edge from-layer="2481" from-port="0" to-layer="2483" to-port="3" />
|
|
<edge from-layer="2482" from-port="0" to-layer="2483" to-port="4" />
|
|
<edge from-layer="2483" from-port="5" to-layer="2488" to-port="0" />
|
|
<edge from-layer="2484" from-port="0" to-layer="2485" to-port="0" />
|
|
<edge from-layer="2485" from-port="1" to-layer="2487" to-port="0" />
|
|
<edge from-layer="2486" from-port="0" to-layer="2487" to-port="1" />
|
|
<edge from-layer="2487" from-port="2" to-layer="2488" to-port="1" />
|
|
<edge from-layer="2488" from-port="2" to-layer="2490" to-port="0" />
|
|
<edge from-layer="2489" from-port="0" to-layer="2490" to-port="1" />
|
|
<edge from-layer="2490" from-port="2" to-layer="2491" to-port="0" />
|
|
<edge from-layer="2491" from-port="2" to-layer="2493" to-port="0" />
|
|
<edge from-layer="2492" from-port="0" to-layer="2493" to-port="1" />
|
|
<edge from-layer="2493" from-port="2" to-layer="2495" to-port="0" />
|
|
<edge from-layer="2494" from-port="0" to-layer="2495" to-port="1" />
|
|
<edge from-layer="2495" from-port="2" to-layer="2497" to-port="0" />
|
|
<edge from-layer="2496" from-port="0" to-layer="2497" to-port="1" />
|
|
<edge from-layer="2497" from-port="2" to-layer="2527" to-port="1" />
|
|
<edge from-layer="2497" from-port="2" to-layer="2499" to-port="0" />
|
|
<edge from-layer="2498" from-port="0" to-layer="2499" to-port="1" />
|
|
<edge from-layer="2499" from-port="2" to-layer="2504" to-port="0" />
|
|
<edge from-layer="2500" from-port="0" to-layer="2504" to-port="1" />
|
|
<edge from-layer="2501" from-port="0" to-layer="2504" to-port="2" />
|
|
<edge from-layer="2502" from-port="0" to-layer="2504" to-port="3" />
|
|
<edge from-layer="2503" from-port="0" to-layer="2504" to-port="4" />
|
|
<edge from-layer="2504" from-port="5" to-layer="2509" to-port="0" />
|
|
<edge from-layer="2505" from-port="0" to-layer="2506" to-port="0" />
|
|
<edge from-layer="2506" from-port="1" to-layer="2508" to-port="0" />
|
|
<edge from-layer="2507" from-port="0" to-layer="2508" to-port="1" />
|
|
<edge from-layer="2508" from-port="2" to-layer="2509" to-port="1" />
|
|
<edge from-layer="2509" from-port="2" to-layer="2511" to-port="0" />
|
|
<edge from-layer="2510" from-port="0" to-layer="2511" to-port="1" />
|
|
<edge from-layer="2511" from-port="2" to-layer="2512" to-port="0" />
|
|
<edge from-layer="2512" from-port="1" to-layer="2514" to-port="0" />
|
|
<edge from-layer="2513" from-port="0" to-layer="2514" to-port="1" />
|
|
<edge from-layer="2514" from-port="2" to-layer="2519" to-port="0" />
|
|
<edge from-layer="2515" from-port="0" to-layer="2519" to-port="1" />
|
|
<edge from-layer="2516" from-port="0" to-layer="2519" to-port="2" />
|
|
<edge from-layer="2517" from-port="0" to-layer="2519" to-port="3" />
|
|
<edge from-layer="2518" from-port="0" to-layer="2519" to-port="4" />
|
|
<edge from-layer="2519" from-port="5" to-layer="2524" to-port="0" />
|
|
<edge from-layer="2520" from-port="0" to-layer="2521" to-port="0" />
|
|
<edge from-layer="2521" from-port="1" to-layer="2523" to-port="0" />
|
|
<edge from-layer="2522" from-port="0" to-layer="2523" to-port="1" />
|
|
<edge from-layer="2523" from-port="2" to-layer="2524" to-port="1" />
|
|
<edge from-layer="2524" from-port="2" to-layer="2526" to-port="0" />
|
|
<edge from-layer="2525" from-port="0" to-layer="2526" to-port="1" />
|
|
<edge from-layer="2526" from-port="2" to-layer="2527" to-port="0" />
|
|
<edge from-layer="2527" from-port="2" to-layer="2529" to-port="0" />
|
|
<edge from-layer="2528" from-port="0" to-layer="2529" to-port="1" />
|
|
<edge from-layer="2529" from-port="2" to-layer="2531" to-port="0" />
|
|
<edge from-layer="2530" from-port="0" to-layer="2531" to-port="1" />
|
|
<edge from-layer="2531" from-port="2" to-layer="2533" to-port="0" />
|
|
<edge from-layer="2532" from-port="0" to-layer="2533" to-port="1" />
|
|
<edge from-layer="2533" from-port="2" to-layer="2535" to-port="0" />
|
|
<edge from-layer="2533" from-port="2" to-layer="2603" to-port="1" />
|
|
<edge from-layer="2534" from-port="0" to-layer="2535" to-port="1" />
|
|
<edge from-layer="2535" from-port="2" to-layer="2540" to-port="0" />
|
|
<edge from-layer="2536" from-port="0" to-layer="2540" to-port="1" />
|
|
<edge from-layer="2537" from-port="0" to-layer="2540" to-port="2" />
|
|
<edge from-layer="2538" from-port="0" to-layer="2540" to-port="3" />
|
|
<edge from-layer="2539" from-port="0" to-layer="2540" to-port="4" />
|
|
<edge from-layer="2540" from-port="5" to-layer="2545" to-port="0" />
|
|
<edge from-layer="2540" from-port="5" to-layer="2561" to-port="0" />
|
|
<edge from-layer="2540" from-port="5" to-layer="2577" to-port="0" />
|
|
<edge from-layer="2541" from-port="0" to-layer="2542" to-port="0" />
|
|
<edge from-layer="2542" from-port="1" to-layer="2544" to-port="0" />
|
|
<edge from-layer="2543" from-port="0" to-layer="2544" to-port="1" />
|
|
<edge from-layer="2544" from-port="2" to-layer="2545" to-port="1" />
|
|
<edge from-layer="2545" from-port="2" to-layer="2547" to-port="0" />
|
|
<edge from-layer="2546" from-port="0" to-layer="2547" to-port="1" />
|
|
<edge from-layer="2547" from-port="2" to-layer="2552" to-port="0" />
|
|
<edge from-layer="2548" from-port="0" to-layer="2552" to-port="1" />
|
|
<edge from-layer="2549" from-port="0" to-layer="2552" to-port="2" />
|
|
<edge from-layer="2550" from-port="0" to-layer="2552" to-port="3" />
|
|
<edge from-layer="2551" from-port="0" to-layer="2552" to-port="4" />
|
|
<edge from-layer="2552" from-port="5" to-layer="2554" to-port="0" />
|
|
<edge from-layer="2553" from-port="0" to-layer="2554" to-port="1" />
|
|
<edge from-layer="2554" from-port="2" to-layer="2556" to-port="0" />
|
|
<edge from-layer="2555" from-port="0" to-layer="2556" to-port="1" />
|
|
<edge from-layer="2556" from-port="2" to-layer="2584" to-port="0" />
|
|
<edge from-layer="2557" from-port="0" to-layer="2558" to-port="0" />
|
|
<edge from-layer="2558" from-port="1" to-layer="2560" to-port="0" />
|
|
<edge from-layer="2559" from-port="0" to-layer="2560" to-port="1" />
|
|
<edge from-layer="2560" from-port="2" to-layer="2561" to-port="1" />
|
|
<edge from-layer="2561" from-port="2" to-layer="2563" to-port="0" />
|
|
<edge from-layer="2562" from-port="0" to-layer="2563" to-port="1" />
|
|
<edge from-layer="2563" from-port="2" to-layer="2568" to-port="0" />
|
|
<edge from-layer="2564" from-port="0" to-layer="2568" to-port="1" />
|
|
<edge from-layer="2565" from-port="0" to-layer="2568" to-port="2" />
|
|
<edge from-layer="2566" from-port="0" to-layer="2568" to-port="3" />
|
|
<edge from-layer="2567" from-port="0" to-layer="2568" to-port="4" />
|
|
<edge from-layer="2568" from-port="5" to-layer="2570" to-port="0" />
|
|
<edge from-layer="2569" from-port="0" to-layer="2570" to-port="1" />
|
|
<edge from-layer="2570" from-port="2" to-layer="2572" to-port="0" />
|
|
<edge from-layer="2571" from-port="0" to-layer="2572" to-port="1" />
|
|
<edge from-layer="2572" from-port="2" to-layer="2584" to-port="1" />
|
|
<edge from-layer="2573" from-port="0" to-layer="2574" to-port="0" />
|
|
<edge from-layer="2574" from-port="1" to-layer="2576" to-port="0" />
|
|
<edge from-layer="2575" from-port="0" to-layer="2576" to-port="1" />
|
|
<edge from-layer="2576" from-port="2" to-layer="2577" to-port="1" />
|
|
<edge from-layer="2577" from-port="2" to-layer="2579" to-port="0" />
|
|
<edge from-layer="2578" from-port="0" to-layer="2579" to-port="1" />
|
|
<edge from-layer="2579" from-port="2" to-layer="2581" to-port="0" />
|
|
<edge from-layer="2580" from-port="0" to-layer="2581" to-port="1" />
|
|
<edge from-layer="2581" from-port="2" to-layer="2583" to-port="0" />
|
|
<edge from-layer="2582" from-port="0" to-layer="2583" to-port="1" />
|
|
<edge from-layer="2583" from-port="2" to-layer="2584" to-port="2" />
|
|
<edge from-layer="2584" from-port="4" to-layer="2586" to-port="0" />
|
|
<edge from-layer="2585" from-port="0" to-layer="2586" to-port="1" />
|
|
<edge from-layer="2586" from-port="2" to-layer="2588" to-port="0" />
|
|
<edge from-layer="2587" from-port="0" to-layer="2588" to-port="1" />
|
|
<edge from-layer="2588" from-port="2" to-layer="2590" to-port="0" />
|
|
<edge from-layer="2589" from-port="0" to-layer="2590" to-port="1" />
|
|
<edge from-layer="2590" from-port="2" to-layer="2595" to-port="0" />
|
|
<edge from-layer="2591" from-port="0" to-layer="2595" to-port="1" />
|
|
<edge from-layer="2592" from-port="0" to-layer="2595" to-port="2" />
|
|
<edge from-layer="2593" from-port="0" to-layer="2595" to-port="3" />
|
|
<edge from-layer="2594" from-port="0" to-layer="2595" to-port="4" />
|
|
<edge from-layer="2595" from-port="5" to-layer="2600" to-port="0" />
|
|
<edge from-layer="2596" from-port="0" to-layer="2597" to-port="0" />
|
|
<edge from-layer="2597" from-port="1" to-layer="2599" to-port="0" />
|
|
<edge from-layer="2598" from-port="0" to-layer="2599" to-port="1" />
|
|
<edge from-layer="2599" from-port="2" to-layer="2600" to-port="1" />
|
|
<edge from-layer="2600" from-port="2" to-layer="2602" to-port="0" />
|
|
<edge from-layer="2601" from-port="0" to-layer="2602" to-port="1" />
|
|
<edge from-layer="2602" from-port="2" to-layer="2603" to-port="0" />
|
|
<edge from-layer="2603" from-port="2" to-layer="2605" to-port="0" />
|
|
<edge from-layer="2604" from-port="0" to-layer="2605" to-port="1" />
|
|
<edge from-layer="2605" from-port="2" to-layer="2607" to-port="0" />
|
|
<edge from-layer="2606" from-port="0" to-layer="2607" to-port="1" />
|
|
<edge from-layer="2607" from-port="2" to-layer="2609" to-port="0" />
|
|
<edge from-layer="2608" from-port="0" to-layer="2609" to-port="1" />
|
|
<edge from-layer="2609" from-port="2" to-layer="2611" to-port="0" />
|
|
<edge from-layer="2609" from-port="2" to-layer="2639" to-port="1" />
|
|
<edge from-layer="2610" from-port="0" to-layer="2611" to-port="1" />
|
|
<edge from-layer="2611" from-port="2" to-layer="2616" to-port="0" />
|
|
<edge from-layer="2612" from-port="0" to-layer="2616" to-port="1" />
|
|
<edge from-layer="2613" from-port="0" to-layer="2616" to-port="2" />
|
|
<edge from-layer="2614" from-port="0" to-layer="2616" to-port="3" />
|
|
<edge from-layer="2615" from-port="0" to-layer="2616" to-port="4" />
|
|
<edge from-layer="2616" from-port="5" to-layer="2621" to-port="0" />
|
|
<edge from-layer="2617" from-port="0" to-layer="2618" to-port="0" />
|
|
<edge from-layer="2618" from-port="1" to-layer="2620" to-port="0" />
|
|
<edge from-layer="2619" from-port="0" to-layer="2620" to-port="1" />
|
|
<edge from-layer="2620" from-port="2" to-layer="2621" to-port="1" />
|
|
<edge from-layer="2621" from-port="2" to-layer="2623" to-port="0" />
|
|
<edge from-layer="2622" from-port="0" to-layer="2623" to-port="1" />
|
|
<edge from-layer="2623" from-port="2" to-layer="2624" to-port="0" />
|
|
<edge from-layer="2624" from-port="1" to-layer="2626" to-port="0" />
|
|
<edge from-layer="2625" from-port="0" to-layer="2626" to-port="1" />
|
|
<edge from-layer="2626" from-port="2" to-layer="2631" to-port="0" />
|
|
<edge from-layer="2627" from-port="0" to-layer="2631" to-port="1" />
|
|
<edge from-layer="2628" from-port="0" to-layer="2631" to-port="2" />
|
|
<edge from-layer="2629" from-port="0" to-layer="2631" to-port="3" />
|
|
<edge from-layer="2630" from-port="0" to-layer="2631" to-port="4" />
|
|
<edge from-layer="2631" from-port="5" to-layer="2636" to-port="0" />
|
|
<edge from-layer="2632" from-port="0" to-layer="2633" to-port="0" />
|
|
<edge from-layer="2633" from-port="1" to-layer="2635" to-port="0" />
|
|
<edge from-layer="2634" from-port="0" to-layer="2635" to-port="1" />
|
|
<edge from-layer="2635" from-port="2" to-layer="2636" to-port="1" />
|
|
<edge from-layer="2636" from-port="2" to-layer="2638" to-port="0" />
|
|
<edge from-layer="2637" from-port="0" to-layer="2638" to-port="1" />
|
|
<edge from-layer="2638" from-port="2" to-layer="2639" to-port="0" />
|
|
<edge from-layer="2639" from-port="2" to-layer="2641" to-port="0" />
|
|
<edge from-layer="2640" from-port="0" to-layer="2641" to-port="1" />
|
|
<edge from-layer="2641" from-port="2" to-layer="2643" to-port="0" />
|
|
<edge from-layer="2642" from-port="0" to-layer="2643" to-port="1" />
|
|
<edge from-layer="2643" from-port="2" to-layer="2645" to-port="0" />
|
|
<edge from-layer="2644" from-port="0" to-layer="2645" to-port="1" />
|
|
<edge from-layer="2645" from-port="2" to-layer="2647" to-port="0" />
|
|
<edge from-layer="2645" from-port="2" to-layer="2715" to-port="1" />
|
|
<edge from-layer="2646" from-port="0" to-layer="2647" to-port="1" />
|
|
<edge from-layer="2647" from-port="2" to-layer="2652" to-port="0" />
|
|
<edge from-layer="2648" from-port="0" to-layer="2652" to-port="1" />
|
|
<edge from-layer="2649" from-port="0" to-layer="2652" to-port="2" />
|
|
<edge from-layer="2650" from-port="0" to-layer="2652" to-port="3" />
|
|
<edge from-layer="2651" from-port="0" to-layer="2652" to-port="4" />
|
|
<edge from-layer="2652" from-port="5" to-layer="2657" to-port="0" />
|
|
<edge from-layer="2652" from-port="5" to-layer="2673" to-port="0" />
|
|
<edge from-layer="2652" from-port="5" to-layer="2689" to-port="0" />
|
|
<edge from-layer="2653" from-port="0" to-layer="2654" to-port="0" />
|
|
<edge from-layer="2654" from-port="1" to-layer="2656" to-port="0" />
|
|
<edge from-layer="2655" from-port="0" to-layer="2656" to-port="1" />
|
|
<edge from-layer="2656" from-port="2" to-layer="2657" to-port="1" />
|
|
<edge from-layer="2657" from-port="2" to-layer="2659" to-port="0" />
|
|
<edge from-layer="2658" from-port="0" to-layer="2659" to-port="1" />
|
|
<edge from-layer="2659" from-port="2" to-layer="2664" to-port="0" />
|
|
<edge from-layer="2660" from-port="0" to-layer="2664" to-port="1" />
|
|
<edge from-layer="2661" from-port="0" to-layer="2664" to-port="2" />
|
|
<edge from-layer="2662" from-port="0" to-layer="2664" to-port="3" />
|
|
<edge from-layer="2663" from-port="0" to-layer="2664" to-port="4" />
|
|
<edge from-layer="2664" from-port="5" to-layer="2666" to-port="0" />
|
|
<edge from-layer="2665" from-port="0" to-layer="2666" to-port="1" />
|
|
<edge from-layer="2666" from-port="2" to-layer="2668" to-port="0" />
|
|
<edge from-layer="2667" from-port="0" to-layer="2668" to-port="1" />
|
|
<edge from-layer="2668" from-port="2" to-layer="2696" to-port="0" />
|
|
<edge from-layer="2669" from-port="0" to-layer="2670" to-port="0" />
|
|
<edge from-layer="2670" from-port="1" to-layer="2672" to-port="0" />
|
|
<edge from-layer="2671" from-port="0" to-layer="2672" to-port="1" />
|
|
<edge from-layer="2672" from-port="2" to-layer="2673" to-port="1" />
|
|
<edge from-layer="2673" from-port="2" to-layer="2675" to-port="0" />
|
|
<edge from-layer="2674" from-port="0" to-layer="2675" to-port="1" />
|
|
<edge from-layer="2675" from-port="2" to-layer="2680" to-port="0" />
|
|
<edge from-layer="2676" from-port="0" to-layer="2680" to-port="1" />
|
|
<edge from-layer="2677" from-port="0" to-layer="2680" to-port="2" />
|
|
<edge from-layer="2678" from-port="0" to-layer="2680" to-port="3" />
|
|
<edge from-layer="2679" from-port="0" to-layer="2680" to-port="4" />
|
|
<edge from-layer="2680" from-port="5" to-layer="2682" to-port="0" />
|
|
<edge from-layer="2681" from-port="0" to-layer="2682" to-port="1" />
|
|
<edge from-layer="2682" from-port="2" to-layer="2684" to-port="0" />
|
|
<edge from-layer="2683" from-port="0" to-layer="2684" to-port="1" />
|
|
<edge from-layer="2684" from-port="2" to-layer="2696" to-port="1" />
|
|
<edge from-layer="2685" from-port="0" to-layer="2686" to-port="0" />
|
|
<edge from-layer="2686" from-port="1" to-layer="2688" to-port="0" />
|
|
<edge from-layer="2687" from-port="0" to-layer="2688" to-port="1" />
|
|
<edge from-layer="2688" from-port="2" to-layer="2689" to-port="1" />
|
|
<edge from-layer="2689" from-port="2" to-layer="2691" to-port="0" />
|
|
<edge from-layer="2690" from-port="0" to-layer="2691" to-port="1" />
|
|
<edge from-layer="2691" from-port="2" to-layer="2693" to-port="0" />
|
|
<edge from-layer="2692" from-port="0" to-layer="2693" to-port="1" />
|
|
<edge from-layer="2693" from-port="2" to-layer="2695" to-port="0" />
|
|
<edge from-layer="2694" from-port="0" to-layer="2695" to-port="1" />
|
|
<edge from-layer="2695" from-port="2" to-layer="2696" to-port="2" />
|
|
<edge from-layer="2696" from-port="4" to-layer="2698" to-port="0" />
|
|
<edge from-layer="2697" from-port="0" to-layer="2698" to-port="1" />
|
|
<edge from-layer="2698" from-port="2" to-layer="2700" to-port="0" />
|
|
<edge from-layer="2699" from-port="0" to-layer="2700" to-port="1" />
|
|
<edge from-layer="2700" from-port="2" to-layer="2702" to-port="0" />
|
|
<edge from-layer="2701" from-port="0" to-layer="2702" to-port="1" />
|
|
<edge from-layer="2702" from-port="2" to-layer="2707" to-port="0" />
|
|
<edge from-layer="2703" from-port="0" to-layer="2707" to-port="1" />
|
|
<edge from-layer="2704" from-port="0" to-layer="2707" to-port="2" />
|
|
<edge from-layer="2705" from-port="0" to-layer="2707" to-port="3" />
|
|
<edge from-layer="2706" from-port="0" to-layer="2707" to-port="4" />
|
|
<edge from-layer="2707" from-port="5" to-layer="2712" to-port="0" />
|
|
<edge from-layer="2708" from-port="0" to-layer="2709" to-port="0" />
|
|
<edge from-layer="2709" from-port="1" to-layer="2711" to-port="0" />
|
|
<edge from-layer="2710" from-port="0" to-layer="2711" to-port="1" />
|
|
<edge from-layer="2711" from-port="2" to-layer="2712" to-port="1" />
|
|
<edge from-layer="2712" from-port="2" to-layer="2714" to-port="0" />
|
|
<edge from-layer="2713" from-port="0" to-layer="2714" to-port="1" />
|
|
<edge from-layer="2714" from-port="2" to-layer="2715" to-port="0" />
|
|
<edge from-layer="2715" from-port="2" to-layer="2717" to-port="0" />
|
|
<edge from-layer="2716" from-port="0" to-layer="2717" to-port="1" />
|
|
<edge from-layer="2717" from-port="2" to-layer="2719" to-port="0" />
|
|
<edge from-layer="2718" from-port="0" to-layer="2719" to-port="1" />
|
|
<edge from-layer="2719" from-port="2" to-layer="2721" to-port="0" />
|
|
<edge from-layer="2720" from-port="0" to-layer="2721" to-port="1" />
|
|
<edge from-layer="2721" from-port="2" to-layer="2723" to-port="0" />
|
|
<edge from-layer="2721" from-port="2" to-layer="2751" to-port="1" />
|
|
<edge from-layer="2722" from-port="0" to-layer="2723" to-port="1" />
|
|
<edge from-layer="2723" from-port="2" to-layer="2728" to-port="0" />
|
|
<edge from-layer="2724" from-port="0" to-layer="2728" to-port="1" />
|
|
<edge from-layer="2725" from-port="0" to-layer="2728" to-port="2" />
|
|
<edge from-layer="2726" from-port="0" to-layer="2728" to-port="3" />
|
|
<edge from-layer="2727" from-port="0" to-layer="2728" to-port="4" />
|
|
<edge from-layer="2728" from-port="5" to-layer="2733" to-port="0" />
|
|
<edge from-layer="2729" from-port="0" to-layer="2730" to-port="0" />
|
|
<edge from-layer="2730" from-port="1" to-layer="2732" to-port="0" />
|
|
<edge from-layer="2731" from-port="0" to-layer="2732" to-port="1" />
|
|
<edge from-layer="2732" from-port="2" to-layer="2733" to-port="1" />
|
|
<edge from-layer="2733" from-port="2" to-layer="2735" to-port="0" />
|
|
<edge from-layer="2734" from-port="0" to-layer="2735" to-port="1" />
|
|
<edge from-layer="2735" from-port="2" to-layer="2736" to-port="0" />
|
|
<edge from-layer="2736" from-port="1" to-layer="2738" to-port="0" />
|
|
<edge from-layer="2737" from-port="0" to-layer="2738" to-port="1" />
|
|
<edge from-layer="2738" from-port="2" to-layer="2743" to-port="0" />
|
|
<edge from-layer="2739" from-port="0" to-layer="2743" to-port="1" />
|
|
<edge from-layer="2740" from-port="0" to-layer="2743" to-port="2" />
|
|
<edge from-layer="2741" from-port="0" to-layer="2743" to-port="3" />
|
|
<edge from-layer="2742" from-port="0" to-layer="2743" to-port="4" />
|
|
<edge from-layer="2743" from-port="5" to-layer="2748" to-port="0" />
|
|
<edge from-layer="2744" from-port="0" to-layer="2745" to-port="0" />
|
|
<edge from-layer="2745" from-port="1" to-layer="2747" to-port="0" />
|
|
<edge from-layer="2746" from-port="0" to-layer="2747" to-port="1" />
|
|
<edge from-layer="2747" from-port="2" to-layer="2748" to-port="1" />
|
|
<edge from-layer="2748" from-port="2" to-layer="2750" to-port="0" />
|
|
<edge from-layer="2749" from-port="0" to-layer="2750" to-port="1" />
|
|
<edge from-layer="2750" from-port="2" to-layer="2751" to-port="0" />
|
|
<edge from-layer="2751" from-port="2" to-layer="2753" to-port="0" />
|
|
<edge from-layer="2752" from-port="0" to-layer="2753" to-port="1" />
|
|
<edge from-layer="2753" from-port="2" to-layer="2755" to-port="0" />
|
|
<edge from-layer="2754" from-port="0" to-layer="2755" to-port="1" />
|
|
<edge from-layer="2755" from-port="2" to-layer="2757" to-port="0" />
|
|
<edge from-layer="2756" from-port="0" to-layer="2757" to-port="1" />
|
|
<edge from-layer="2757" from-port="2" to-layer="2760" to-port="0" />
|
|
<edge from-layer="2758" from-port="0" to-layer="2760" to-port="1" />
|
|
<edge from-layer="2759" from-port="0" to-layer="2760" to-port="2" />
|
|
<edge from-layer="2760" from-port="3" to-layer="2762" to-port="0" />
|
|
<edge from-layer="2761" from-port="0" to-layer="2762" to-port="1" />
|
|
<edge from-layer="2762" from-port="2" to-layer="2767" to-port="0" />
|
|
<edge from-layer="2763" from-port="0" to-layer="2767" to-port="1" />
|
|
<edge from-layer="2764" from-port="0" to-layer="2767" to-port="2" />
|
|
<edge from-layer="2765" from-port="0" to-layer="2767" to-port="3" />
|
|
<edge from-layer="2766" from-port="0" to-layer="2767" to-port="4" />
|
|
<edge from-layer="2767" from-port="5" to-layer="2772" to-port="0" />
|
|
<edge from-layer="2768" from-port="0" to-layer="2769" to-port="0" />
|
|
<edge from-layer="2769" from-port="1" to-layer="2771" to-port="0" />
|
|
<edge from-layer="2770" from-port="0" to-layer="2771" to-port="1" />
|
|
<edge from-layer="2771" from-port="2" to-layer="2772" to-port="1" />
|
|
<edge from-layer="2772" from-port="2" to-layer="2774" to-port="0" />
|
|
<edge from-layer="2773" from-port="0" to-layer="2774" to-port="1" />
|
|
<edge from-layer="2774" from-port="2" to-layer="2775" to-port="0" />
|
|
<edge from-layer="2775" from-port="1" to-layer="2777" to-port="0" />
|
|
<edge from-layer="2776" from-port="0" to-layer="2777" to-port="1" />
|
|
<edge from-layer="2777" from-port="2" to-layer="2782" to-port="0" />
|
|
<edge from-layer="2778" from-port="0" to-layer="2782" to-port="1" />
|
|
<edge from-layer="2779" from-port="0" to-layer="2782" to-port="2" />
|
|
<edge from-layer="2780" from-port="0" to-layer="2782" to-port="3" />
|
|
<edge from-layer="2781" from-port="0" to-layer="2782" to-port="4" />
|
|
<edge from-layer="2782" from-port="5" to-layer="2787" to-port="0" />
|
|
<edge from-layer="2783" from-port="0" to-layer="2784" to-port="0" />
|
|
<edge from-layer="2784" from-port="1" to-layer="2786" to-port="0" />
|
|
<edge from-layer="2785" from-port="0" to-layer="2786" to-port="1" />
|
|
<edge from-layer="2786" from-port="2" to-layer="2787" to-port="1" />
|
|
<edge from-layer="2787" from-port="2" to-layer="2789" to-port="0" />
|
|
<edge from-layer="2788" from-port="0" to-layer="2789" to-port="1" />
|
|
<edge from-layer="2789" from-port="2" to-layer="2790" to-port="0" />
|
|
</edges>
|
|
<rt_info>
|
|
<Runtime_version value="2024.4.1-16618-643f23d1318-releases/2024/4" />
|
|
<conversion_parameters>
|
|
<framework value="pytorch" />
|
|
<is_python_object value="True" />
|
|
</conversion_parameters>
|
|
<nncf>
|
|
<friendly_names_were_updated value="True" />
|
|
<quantization>
|
|
<advanced_parameters value="{'overflow_fix': 'disable', 'quantize_outputs': False, 'inplace_statistics': True, 'disable_channel_alignment': True, 'disable_bias_correction': False, 'batchwise_statistics': None, 'activations_quantization_params': None, 'weights_quantization_params': None, 'activations_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'weights_range_estimator_params': {'min': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}, 'max': {'statistics_type': None, 'aggregator_type': None, 'clipping_value': None, 'quantile_outlier_prob': 0.0001}}, 'bias_correction_params': {'apply_for_all_nodes': False, 'threshold': None}, 'smooth_quant_alphas': {'convolution': -1, 'matmul': 0.95}, 'smooth_quant_alpha': None, 'backend_params': {}}" />
|
|
<fast_bias_correction value="True" />
|
|
<ignored_scope>
|
|
<types value="['GroupNormalization']" />
|
|
</ignored_scope>
|
|
<model_type value="transformer" />
|
|
<preset value="mixed" />
|
|
<subset_size value="300" />
|
|
<target_device value="ANY" />
|
|
</quantization>
|
|
</nncf>
|
|
<optimum>
|
|
<optimum_intel_version value="1.20.1" />
|
|
<optimum_version value="1.24.0" />
|
|
<pytorch_version value="2.6.0+cu124" />
|
|
<transformers_version value="4.52.0.dev0" />
|
|
</optimum>
|
|
</rt_info>
|
|
</net>
|