diff --git a/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_performance_transformer.dot b/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_performance_transformer.dot index e9f9efc75de..e7bc88fe652 100644 --- a/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_performance_transformer.dot +++ b/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_performance_transformer.dot @@ -1,4 +1,4 @@ -strict digraph { +strict digraph { "0 input.1" [id=0, type=Parameter]; "1 /Add" [id=1, type=Add]; "2 MVN_19" [id=2, type=MVN]; @@ -12,211 +12,196 @@ strict digraph { "10 /Reshape_3" [id=10, type=Reshape]; "11 /mlp/fc1/Add" [id=11, type=Add]; "12 /attn/qkv/MatMul" [id=12, type=MatMul]; -"13 /mlp/act/Div" [id=13, type=Multiply]; -"14 /mlp/act/Mul" [id=14, type=Multiply]; -"15 /attn/qkv/Add" [id=15, type=Add]; -"16 /mlp/act/Erf" [id=16, type=Erf]; -"17 /mlp/act/Mul_1" [id=17, type=Multiply]; -"18 /attn/Reshape" [id=18, type=Reshape]; -"19 /mlp/act/Add" [id=19, type=Add]; -"20 /mlp/act/Mul_1/fq_output_0" [id=20, type=FakeQuantize]; -"21 /attn/Transpose" [id=21, type=Transpose]; -"22 /mlp/fc2/MatMul" [id=22, type=MatMul]; -"23 /attn/Gather" [id=23, type=Gather]; -"24 /attn/Gather_1/fq_input_0" [id=24, type=FakeQuantize]; -"25 /attn/Gather_2" [id=25, type=Gather]; -"26 /mlp/fc2/Add" [id=26, type=Add]; -"27 /attn/Mul" [id=27, type=Multiply]; -"28 /attn/Gather_1" [id=28, type=Gather]; -"29 /attn/MatMul_1" [id=29, type=ScaledDotProductAttention]; -"30 /attn/Mul/fq_output_0" [id=30, type=FakeQuantize]; -"31 /attn/MatMul_1/fq_output_0" [id=31, type=FakeQuantize]; -"32 /attn/Transpose_2" [id=32, type=Transpose]; -"33 /attn/Reshape_1" [id=33, type=Reshape]; -"34 /attn/proj/MatMul" [id=34, type=MatMul]; -"35 /attn/proj/Add" [id=35, type=Add]; -"36 /mlp/fc2/MatMul/fq_weights_1" [id=36, type=FakeQuantize]; -"37 /mlp/fc2/MatMul/fq_weights_1/output_high" [id=37, type=Constant]; -"38 /mlp/fc2/MatMul/fq_weights_1/output_low" [id=38, type=Constant]; -"39 /mlp/fc2/MatMul/fq_weights_1/input_high" [id=39, type=Constant]; -"40 /mlp/fc2/MatMul/fq_weights_1/input_low" [id=40, type=Constant]; -"41 Transpose_1888" [id=41, type=Constant]; -"42 /mlp/act/Mul_1/fq_output_0/output_high" [id=42, type=Constant]; -"43 /mlp/act/Mul_1/fq_output_0/output_low" [id=43, type=Constant]; -"44 /mlp/act/Mul_1/fq_output_0/input_high" [id=44, type=Constant]; -"45 /mlp/act/Mul_1/fq_output_0/input_low" [id=45, type=Constant]; -"46 Constant_1926" [id=46, type=Constant]; -"47 Constant_1925" [id=47, type=Constant]; -"48 Constant_1924" [id=48, type=Constant]; -"49 /mlp/fc1/MatMul/fq_weights_1" [id=49, type=FakeQuantize]; -"50 /mlp/fc1/MatMul/fq_weights_1/output_high" [id=50, type=Constant]; -"51 /mlp/fc1/MatMul/fq_weights_1/output_low" [id=51, type=Constant]; -"52 /mlp/fc1/MatMul/fq_weights_1/input_high" [id=52, type=Constant]; -"53 /mlp/fc1/MatMul/fq_weights_1/input_low" [id=53, type=Constant]; -"54 Transpose_1873" [id=54, type=Constant]; -"55 MVN_74/fq_output_0/output_high" [id=55, type=Constant]; -"56 MVN_74/fq_output_0/output_low" [id=56, type=Constant]; -"57 MVN_74/fq_output_0/input_high" [id=57, type=Constant]; -"58 MVN_74/fq_output_0/input_low" [id=58, type=Constant]; -"59 Range_73" [id=59, type=Constant]; -"60 /attn/proj/MatMul/fq_weights_1" [id=60, type=FakeQuantize]; -"61 /attn/proj/MatMul/fq_weights_1/output_high" [id=61, type=Constant]; -"62 /attn/proj/MatMul/fq_weights_1/output_low" [id=62, type=Constant]; -"63 /attn/proj/MatMul/fq_weights_1/input_high" [id=63, type=Constant]; -"64 /attn/proj/MatMul/fq_weights_1/input_low" [id=64, type=Constant]; -"65 Transpose_1862" [id=65, type=Constant]; -"66 /attn/Constant_2" [id=66, type=Constant]; -"67 Constant_53" [id=67, type=Constant]; -"68 /attn/MatMul_1/fq_output_0/output_high" [id=68, type=Constant]; -"69 /attn/MatMul_1/fq_output_0/output_low" [id=69, type=Constant]; -"70 /attn/MatMul_1/fq_output_0/input_high" [id=70, type=Constant]; -"71 /attn/MatMul_1/fq_output_0/input_low" [id=71, type=Constant]; -"72 Constant_1859" [id=72, type=Constant]; -"73 onnx^^Add_194" [id=73, label="73 onnx::Add_194", type=Constant]; -"74 Constant_43" [id=74, type=Constant]; -"75 /Constant_1" [id=75, type=Constant]; -"76 Constant_37" [id=76, type=Constant]; -"77 /attn/Constant" [id=77, type=Constant]; -"78 /attn/qkv/MatMul/fq_weights_1" [id=78, type=FakeQuantize]; -"79 /attn/qkv/MatMul/fq_weights_1/output_high" [id=79, type=Constant]; -"80 /attn/qkv/MatMul/fq_weights_1/output_low" [id=80, type=Constant]; -"81 /attn/qkv/MatMul/fq_weights_1/input_high" [id=81, type=Constant]; -"82 /attn/qkv/MatMul/fq_weights_1/input_low" [id=82, type=Constant]; -"83 Transpose_1847" [id=83, type=Constant]; -"84 Constant_1943" [id=84, type=Constant]; -"85 Multiply_20/fq_output_0/output_high" [id=85, type=Constant]; -"86 Multiply_20/fq_output_0/output_low" [id=86, type=Constant]; -"87 Multiply_20/fq_output_0/input_high" [id=87, type=Constant]; -"88 Multiply_20/fq_output_0/input_low" [id=88, type=Constant]; -"89 Constant_1919" [id=89, type=Constant]; -"90 Range_18" [id=90, type=Constant]; -"91 Constant_1920" [id=91, type=Constant]; -"92 Constant_41" [id=92, type=Constant]; -"93 /Constant_3" [id=93, type=Constant]; -"94 /attn/Gather_1/fq_input_0/output_high" [id=94, type=Constant]; -"95 /attn/Gather_1/fq_input_0/output_low" [id=95, type=Constant]; -"96 /attn/Gather_1/fq_input_0/input_high" [id=96, type=Constant]; -"97 /attn/Gather_1/fq_input_0/input_low" [id=97, type=Constant]; -"98 /attn/Mul/fq_output_0/output_high" [id=98, type=Constant]; -"99 /attn/Mul/fq_output_0/output_low" [id=99, type=Constant]; -"100 /attn/Mul/fq_output_0/input_high" [id=100, type=Constant]; -"101 /attn/Mul/fq_output_0/input_low" [id=101, type=Constant]; -"102 Constant_1921" [id=102, type=Constant]; -"103 Constant_39" [id=103, type=Constant]; -"104 /Constant" [id=104, type=Constant]; -"105 Constant_1922" [id=105, type=Constant]; -"106 Constant_1923" [id=106, type=Constant]; -"107 Constant_1927" [id=107, type=Constant]; -"0 input.1" -> "1 /Add" [label="[1, 16, 8]", style=solid]; -"0 input.1" -> "2 MVN_19" [label="[1, 16, 8]", style=solid]; -"1 /Add" -> "3 161" [label="[1, 16, 8]", style=solid]; -"1 /Add" -> "4 MVN_74" [label="[1, 16, 8]", style=solid]; -"2 MVN_19" -> "5 Multiply_20" [label="[1, 16, 8]", style=solid]; -"3 161" -> "6 161/sink_port_0" [label="[1, 16, 8]", style=solid]; -"4 MVN_74" -> "7 MVN_74/fq_output_0" [label="[1, 16, 8]", style=solid]; -"5 Multiply_20" -> "8 Multiply_20/fq_output_0" [label="[1, 16, 8]", style=solid]; -"7 MVN_74/fq_output_0" -> "9 /mlp/fc1/MatMul" [label="[1, 16, 8]", style=solid]; -"8 Multiply_20/fq_output_0" -> "10 /Reshape_3" [label="[1, 16, 8]", style=solid]; -"9 /mlp/fc1/MatMul" -> "11 /mlp/fc1/Add" [label="[1, 16, 32]", style=solid]; -"10 /Reshape_3" -> "12 /attn/qkv/MatMul" [label="[1, 16, 8]", style=solid]; -"11 /mlp/fc1/Add" -> "13 /mlp/act/Div" [label="[1, 16, 32]", style=solid]; -"11 /mlp/fc1/Add" -> "14 /mlp/act/Mul" [label="[1, 16, 32]", style=solid]; -"12 /attn/qkv/MatMul" -> "15 /attn/qkv/Add" [label="[1, 16, 24]", style=solid]; -"13 /mlp/act/Div" -> "16 /mlp/act/Erf" [label="[1, 16, 32]", style=solid]; -"14 /mlp/act/Mul" -> "17 /mlp/act/Mul_1" [label="[1, 16, 32]", style=solid]; -"15 /attn/qkv/Add" -> "18 /attn/Reshape" [label="[1, 16, 24]", style=solid]; -"16 /mlp/act/Erf" -> "19 /mlp/act/Add" [label="[1, 16, 32]", style=solid]; -"17 /mlp/act/Mul_1" -> "20 /mlp/act/Mul_1/fq_output_0" [label="[1, 16, 32]", style=solid]; -"18 /attn/Reshape" -> "21 /attn/Transpose" [label="[1, 16, 3, 2, 4]", style=solid]; -"19 /mlp/act/Add" -> "14 /mlp/act/Mul" [label="[1, 16, 32]", style=solid]; -"20 /mlp/act/Mul_1/fq_output_0" -> "22 /mlp/fc2/MatMul" [label="[1, 16, 32]", style=solid]; -"21 /attn/Transpose" -> "23 /attn/Gather" [label="[3, 1, 2, 16, 4]", style=solid]; -"21 /attn/Transpose" -> "24 /attn/Gather_1/fq_input_0" [label="[3, 1, 2, 16, 4]", style=solid]; -"21 /attn/Transpose" -> "25 /attn/Gather_2" [label="[3, 1, 2, 16, 4]", style=solid]; -"22 /mlp/fc2/MatMul" -> "26 /mlp/fc2/Add" [label="[1, 16, 8]", style=solid]; -"23 /attn/Gather" -> "27 /attn/Mul" [label="[1, 2, 16, 4]", style=solid]; -"24 /attn/Gather_1/fq_input_0" -> "28 /attn/Gather_1" [label="[3, 1, 2, 16, 4]", style=solid]; -"25 /attn/Gather_2" -> "29 /attn/MatMul_1" [label="[1, 2, 16, 4]", style=solid]; -"26 /mlp/fc2/Add" -> "3 161" [label="[1, 16, 8]", style=solid]; -"27 /attn/Mul" -> "30 /attn/Mul/fq_output_0" [label="[1, 2, 16, 4]", style=solid]; -"28 /attn/Gather_1" -> "29 /attn/MatMul_1" [label="[1, 2, 16, 4]", style=solid]; -"29 /attn/MatMul_1" -> "31 /attn/MatMul_1/fq_output_0" [label="[1, 2, 16, 4]", style=solid]; -"30 /attn/Mul/fq_output_0" -> "29 /attn/MatMul_1" [label="[1, 2, 16, 4]", style=solid]; -"31 /attn/MatMul_1/fq_output_0" -> "32 /attn/Transpose_2" [label="[1, 2, 16, 4]", style=solid]; -"32 /attn/Transpose_2" -> "33 /attn/Reshape_1" [label="[1, 16, 2, 4]", style=solid]; -"33 /attn/Reshape_1" -> "34 /attn/proj/MatMul" [label="[1, 16, 8]", style=solid]; -"34 /attn/proj/MatMul" -> "35 /attn/proj/Add" [label="[1, 16, 8]", style=solid]; -"35 /attn/proj/Add" -> "1 /Add" [label="[1, 16, 8]", style=solid]; -"36 /mlp/fc2/MatMul/fq_weights_1" -> "22 /mlp/fc2/MatMul" [label="[8, 32]", style=solid]; -"37 /mlp/fc2/MatMul/fq_weights_1/output_high" -> "36 /mlp/fc2/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"38 /mlp/fc2/MatMul/fq_weights_1/output_low" -> "36 /mlp/fc2/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"39 /mlp/fc2/MatMul/fq_weights_1/input_high" -> "36 /mlp/fc2/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"40 /mlp/fc2/MatMul/fq_weights_1/input_low" -> "36 /mlp/fc2/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"41 Transpose_1888" -> "36 /mlp/fc2/MatMul/fq_weights_1" [label="[8, 32]", style=solid]; -"42 /mlp/act/Mul_1/fq_output_0/output_high" -> "20 /mlp/act/Mul_1/fq_output_0" [label="[]", style=solid]; -"43 /mlp/act/Mul_1/fq_output_0/output_low" -> "20 /mlp/act/Mul_1/fq_output_0" [label="[]", style=solid]; -"44 /mlp/act/Mul_1/fq_output_0/input_high" -> "20 /mlp/act/Mul_1/fq_output_0" [label="[]", style=solid]; -"45 /mlp/act/Mul_1/fq_output_0/input_low" -> "20 /mlp/act/Mul_1/fq_output_0" [label="[]", style=solid]; -"46 Constant_1926" -> "17 /mlp/act/Mul_1" [label="[1, 1, 1]", style=solid]; -"47 Constant_1925" -> "19 /mlp/act/Add" [label="[1, 1, 1]", style=solid]; -"48 Constant_1924" -> "13 /mlp/act/Div" [label="[1, 1, 1]", style=solid]; -"49 /mlp/fc1/MatMul/fq_weights_1" -> "9 /mlp/fc1/MatMul" [label="[32, 8]", style=solid]; -"50 /mlp/fc1/MatMul/fq_weights_1/output_high" -> "49 /mlp/fc1/MatMul/fq_weights_1" [label="[32, 1]", style=solid]; -"51 /mlp/fc1/MatMul/fq_weights_1/output_low" -> "49 /mlp/fc1/MatMul/fq_weights_1" [label="[32, 1]", style=solid]; -"52 /mlp/fc1/MatMul/fq_weights_1/input_high" -> "49 /mlp/fc1/MatMul/fq_weights_1" [label="[32, 1]", style=solid]; -"53 /mlp/fc1/MatMul/fq_weights_1/input_low" -> "49 /mlp/fc1/MatMul/fq_weights_1" [label="[32, 1]", style=solid]; -"54 Transpose_1873" -> "49 /mlp/fc1/MatMul/fq_weights_1" [label="[32, 8]", style=solid]; -"55 MVN_74/fq_output_0/output_high" -> "7 MVN_74/fq_output_0" [label="[]", style=solid]; -"56 MVN_74/fq_output_0/output_low" -> "7 MVN_74/fq_output_0" [label="[]", style=solid]; -"57 MVN_74/fq_output_0/input_high" -> "7 MVN_74/fq_output_0" [label="[]", style=solid]; -"58 MVN_74/fq_output_0/input_low" -> "7 MVN_74/fq_output_0" [label="[]", style=solid]; -"59 Range_73" -> "4 MVN_74" [label="[1]", style=dashed]; -"60 /attn/proj/MatMul/fq_weights_1" -> "34 /attn/proj/MatMul" [label="[8, 8]", style=solid]; -"61 /attn/proj/MatMul/fq_weights_1/output_high" -> "60 /attn/proj/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"62 /attn/proj/MatMul/fq_weights_1/output_low" -> "60 /attn/proj/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"63 /attn/proj/MatMul/fq_weights_1/input_high" -> "60 /attn/proj/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"64 /attn/proj/MatMul/fq_weights_1/input_low" -> "60 /attn/proj/MatMul/fq_weights_1" [label="[8, 1]", style=solid]; -"65 Transpose_1862" -> "60 /attn/proj/MatMul/fq_weights_1" [label="[8, 8]", style=solid]; -"66 /attn/Constant_2" -> "33 /attn/Reshape_1" [label="[3]", style=dashed]; -"67 Constant_53" -> "32 /attn/Transpose_2" [label="[4]", style=dashed]; -"68 /attn/MatMul_1/fq_output_0/output_high" -> "31 /attn/MatMul_1/fq_output_0" [label="[]", style=solid]; -"69 /attn/MatMul_1/fq_output_0/output_low" -> "31 /attn/MatMul_1/fq_output_0" [label="[]", style=solid]; -"70 /attn/MatMul_1/fq_output_0/input_high" -> "31 /attn/MatMul_1/fq_output_0" [label="[]", style=solid]; -"71 /attn/MatMul_1/fq_output_0/input_low" -> "31 /attn/MatMul_1/fq_output_0" [label="[]", style=solid]; -"72 Constant_1859" -> "29 /attn/MatMul_1" [label="[]", style=solid]; -"73 onnx^^Add_194" -> "29 /attn/MatMul_1" [label="[1, 2, 16, 16]", style=solid]; -"74 Constant_43" -> "25 /attn/Gather_2" [label="[]", style=dashed]; -"75 /Constant_1" -> "25 /attn/Gather_2" [label="[]", style=dashed]; -"76 Constant_37" -> "21 /attn/Transpose" [label="[5]", style=dashed]; -"77 /attn/Constant" -> "18 /attn/Reshape" [label="[5]", style=dashed]; -"78 /attn/qkv/MatMul/fq_weights_1" -> "12 /attn/qkv/MatMul" [label="[24, 8]", style=solid]; -"79 /attn/qkv/MatMul/fq_weights_1/output_high" -> "78 /attn/qkv/MatMul/fq_weights_1" [label="[24, 1]", style=solid]; -"80 /attn/qkv/MatMul/fq_weights_1/output_low" -> "78 /attn/qkv/MatMul/fq_weights_1" [label="[24, 1]", style=solid]; -"81 /attn/qkv/MatMul/fq_weights_1/input_high" -> "78 /attn/qkv/MatMul/fq_weights_1" [label="[24, 1]", style=solid]; -"82 /attn/qkv/MatMul/fq_weights_1/input_low" -> "78 /attn/qkv/MatMul/fq_weights_1" [label="[24, 1]", style=solid]; -"83 Transpose_1847" -> "78 /attn/qkv/MatMul/fq_weights_1" [label="[24, 8]", style=solid]; -"84 Constant_1943" -> "10 /Reshape_3" [label="[3]", style=dashed]; -"85 Multiply_20/fq_output_0/output_high" -> "8 Multiply_20/fq_output_0" [label="[]", style=solid]; -"86 Multiply_20/fq_output_0/output_low" -> "8 Multiply_20/fq_output_0" [label="[]", style=solid]; -"87 Multiply_20/fq_output_0/input_high" -> "8 Multiply_20/fq_output_0" [label="[]", style=solid]; -"88 Multiply_20/fq_output_0/input_low" -> "8 Multiply_20/fq_output_0" [label="[]", style=solid]; -"89 Constant_1919" -> "5 Multiply_20" [label="[1, 1, 8]", style=solid]; -"90 Range_18" -> "2 MVN_19" [label="[1]", style=dashed]; -"91 Constant_1920" -> "15 /attn/qkv/Add" [label="[1, 1, 24]", style=solid]; -"92 Constant_41" -> "28 /attn/Gather_1" [label="[]", style=dashed]; -"93 /Constant_3" -> "28 /attn/Gather_1" [label="[]", style=dashed]; -"94 /attn/Gather_1/fq_input_0/output_high" -> "24 /attn/Gather_1/fq_input_0" [label="[]", style=solid]; -"95 /attn/Gather_1/fq_input_0/output_low" -> "24 /attn/Gather_1/fq_input_0" [label="[]", style=solid]; -"96 /attn/Gather_1/fq_input_0/input_high" -> "24 /attn/Gather_1/fq_input_0" [label="[]", style=solid]; -"97 /attn/Gather_1/fq_input_0/input_low" -> "24 /attn/Gather_1/fq_input_0" [label="[]", style=solid]; -"98 /attn/Mul/fq_output_0/output_high" -> "30 /attn/Mul/fq_output_0" [label="[]", style=solid]; -"99 /attn/Mul/fq_output_0/output_low" -> "30 /attn/Mul/fq_output_0" [label="[]", style=solid]; -"100 /attn/Mul/fq_output_0/input_high" -> "30 /attn/Mul/fq_output_0" [label="[]", style=solid]; -"101 /attn/Mul/fq_output_0/input_low" -> "30 /attn/Mul/fq_output_0" [label="[]", style=solid]; -"102 Constant_1921" -> "27 /attn/Mul" [label="[1, 1, 1, 1]", style=solid]; -"103 Constant_39" -> "23 /attn/Gather" [label="[]", style=dashed]; -"104 /Constant" -> "23 /attn/Gather" [label="[]", style=dashed]; -"105 Constant_1922" -> "35 /attn/proj/Add" [label="[1, 1, 8]", style=solid]; -"106 Constant_1923" -> "11 /mlp/fc1/Add" [label="[1, 1, 32]", style=solid]; -"107 Constant_1927" -> "26 /mlp/fc2/Add" [label="[1, 1, 8]", style=solid]; +"13 /mlp/act/Mul_1" [id=13, type=Gelu]; +"14 /attn/qkv/Add" [id=14, type=Add]; +"15 /mlp/act/Mul_1/fq_output_0" [id=15, type=FakeQuantize]; +"16 /attn/Reshape" [id=16, type=Reshape]; +"17 /mlp/fc2/MatMul" [id=17, type=MatMul]; +"18 /attn/Transpose" [id=18, type=Transpose]; +"19 /mlp/fc2/Add" [id=19, type=Add]; +"20 /attn/Gather" [id=20, type=Gather]; +"21 /attn/Gather_1/fq_input_0" [id=21, type=FakeQuantize]; +"22 /attn/Gather_2" [id=22, type=Gather]; +"23 /attn/Mul" [id=23, type=Multiply]; +"24 /attn/Gather_1" [id=24, type=Gather]; +"25 /attn/MatMul_1" [id=25, type=ScaledDotProductAttention]; +"26 /attn/Mul/fq_output_0" [id=26, type=FakeQuantize]; +"27 /attn/MatMul_1/fq_output_0" [id=27, type=FakeQuantize]; +"28 /attn/Transpose_2" [id=28, type=Transpose]; +"29 /attn/Reshape_1" [id=29, type=Reshape]; +"30 /attn/proj/MatMul" [id=30, type=MatMul]; +"31 /attn/proj/Add" [id=31, type=Add]; +"32 /mlp/fc2/MatMul/fq_weights_1" [id=32, type=FakeQuantize]; +"33 /mlp/fc2/MatMul/fq_weights_1/output_high" [id=33, type=Constant]; +"34 /mlp/fc2/MatMul/fq_weights_1/output_low" [id=34, type=Constant]; +"35 /mlp/fc2/MatMul/fq_weights_1/input_high" [id=35, type=Constant]; +"36 /mlp/fc2/MatMul/fq_weights_1/input_low" [id=36, type=Constant]; +"37 Transpose_1952" [id=37, type=Constant]; +"38 /mlp/act/Mul_1/fq_output_0/output_high" [id=38, type=Constant]; +"39 /mlp/act/Mul_1/fq_output_0/output_low" [id=39, type=Constant]; +"40 /mlp/act/Mul_1/fq_output_0/input_high" [id=40, type=Constant]; +"41 /mlp/act/Mul_1/fq_output_0/input_low" [id=41, type=Constant]; +"42 /mlp/fc1/MatMul/fq_weights_1" [id=42, type=FakeQuantize]; +"43 /mlp/fc1/MatMul/fq_weights_1/output_high" [id=43, type=Constant]; +"44 /mlp/fc1/MatMul/fq_weights_1/output_low" [id=44, type=Constant]; +"45 /mlp/fc1/MatMul/fq_weights_1/input_high" [id=45, type=Constant]; +"46 /mlp/fc1/MatMul/fq_weights_1/input_low" [id=46, type=Constant]; +"47 Transpose_1945" [id=47, type=Constant]; +"48 MVN_74/fq_output_0/output_high" [id=48, type=Constant]; +"49 MVN_74/fq_output_0/output_low" [id=49, type=Constant]; +"50 MVN_74/fq_output_0/input_high" [id=50, type=Constant]; +"51 MVN_74/fq_output_0/input_low" [id=51, type=Constant]; +"52 Range_73" [id=52, type=Constant]; +"53 /attn/proj/MatMul/fq_weights_1" [id=53, type=FakeQuantize]; +"54 /attn/proj/MatMul/fq_weights_1/output_high" [id=54, type=Constant]; +"55 /attn/proj/MatMul/fq_weights_1/output_low" [id=55, type=Constant]; +"56 /attn/proj/MatMul/fq_weights_1/input_high" [id=56, type=Constant]; +"57 /attn/proj/MatMul/fq_weights_1/input_low" [id=57, type=Constant]; +"58 Transpose_1934" [id=58, type=Constant]; +"59 /attn/Constant_2" [id=59, type=Constant]; +"60 Constant_53" [id=60, type=Constant]; +"61 /attn/MatMul_1/fq_output_0/output_high" [id=61, type=Constant]; +"62 /attn/MatMul_1/fq_output_0/output_low" [id=62, type=Constant]; +"63 /attn/MatMul_1/fq_output_0/input_high" [id=63, type=Constant]; +"64 /attn/MatMul_1/fq_output_0/input_low" [id=64, type=Constant]; +"65 Constant_1931" [id=65, type=Constant]; +"66 onnx^^Add_194" [id=66, type=Constant, label="66 onnx::Add_194"]; +"67 Constant_43" [id=67, type=Constant]; +"68 /Constant_1" [id=68, type=Constant]; +"69 Constant_37" [id=69, type=Constant]; +"70 /attn/Constant" [id=70, type=Constant]; +"71 /attn/qkv/MatMul/fq_weights_1" [id=71, type=FakeQuantize]; +"72 /attn/qkv/MatMul/fq_weights_1/output_high" [id=72, type=Constant]; +"73 /attn/qkv/MatMul/fq_weights_1/output_low" [id=73, type=Constant]; +"74 /attn/qkv/MatMul/fq_weights_1/input_high" [id=74, type=Constant]; +"75 /attn/qkv/MatMul/fq_weights_1/input_low" [id=75, type=Constant]; +"76 Transpose_1919" [id=76, type=Constant]; +"77 Constant_2004" [id=77, type=Constant]; +"78 Multiply_20/fq_output_0/output_high" [id=78, type=Constant]; +"79 Multiply_20/fq_output_0/output_low" [id=79, type=Constant]; +"80 Multiply_20/fq_output_0/input_high" [id=80, type=Constant]; +"81 Multiply_20/fq_output_0/input_low" [id=81, type=Constant]; +"82 Constant_1983" [id=82, type=Constant]; +"83 Range_18" [id=83, type=Constant]; +"84 Constant_1984" [id=84, type=Constant]; +"85 Constant_41" [id=85, type=Constant]; +"86 /Constant_3" [id=86, type=Constant]; +"87 /attn/Gather_1/fq_input_0/output_high" [id=87, type=Constant]; +"88 /attn/Gather_1/fq_input_0/output_low" [id=88, type=Constant]; +"89 /attn/Gather_1/fq_input_0/input_high" [id=89, type=Constant]; +"90 /attn/Gather_1/fq_input_0/input_low" [id=90, type=Constant]; +"91 /attn/Mul/fq_output_0/output_high" [id=91, type=Constant]; +"92 /attn/Mul/fq_output_0/output_low" [id=92, type=Constant]; +"93 /attn/Mul/fq_output_0/input_high" [id=93, type=Constant]; +"94 /attn/Mul/fq_output_0/input_low" [id=94, type=Constant]; +"95 Constant_1985" [id=95, type=Constant]; +"96 Constant_39" [id=96, type=Constant]; +"97 /Constant" [id=97, type=Constant]; +"98 Constant_1986" [id=98, type=Constant]; +"99 Constant_1987" [id=99, type=Constant]; +"100 Constant_1988" [id=100, type=Constant]; +"0 input.1" -> "1 /Add" [style=solid, label="[1, 16, 8]"]; +"0 input.1" -> "2 MVN_19" [style=solid, label="[1, 16, 8]"]; +"1 /Add" -> "3 161" [style=solid, label="[1, 16, 8]"]; +"1 /Add" -> "4 MVN_74" [style=solid, label="[1, 16, 8]"]; +"2 MVN_19" -> "5 Multiply_20" [style=solid, label="[1, 16, 8]"]; +"3 161" -> "6 161/sink_port_0" [style=solid, label="[1, 16, 8]"]; +"4 MVN_74" -> "7 MVN_74/fq_output_0" [style=solid, label="[1, 16, 8]"]; +"5 Multiply_20" -> "8 Multiply_20/fq_output_0" [style=solid, label="[1, 16, 8]"]; +"7 MVN_74/fq_output_0" -> "9 /mlp/fc1/MatMul" [style=solid, label="[1, 16, 8]"]; +"8 Multiply_20/fq_output_0" -> "10 /Reshape_3" [style=solid, label="[1, 16, 8]"]; +"9 /mlp/fc1/MatMul" -> "11 /mlp/fc1/Add" [style=solid, label="[1, 16, 32]"]; +"10 /Reshape_3" -> "12 /attn/qkv/MatMul" [style=solid, label="[1, 16, 8]"]; +"11 /mlp/fc1/Add" -> "13 /mlp/act/Mul_1" [style=solid, label="[1, 16, 32]"]; +"12 /attn/qkv/MatMul" -> "14 /attn/qkv/Add" [style=solid, label="[1, 16, 24]"]; +"13 /mlp/act/Mul_1" -> "15 /mlp/act/Mul_1/fq_output_0" [style=solid, label="[1, 16, 32]"]; +"14 /attn/qkv/Add" -> "16 /attn/Reshape" [style=solid, label="[1, 16, 24]"]; +"15 /mlp/act/Mul_1/fq_output_0" -> "17 /mlp/fc2/MatMul" [style=solid, label="[1, 16, 32]"]; +"16 /attn/Reshape" -> "18 /attn/Transpose" [style=solid, label="[1, 16, 3, 2, 4]"]; +"17 /mlp/fc2/MatMul" -> "19 /mlp/fc2/Add" [style=solid, label="[1, 16, 8]"]; +"18 /attn/Transpose" -> "20 /attn/Gather" [style=solid, label="[3, 1, 2, 16, 4]"]; +"18 /attn/Transpose" -> "21 /attn/Gather_1/fq_input_0" [style=solid, label="[3, 1, 2, 16, 4]"]; +"18 /attn/Transpose" -> "22 /attn/Gather_2" [style=solid, label="[3, 1, 2, 16, 4]"]; +"19 /mlp/fc2/Add" -> "3 161" [style=solid, label="[1, 16, 8]"]; +"20 /attn/Gather" -> "23 /attn/Mul" [style=solid, label="[1, 2, 16, 4]"]; +"21 /attn/Gather_1/fq_input_0" -> "24 /attn/Gather_1" [style=solid, label="[3, 1, 2, 16, 4]"]; +"22 /attn/Gather_2" -> "25 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; +"23 /attn/Mul" -> "26 /attn/Mul/fq_output_0" [style=solid, label="[1, 2, 16, 4]"]; +"24 /attn/Gather_1" -> "25 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; +"25 /attn/MatMul_1" -> "27 /attn/MatMul_1/fq_output_0" [style=solid, label="[1, 2, 16, 4]"]; +"26 /attn/Mul/fq_output_0" -> "25 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; +"27 /attn/MatMul_1/fq_output_0" -> "28 /attn/Transpose_2" [style=solid, label="[1, 2, 16, 4]"]; +"28 /attn/Transpose_2" -> "29 /attn/Reshape_1" [style=solid, label="[1, 16, 2, 4]"]; +"29 /attn/Reshape_1" -> "30 /attn/proj/MatMul" [style=solid, label="[1, 16, 8]"]; +"30 /attn/proj/MatMul" -> "31 /attn/proj/Add" [style=solid, label="[1, 16, 8]"]; +"31 /attn/proj/Add" -> "1 /Add" [style=solid, label="[1, 16, 8]"]; +"32 /mlp/fc2/MatMul/fq_weights_1" -> "17 /mlp/fc2/MatMul" [style=solid, label="[8, 32]"]; +"33 /mlp/fc2/MatMul/fq_weights_1/output_high" -> "32 /mlp/fc2/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"34 /mlp/fc2/MatMul/fq_weights_1/output_low" -> "32 /mlp/fc2/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"35 /mlp/fc2/MatMul/fq_weights_1/input_high" -> "32 /mlp/fc2/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"36 /mlp/fc2/MatMul/fq_weights_1/input_low" -> "32 /mlp/fc2/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"37 Transpose_1952" -> "32 /mlp/fc2/MatMul/fq_weights_1" [style=solid, label="[8, 32]"]; +"38 /mlp/act/Mul_1/fq_output_0/output_high" -> "15 /mlp/act/Mul_1/fq_output_0" [style=solid, label="[]"]; +"39 /mlp/act/Mul_1/fq_output_0/output_low" -> "15 /mlp/act/Mul_1/fq_output_0" [style=solid, label="[]"]; +"40 /mlp/act/Mul_1/fq_output_0/input_high" -> "15 /mlp/act/Mul_1/fq_output_0" [style=solid, label="[]"]; +"41 /mlp/act/Mul_1/fq_output_0/input_low" -> "15 /mlp/act/Mul_1/fq_output_0" [style=solid, label="[]"]; +"42 /mlp/fc1/MatMul/fq_weights_1" -> "9 /mlp/fc1/MatMul" [style=solid, label="[32, 8]"]; +"43 /mlp/fc1/MatMul/fq_weights_1/output_high" -> "42 /mlp/fc1/MatMul/fq_weights_1" [style=solid, label="[32, 1]"]; +"44 /mlp/fc1/MatMul/fq_weights_1/output_low" -> "42 /mlp/fc1/MatMul/fq_weights_1" [style=solid, label="[32, 1]"]; +"45 /mlp/fc1/MatMul/fq_weights_1/input_high" -> "42 /mlp/fc1/MatMul/fq_weights_1" [style=solid, label="[32, 1]"]; +"46 /mlp/fc1/MatMul/fq_weights_1/input_low" -> "42 /mlp/fc1/MatMul/fq_weights_1" [style=solid, label="[32, 1]"]; +"47 Transpose_1945" -> "42 /mlp/fc1/MatMul/fq_weights_1" [style=solid, label="[32, 8]"]; +"48 MVN_74/fq_output_0/output_high" -> "7 MVN_74/fq_output_0" [style=solid, label="[]"]; +"49 MVN_74/fq_output_0/output_low" -> "7 MVN_74/fq_output_0" [style=solid, label="[]"]; +"50 MVN_74/fq_output_0/input_high" -> "7 MVN_74/fq_output_0" [style=solid, label="[]"]; +"51 MVN_74/fq_output_0/input_low" -> "7 MVN_74/fq_output_0" [style=solid, label="[]"]; +"52 Range_73" -> "4 MVN_74" [style=dashed, label="[1]"]; +"53 /attn/proj/MatMul/fq_weights_1" -> "30 /attn/proj/MatMul" [style=solid, label="[8, 8]"]; +"54 /attn/proj/MatMul/fq_weights_1/output_high" -> "53 /attn/proj/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"55 /attn/proj/MatMul/fq_weights_1/output_low" -> "53 /attn/proj/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"56 /attn/proj/MatMul/fq_weights_1/input_high" -> "53 /attn/proj/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"57 /attn/proj/MatMul/fq_weights_1/input_low" -> "53 /attn/proj/MatMul/fq_weights_1" [style=solid, label="[8, 1]"]; +"58 Transpose_1934" -> "53 /attn/proj/MatMul/fq_weights_1" [style=solid, label="[8, 8]"]; +"59 /attn/Constant_2" -> "29 /attn/Reshape_1" [style=dashed, label="[3]"]; +"60 Constant_53" -> "28 /attn/Transpose_2" [style=dashed, label="[4]"]; +"61 /attn/MatMul_1/fq_output_0/output_high" -> "27 /attn/MatMul_1/fq_output_0" [style=solid, label="[]"]; +"62 /attn/MatMul_1/fq_output_0/output_low" -> "27 /attn/MatMul_1/fq_output_0" [style=solid, label="[]"]; +"63 /attn/MatMul_1/fq_output_0/input_high" -> "27 /attn/MatMul_1/fq_output_0" [style=solid, label="[]"]; +"64 /attn/MatMul_1/fq_output_0/input_low" -> "27 /attn/MatMul_1/fq_output_0" [style=solid, label="[]"]; +"65 Constant_1931" -> "25 /attn/MatMul_1" [style=solid, label="[]"]; +"66 onnx^^Add_194" -> "25 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 16]"]; +"67 Constant_43" -> "22 /attn/Gather_2" [style=dashed, label="[]"]; +"68 /Constant_1" -> "22 /attn/Gather_2" [style=dashed, label="[]"]; +"69 Constant_37" -> "18 /attn/Transpose" [style=dashed, label="[5]"]; +"70 /attn/Constant" -> "16 /attn/Reshape" [style=dashed, label="[5]"]; +"71 /attn/qkv/MatMul/fq_weights_1" -> "12 /attn/qkv/MatMul" [style=solid, label="[24, 8]"]; +"72 /attn/qkv/MatMul/fq_weights_1/output_high" -> "71 /attn/qkv/MatMul/fq_weights_1" [style=solid, label="[24, 1]"]; +"73 /attn/qkv/MatMul/fq_weights_1/output_low" -> "71 /attn/qkv/MatMul/fq_weights_1" [style=solid, label="[24, 1]"]; +"74 /attn/qkv/MatMul/fq_weights_1/input_high" -> "71 /attn/qkv/MatMul/fq_weights_1" [style=solid, label="[24, 1]"]; +"75 /attn/qkv/MatMul/fq_weights_1/input_low" -> "71 /attn/qkv/MatMul/fq_weights_1" [style=solid, label="[24, 1]"]; +"76 Transpose_1919" -> "71 /attn/qkv/MatMul/fq_weights_1" [style=solid, label="[24, 8]"]; +"77 Constant_2004" -> "10 /Reshape_3" [style=dashed, label="[3]"]; +"78 Multiply_20/fq_output_0/output_high" -> "8 Multiply_20/fq_output_0" [style=solid, label="[]"]; +"79 Multiply_20/fq_output_0/output_low" -> "8 Multiply_20/fq_output_0" [style=solid, label="[]"]; +"80 Multiply_20/fq_output_0/input_high" -> "8 Multiply_20/fq_output_0" [style=solid, label="[]"]; +"81 Multiply_20/fq_output_0/input_low" -> "8 Multiply_20/fq_output_0" [style=solid, label="[]"]; +"82 Constant_1983" -> "5 Multiply_20" [style=solid, label="[1, 1, 8]"]; +"83 Range_18" -> "2 MVN_19" [style=dashed, label="[1]"]; +"84 Constant_1984" -> "14 /attn/qkv/Add" [style=solid, label="[1, 1, 24]"]; +"85 Constant_41" -> "24 /attn/Gather_1" [style=dashed, label="[]"]; +"86 /Constant_3" -> "24 /attn/Gather_1" [style=dashed, label="[]"]; +"87 /attn/Gather_1/fq_input_0/output_high" -> "21 /attn/Gather_1/fq_input_0" [style=solid, label="[]"]; +"88 /attn/Gather_1/fq_input_0/output_low" -> "21 /attn/Gather_1/fq_input_0" [style=solid, label="[]"]; +"89 /attn/Gather_1/fq_input_0/input_high" -> "21 /attn/Gather_1/fq_input_0" [style=solid, label="[]"]; +"90 /attn/Gather_1/fq_input_0/input_low" -> "21 /attn/Gather_1/fq_input_0" [style=solid, label="[]"]; +"91 /attn/Mul/fq_output_0/output_high" -> "26 /attn/Mul/fq_output_0" [style=solid, label="[]"]; +"92 /attn/Mul/fq_output_0/output_low" -> "26 /attn/Mul/fq_output_0" [style=solid, label="[]"]; +"93 /attn/Mul/fq_output_0/input_high" -> "26 /attn/Mul/fq_output_0" [style=solid, label="[]"]; +"94 /attn/Mul/fq_output_0/input_low" -> "26 /attn/Mul/fq_output_0" [style=solid, label="[]"]; +"95 Constant_1985" -> "23 /attn/Mul" [style=solid, label="[1, 1, 1, 1]"]; +"96 Constant_39" -> "20 /attn/Gather" [style=dashed, label="[]"]; +"97 /Constant" -> "20 /attn/Gather" [style=dashed, label="[]"]; +"98 Constant_1986" -> "31 /attn/proj/Add" [style=solid, label="[1, 1, 8]"]; +"99 Constant_1987" -> "11 /mlp/fc1/Add" [style=solid, label="[1, 1, 32]"]; +"100 Constant_1988" -> "19 /mlp/fc2/Add" [style=solid, label="[1, 1, 8]"]; } diff --git a/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_sq.dot b/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_sq.dot index 17edf422a64..c757d09045f 100644 --- a/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_sq.dot +++ b/tests/openvino/native/data/2025.1/reference_graphs/quantized/swin-block_sq.dot @@ -12,61 +12,54 @@ strict digraph { "10 /Reshape_3_0_0/nncf_smooth_quant" [id=10, type=Multiply]; "11 /mlp/fc1/Add" [id=11, type=Add]; "12 /attn/qkv/MatMul" [id=12, type=MatMul]; -"13 /mlp/act/Div" [id=13, type=Multiply]; -"14 /mlp/act/Mul" [id=14, type=Multiply]; -"15 /attn/qkv/Add" [id=15, type=Add]; -"16 /mlp/act/Erf" [id=16, type=Erf]; -"17 /mlp/act/Mul_1" [id=17, type=Multiply]; -"18 /attn/Reshape" [id=18, type=Reshape]; -"19 /mlp/act/Add" [id=19, type=Add]; -"20 /mlp/act/Mul_1_0_0/nncf_smooth_quant" [id=20, type=Multiply]; -"21 /attn/Transpose" [id=21, type=Transpose]; -"22 /mlp/fc2/MatMul" [id=22, type=MatMul]; -"23 /attn/Gather" [id=23, type=Gather]; -"24 /attn/Gather_1" [id=24, type=Gather]; -"25 /attn/Gather_2" [id=25, type=Gather]; -"26 /mlp/fc2/Add" [id=26, type=Add]; -"27 /attn/Mul" [id=27, type=Multiply]; -"28 /attn/MatMul_1" [id=28, type=ScaledDotProductAttention]; -"29 /attn/Transpose_2" [id=29, type=Transpose]; -"30 /attn/Reshape_1" [id=30, type=Reshape]; -"31 /attn/Reshape_1_0_0/nncf_smooth_quant" [id=31, type=Multiply]; -"32 /attn/proj/MatMul" [id=32, type=MatMul]; -"33 /attn/proj/Add" [id=33, type=Add]; -"34 Transpose_1888" [id=34, type=Constant]; -"35 /mlp/act/Mul_1_0_0/nncf_smooth_quant/scale" [id=35, type=Constant]; -"36 Constant_1926" [id=36, type=Constant]; -"37 Constant_1925" [id=37, type=Constant]; -"38 Constant_1924" [id=38, type=Constant]; -"39 Transpose_1873" [id=39, type=Constant]; -"40 MVN_74_0_0/nncf_smooth_quant/scale" [id=40, type=Constant]; -"41 Range_73" [id=41, type=Constant]; -"42 Transpose_1862" [id=42, type=Constant]; -"43 /attn/Reshape_1_0_0/nncf_smooth_quant/scale" [id=43, type=Constant]; -"44 /attn/Constant_2" [id=44, type=Constant]; -"45 Constant_53" [id=45, type=Constant]; -"46 Constant_1859" [id=46, type=Constant]; -"47 onnx^^Add_194" [id=47, type=Constant, label="47 onnx::Add_194"]; -"48 Constant_43" [id=48, type=Constant]; -"49 /Constant_1" [id=49, type=Constant]; -"50 Constant_37" [id=50, type=Constant]; -"51 /attn/Constant" [id=51, type=Constant]; -"52 Transpose_1847" [id=52, type=Constant]; -"53 /Reshape_3_0_0/nncf_smooth_quant/scale" [id=53, type=Constant]; -"54 Constant_1943" [id=54, type=Constant]; -"55 Constant_1919" [id=55, type=Constant]; -"56 Range_18" [id=56, type=Constant]; -"57 Constant_1920" [id=57, type=Constant]; -"58 Constant_41" [id=58, type=Constant]; -"59 /Constant_3" [id=59, type=Constant]; -"60 Constant_1921" [id=60, type=Constant]; -"61 Constant_39" [id=61, type=Constant]; -"62 /Constant" [id=62, type=Constant]; -"63 Constant_1922" [id=63, type=Constant]; -"64 Constant_1923" [id=64, type=Constant]; -"65 Constant_1927" [id=65, type=Constant]; -"0 input.1" -> "2 MVN_19" [style=solid, label="[1, 16, 8]"]; +"13 /mlp/act/Mul_1" [id=13, type=Gelu]; +"14 /attn/qkv/Add" [id=14, type=Add]; +"15 /mlp/act/Mul_1_0_0/nncf_smooth_quant" [id=15, type=Multiply]; +"16 /attn/Reshape" [id=16, type=Reshape]; +"17 /mlp/fc2/MatMul" [id=17, type=MatMul]; +"18 /attn/Transpose" [id=18, type=Transpose]; +"19 /mlp/fc2/Add" [id=19, type=Add]; +"20 /attn/Gather" [id=20, type=Gather]; +"21 /attn/Gather_1" [id=21, type=Gather]; +"22 /attn/Gather_2" [id=22, type=Gather]; +"23 /attn/Mul" [id=23, type=Multiply]; +"24 /attn/MatMul_1" [id=24, type=ScaledDotProductAttention]; +"25 /attn/Transpose_2" [id=25, type=Transpose]; +"26 /attn/Reshape_1" [id=26, type=Reshape]; +"27 /attn/Reshape_1_0_0/nncf_smooth_quant" [id=27, type=Multiply]; +"28 /attn/proj/MatMul" [id=28, type=MatMul]; +"29 /attn/proj/Add" [id=29, type=Add]; +"30 Transpose_1952" [id=30, type=Constant]; +"31 /mlp/act/Mul_1_0_0/nncf_smooth_quant/scale" [id=31, type=Constant]; +"32 Transpose_1945" [id=32, type=Constant]; +"33 MVN_74_0_0/nncf_smooth_quant/scale" [id=33, type=Constant]; +"34 Range_73" [id=34, type=Constant]; +"35 Transpose_1934" [id=35, type=Constant]; +"36 /attn/Reshape_1_0_0/nncf_smooth_quant/scale" [id=36, type=Constant]; +"37 /attn/Constant_2" [id=37, type=Constant]; +"38 Constant_53" [id=38, type=Constant]; +"39 Constant_1931" [id=39, type=Constant]; +"40 onnx^^Add_194" [id=40, type=Constant, label="40 onnx::Add_194"]; +"41 Constant_43" [id=41, type=Constant]; +"42 /Constant_1" [id=42, type=Constant]; +"43 Constant_37" [id=43, type=Constant]; +"44 /attn/Constant" [id=44, type=Constant]; +"45 Transpose_1919" [id=45, type=Constant]; +"46 /Reshape_3_0_0/nncf_smooth_quant/scale" [id=46, type=Constant]; +"47 Constant_2004" [id=47, type=Constant]; +"48 Constant_1983" [id=48, type=Constant]; +"49 Range_18" [id=49, type=Constant]; +"50 Constant_1984" [id=50, type=Constant]; +"51 Constant_41" [id=51, type=Constant]; +"52 /Constant_3" [id=52, type=Constant]; +"53 Constant_1985" [id=53, type=Constant]; +"54 Constant_39" [id=54, type=Constant]; +"55 /Constant" [id=55, type=Constant]; +"56 Constant_1986" [id=56, type=Constant]; +"57 Constant_1987" [id=57, type=Constant]; +"58 Constant_1988" [id=58, type=Constant]; "0 input.1" -> "1 /Add" [style=solid, label="[1, 16, 8]"]; +"0 input.1" -> "2 MVN_19" [style=solid, label="[1, 16, 8]"]; "1 /Add" -> "3 161" [style=solid, label="[1, 16, 8]"]; "1 /Add" -> "4 MVN_74" [style=solid, label="[1, 16, 8]"]; "2 MVN_19" -> "5 Multiply_20" [style=solid, label="[1, 16, 8]"]; @@ -77,62 +70,54 @@ strict digraph { "8 /Reshape_3" -> "10 /Reshape_3_0_0/nncf_smooth_quant" [style=solid, label="[1, 16, 8]"]; "9 /mlp/fc1/MatMul" -> "11 /mlp/fc1/Add" [style=solid, label="[1, 16, 32]"]; "10 /Reshape_3_0_0/nncf_smooth_quant" -> "12 /attn/qkv/MatMul" [style=solid, label="[1, 16, 8]"]; -"11 /mlp/fc1/Add" -> "14 /mlp/act/Mul" [style=solid, label="[1, 16, 32]"]; -"11 /mlp/fc1/Add" -> "13 /mlp/act/Div" [style=solid, label="[1, 16, 32]"]; -"12 /attn/qkv/MatMul" -> "15 /attn/qkv/Add" [style=solid, label="[1, 16, 24]"]; -"13 /mlp/act/Div" -> "16 /mlp/act/Erf" [style=solid, label="[1, 16, 32]"]; -"14 /mlp/act/Mul" -> "17 /mlp/act/Mul_1" [style=solid, label="[1, 16, 32]"]; -"15 /attn/qkv/Add" -> "18 /attn/Reshape" [style=solid, label="[1, 16, 24]"]; -"16 /mlp/act/Erf" -> "19 /mlp/act/Add" [style=solid, label="[1, 16, 32]"]; -"17 /mlp/act/Mul_1" -> "20 /mlp/act/Mul_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 16, 32]"]; -"18 /attn/Reshape" -> "21 /attn/Transpose" [style=solid, label="[1, 16, 3, 2, 4]"]; -"19 /mlp/act/Add" -> "14 /mlp/act/Mul" [style=solid, label="[1, 16, 32]"]; -"20 /mlp/act/Mul_1_0_0/nncf_smooth_quant" -> "22 /mlp/fc2/MatMul" [style=solid, label="[1, 16, 32]"]; -"21 /attn/Transpose" -> "23 /attn/Gather" [style=solid, label="[3, 1, 2, 16, 4]"]; -"21 /attn/Transpose" -> "24 /attn/Gather_1" [style=solid, label="[3, 1, 2, 16, 4]"]; -"21 /attn/Transpose" -> "25 /attn/Gather_2" [style=solid, label="[3, 1, 2, 16, 4]"]; -"22 /mlp/fc2/MatMul" -> "26 /mlp/fc2/Add" [style=solid, label="[1, 16, 8]"]; -"23 /attn/Gather" -> "27 /attn/Mul" [style=solid, label="[1, 2, 16, 4]"]; -"24 /attn/Gather_1" -> "28 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; -"25 /attn/Gather_2" -> "28 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; -"26 /mlp/fc2/Add" -> "3 161" [style=solid, label="[1, 16, 8]"]; -"27 /attn/Mul" -> "28 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; -"28 /attn/MatMul_1" -> "29 /attn/Transpose_2" [style=solid, label="[1, 2, 16, 4]"]; -"29 /attn/Transpose_2" -> "30 /attn/Reshape_1" [style=solid, label="[1, 16, 2, 4]"]; -"30 /attn/Reshape_1" -> "31 /attn/Reshape_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 16, 8]"]; -"31 /attn/Reshape_1_0_0/nncf_smooth_quant" -> "32 /attn/proj/MatMul" [style=solid, label="[1, 16, 8]"]; -"32 /attn/proj/MatMul" -> "33 /attn/proj/Add" [style=solid, label="[1, 16, 8]"]; -"33 /attn/proj/Add" -> "1 /Add" [style=solid, label="[1, 16, 8]"]; -"34 Transpose_1888" -> "22 /mlp/fc2/MatMul" [style=solid, label="[8, 32]"]; -"35 /mlp/act/Mul_1_0_0/nncf_smooth_quant/scale" -> "20 /mlp/act/Mul_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 32]"]; -"36 Constant_1926" -> "17 /mlp/act/Mul_1" [style=solid, label="[1, 1, 1]"]; -"37 Constant_1925" -> "19 /mlp/act/Add" [style=solid, label="[1, 1, 1]"]; -"38 Constant_1924" -> "13 /mlp/act/Div" [style=solid, label="[1, 1, 1]"]; -"39 Transpose_1873" -> "9 /mlp/fc1/MatMul" [style=solid, label="[32, 8]"]; -"40 MVN_74_0_0/nncf_smooth_quant/scale" -> "7 MVN_74_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 8]"]; -"41 Range_73" -> "4 MVN_74" [style=dashed, label="[1]"]; -"42 Transpose_1862" -> "32 /attn/proj/MatMul" [style=solid, label="[8, 8]"]; -"43 /attn/Reshape_1_0_0/nncf_smooth_quant/scale" -> "31 /attn/Reshape_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 8]"]; -"44 /attn/Constant_2" -> "30 /attn/Reshape_1" [style=dashed, label="[3]"]; -"45 Constant_53" -> "29 /attn/Transpose_2" [style=dashed, label="[4]"]; -"46 Constant_1859" -> "28 /attn/MatMul_1" [style=solid, label="[]"]; -"47 onnx^^Add_194" -> "28 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 16]"]; -"48 Constant_43" -> "25 /attn/Gather_2" [style=dashed, label="[]"]; -"49 /Constant_1" -> "25 /attn/Gather_2" [style=dashed, label="[]"]; -"50 Constant_37" -> "21 /attn/Transpose" [style=dashed, label="[5]"]; -"51 /attn/Constant" -> "18 /attn/Reshape" [style=dashed, label="[5]"]; -"52 Transpose_1847" -> "12 /attn/qkv/MatMul" [style=solid, label="[24, 8]"]; -"53 /Reshape_3_0_0/nncf_smooth_quant/scale" -> "10 /Reshape_3_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 8]"]; -"54 Constant_1943" -> "8 /Reshape_3" [style=dashed, label="[3]"]; -"55 Constant_1919" -> "5 Multiply_20" [style=solid, label="[1, 1, 8]"]; -"56 Range_18" -> "2 MVN_19" [style=dashed, label="[1]"]; -"57 Constant_1920" -> "15 /attn/qkv/Add" [style=solid, label="[1, 1, 24]"]; -"58 Constant_41" -> "24 /attn/Gather_1" [style=dashed, label="[]"]; -"59 /Constant_3" -> "24 /attn/Gather_1" [style=dashed, label="[]"]; -"60 Constant_1921" -> "27 /attn/Mul" [style=solid, label="[1, 1, 1, 1]"]; -"61 Constant_39" -> "23 /attn/Gather" [style=dashed, label="[]"]; -"62 /Constant" -> "23 /attn/Gather" [style=dashed, label="[]"]; -"63 Constant_1922" -> "33 /attn/proj/Add" [style=solid, label="[1, 1, 8]"]; -"64 Constant_1923" -> "11 /mlp/fc1/Add" [style=solid, label="[1, 1, 32]"]; -"65 Constant_1927" -> "26 /mlp/fc2/Add" [style=solid, label="[1, 1, 8]"]; +"11 /mlp/fc1/Add" -> "13 /mlp/act/Mul_1" [style=solid, label="[1, 16, 32]"]; +"12 /attn/qkv/MatMul" -> "14 /attn/qkv/Add" [style=solid, label="[1, 16, 24]"]; +"13 /mlp/act/Mul_1" -> "15 /mlp/act/Mul_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 16, 32]"]; +"14 /attn/qkv/Add" -> "16 /attn/Reshape" [style=solid, label="[1, 16, 24]"]; +"15 /mlp/act/Mul_1_0_0/nncf_smooth_quant" -> "17 /mlp/fc2/MatMul" [style=solid, label="[1, 16, 32]"]; +"16 /attn/Reshape" -> "18 /attn/Transpose" [style=solid, label="[1, 16, 3, 2, 4]"]; +"17 /mlp/fc2/MatMul" -> "19 /mlp/fc2/Add" [style=solid, label="[1, 16, 8]"]; +"18 /attn/Transpose" -> "20 /attn/Gather" [style=solid, label="[3, 1, 2, 16, 4]"]; +"18 /attn/Transpose" -> "21 /attn/Gather_1" [style=solid, label="[3, 1, 2, 16, 4]"]; +"18 /attn/Transpose" -> "22 /attn/Gather_2" [style=solid, label="[3, 1, 2, 16, 4]"]; +"19 /mlp/fc2/Add" -> "3 161" [style=solid, label="[1, 16, 8]"]; +"20 /attn/Gather" -> "23 /attn/Mul" [style=solid, label="[1, 2, 16, 4]"]; +"21 /attn/Gather_1" -> "24 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; +"22 /attn/Gather_2" -> "24 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; +"23 /attn/Mul" -> "24 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 4]"]; +"24 /attn/MatMul_1" -> "25 /attn/Transpose_2" [style=solid, label="[1, 2, 16, 4]"]; +"25 /attn/Transpose_2" -> "26 /attn/Reshape_1" [style=solid, label="[1, 16, 2, 4]"]; +"26 /attn/Reshape_1" -> "27 /attn/Reshape_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 16, 8]"]; +"27 /attn/Reshape_1_0_0/nncf_smooth_quant" -> "28 /attn/proj/MatMul" [style=solid, label="[1, 16, 8]"]; +"28 /attn/proj/MatMul" -> "29 /attn/proj/Add" [style=solid, label="[1, 16, 8]"]; +"29 /attn/proj/Add" -> "1 /Add" [style=solid, label="[1, 16, 8]"]; +"30 Transpose_1952" -> "17 /mlp/fc2/MatMul" [style=solid, label="[8, 32]"]; +"31 /mlp/act/Mul_1_0_0/nncf_smooth_quant/scale" -> "15 /mlp/act/Mul_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 32]"]; +"32 Transpose_1945" -> "9 /mlp/fc1/MatMul" [style=solid, label="[32, 8]"]; +"33 MVN_74_0_0/nncf_smooth_quant/scale" -> "7 MVN_74_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 8]"]; +"34 Range_73" -> "4 MVN_74" [style=dashed, label="[1]"]; +"35 Transpose_1934" -> "28 /attn/proj/MatMul" [style=solid, label="[8, 8]"]; +"36 /attn/Reshape_1_0_0/nncf_smooth_quant/scale" -> "27 /attn/Reshape_1_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 8]"]; +"37 /attn/Constant_2" -> "26 /attn/Reshape_1" [style=dashed, label="[3]"]; +"38 Constant_53" -> "25 /attn/Transpose_2" [style=dashed, label="[4]"]; +"39 Constant_1931" -> "24 /attn/MatMul_1" [style=solid, label="[]"]; +"40 onnx^^Add_194" -> "24 /attn/MatMul_1" [style=solid, label="[1, 2, 16, 16]"]; +"41 Constant_43" -> "22 /attn/Gather_2" [style=dashed, label="[]"]; +"42 /Constant_1" -> "22 /attn/Gather_2" [style=dashed, label="[]"]; +"43 Constant_37" -> "18 /attn/Transpose" [style=dashed, label="[5]"]; +"44 /attn/Constant" -> "16 /attn/Reshape" [style=dashed, label="[5]"]; +"45 Transpose_1919" -> "12 /attn/qkv/MatMul" [style=solid, label="[24, 8]"]; +"46 /Reshape_3_0_0/nncf_smooth_quant/scale" -> "10 /Reshape_3_0_0/nncf_smooth_quant" [style=solid, label="[1, 1, 8]"]; +"47 Constant_2004" -> "8 /Reshape_3" [style=dashed, label="[3]"]; +"48 Constant_1983" -> "5 Multiply_20" [style=solid, label="[1, 1, 8]"]; +"49 Range_18" -> "2 MVN_19" [style=dashed, label="[1]"]; +"50 Constant_1984" -> "14 /attn/qkv/Add" [style=solid, label="[1, 1, 24]"]; +"51 Constant_41" -> "21 /attn/Gather_1" [style=dashed, label="[]"]; +"52 /Constant_3" -> "21 /attn/Gather_1" [style=dashed, label="[]"]; +"53 Constant_1985" -> "23 /attn/Mul" [style=solid, label="[1, 1, 1, 1]"]; +"54 Constant_39" -> "20 /attn/Gather" [style=dashed, label="[]"]; +"55 /Constant" -> "20 /attn/Gather" [style=dashed, label="[]"]; +"56 Constant_1986" -> "29 /attn/proj/Add" [style=solid, label="[1, 1, 8]"]; +"57 Constant_1987" -> "11 /mlp/fc1/Add" [style=solid, label="[1, 1, 32]"]; +"58 Constant_1988" -> "19 /mlp/fc2/Add" [style=solid, label="[1, 1, 8]"]; }