From 224014268e4da3c3dcfcb8f6ce03b0f9be386a4a Mon Sep 17 00:00:00 2001
From: heliqi <heliqi@baidu.com>
Date: Mon, 6 Dec 2021 20:36:01 +0800
Subject: [PATCH] add test_unsqueeze2_eltwise_fuse_pass (#37647)

* add test_unsqueeze2_eltwise_fuse_pass

* fix name conflict

* rebuild CI
---
 paddle/fluid/framework/ir/CMakeLists.txt      |   2 +-
 .../test_unsqueeze2_eltwise_fuse_pass.py      | 103 ++++++++++++++++++
 tools/parallel_UT_rule.py                     |   6 +-
 3 files changed, 107 insertions(+), 4 deletions(-)
 create mode 100644 python/paddle/fluid/tests/unittests/ir/inference/test_unsqueeze2_eltwise_fuse_pass.py

diff --git a/paddle/fluid/framework/ir/CMakeLists.txt b/paddle/fluid/framework/ir/CMakeLists.txt
index e384cb46337..b98a2288682 100644
--- a/paddle/fluid/framework/ir/CMakeLists.txt
+++ b/paddle/fluid/framework/ir/CMakeLists.txt
@@ -161,7 +161,7 @@ cc_test(test_skip_layernorm_fuse_pass SRCS skip_layernorm_fuse_pass_tester.cc DE
 cc_test(test_multihead_matmul_fuse_pass SRCS multihead_matmul_fuse_pass_tester.cc DEPS multihead_matmul_fuse_pass)
 cc_test(test_conv_bn_fuse_pass_cc SRCS conv_bn_fuse_pass_tester.cc DEPS conv_bn_fuse_pass)
 cc_test(test_adaptive_pool2d_convert_global_pass SRCS adaptive_pool2d_convert_global_pass_tester.cc DEPS adaptive_pool2d_convert_global_pass)
-cc_test(test_unsqueeze2_eltwise_fuse_pass SRCS unsqueeze2_eltwise_fuse_pass_tester.cc DEPS unsqueeze2_eltwise_fuse_pass)
+cc_test(test_unsqueeze2_eltwise_fuse_pass_cc SRCS unsqueeze2_eltwise_fuse_pass_tester.cc DEPS unsqueeze2_eltwise_fuse_pass)
 cc_test(test_layer_norm_fuse_pass_cc SRCS layer_norm_fuse_pass_tester.cc DEPS layer_norm_fuse_pass pass_test_util naive_executor)
 cc_test(test_generate_pass_cc SRCS generate_pass_tester.cc DEPS generate_pass pass_desc_proto)
 if(WITH_GPU OR WITH_ROCM)
diff --git a/python/paddle/fluid/tests/unittests/ir/inference/test_unsqueeze2_eltwise_fuse_pass.py b/python/paddle/fluid/tests/unittests/ir/inference/test_unsqueeze2_eltwise_fuse_pass.py
new file mode 100644
index 00000000000..81acd9856cf
--- /dev/null
+++ b/python/paddle/fluid/tests/unittests/ir/inference/test_unsqueeze2_eltwise_fuse_pass.py
@@ -0,0 +1,103 @@
+# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from auto_scan_test import PassAutoScanTest, SkipReasons
+from program_config import TensorConfig, ProgramConfig, OpConfig
+import numpy as np
+import paddle.inference as paddle_infer
+from functools import partial
+from typing import Optional, List, Callable, Dict, Any, Set
+import unittest
+
+import hypothesis
+from hypothesis import given, settings, seed, example, assume, reproduce_failure
+import hypothesis.strategies as st
+
+
+class TestUnsqueezeEltwiseFusePass(PassAutoScanTest):
+    r"""Auto-scan test for unsqueeze2_eltwise_fuse_pass on the graph below.
+
+        y_var
+          |
+       unsqueeze2
+          \
+    unsqueeze2_out_var    x_var
+             \           /
+            elementwise_mul
+    """
+
+    def sample_predictor_configs(self, program_config):
+        """Yield (TRT FP32 config, op-name list, (1e-5, 1e-5))."""
+        # NOTE(review): presumably ops expected after the pass and tolerances.
+        config = self.create_trt_inference_config()
+        config.enable_tensorrt_engine(
+            max_batch_size=10,
+            workspace_size=102400,
+            min_subgraph_size=0,
+            precision_mode=paddle_infer.PrecisionType.Float32,
+            use_static=False,
+            use_calib_mode=False)
+        yield config, ['elementwise_mul', ], (1e-5, 1e-5)
+
+    def sample_program_config(self, draw):
+        """Build unsqueeze2 -> elementwise_mul from a drawn 4-D x shape."""
+        # 1. Draw x's shape (4 dims, each in [1, 10]) and fix mul's axis attr.
+        x_shape = draw(
+            st.lists(
+                st.integers(
+                    min_value=1, max_value=10), min_size=4, max_size=4))
+        axis = -1
+
+        # 2. Y of mul: x's first two dims, unsqueezed at axes [2, 3].
+        y_shape = x_shape[:2]
+        unsqueeze2_axes = [2, 3]
+
+        unsqueeze2_op = OpConfig(
+            "unsqueeze2",
+            inputs={
+                "X": ["unsqueeze2_x"],
+                "AxesTensor": [],
+                "AxesTensorList": []
+            },
+            axes=unsqueeze2_axes,
+            outputs={"Out": ["unsqueeze2_out"],
+                     "XShape": ["xshape"]}, )
+        mul_op = OpConfig(
+            "elementwise_mul",
+            inputs={"Y": ["unsqueeze2_out"],
+                    "X": ["mul_x"]},
+            axis=axis,
+            outputs={"Out": ["mul_out"]}, )
+
+        ops = [unsqueeze2_op, mul_op]
+
+        return ProgramConfig(
+            ops=ops,
+            weights={},
+            inputs={
+                "mul_x": TensorConfig(shape=x_shape),
+                "unsqueeze2_x": TensorConfig(shape=y_shape),
+            },
+            outputs=ops[-1].outputs["Out"], )
+
+    def test(self):
+        """Run the auto scan (max 300 examples, quant off) for the fuse pass."""
+        self.run_and_statis(
+            quant=False,
+            max_examples=300,
+            passes=["unsqueeze2_eltwise_fuse_pass"])
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tools/parallel_UT_rule.py b/tools/parallel_UT_rule.py
index b38a305c1b8..0d106102aa2 100644
--- a/tools/parallel_UT_rule.py
+++ b/tools/parallel_UT_rule.py
@@ -136,7 +136,7 @@ HIGH_PARALLEL_JOB_NEW = [
     'test_conv_concat_relu_mkldnn_fuse_pass',
     'test_bf16_utils',
     'test_sum_bf16_mkldnn_op',
-    'test_unsqueeze2_eltwise_fuse_pass',
+    'test_unsqueeze2_eltwise_fuse_pass_cc',
     'dense_table_test',
     'test_collective_optimizer',
     'test_origin_info',
@@ -1715,7 +1715,7 @@ CPU_PARALLEL_JOB = [
     'test_recv_save_op',
     'heter_listen_and_server_test',
     'test_analyzer_capi_ner',
-    'test_unsqueeze2_eltwise_fuse_pass',
+    'test_unsqueeze2_eltwise_fuse_pass_cc',
     'test_dgc_optimizer',
     'test_fleet_cc',
     'test_repeated_fc_relu_fuse_pass_cc',
@@ -1775,7 +1775,7 @@ TETRAD_PARALLEL_JOB = [
     'test_fc_gru_fuse_pass_cc',
     'test_conv_bn_fuse_pass_cc',
     'test_adaptive_pool2d_convert_global_pass',
-    'test_unsqueeze2_eltwise_fuse_pass',
+    'test_unsqueeze2_eltwise_fuse_pass_cc',
     'test_layer_norm_fuse_pass_cc',
     'test_fc_act_mkldnn_fuse_pass',
     'test_fleet_cc',
-- 
GitLab