Commit d6dc542

【Paddle-TensorRT】fix pd_op.any (#72192)
* support fp32
* fix pd_op.fused_conv2d
* simplified code
* fix pd_op.any
* fix pd_op.fused_conv2d_add_act
* fix

Co-authored-by: YuanRisheng <[email protected]>
1 parent aeb4df6 commit d6dc542

4 files changed: +55 -52 lines changed

python/paddle/tensorrt/converter_utils.py

+30 -47
@@ -669,38 +669,16 @@ def convert_conv2d(network, paddle_op, inputs):
     if paddle_op.name() == "pd_op.fused_conv2d_add_act":
         constant_manager = TensorRTConstantManager()
         bias_source_op = paddle_op.operands()[2].source().get_defining_op()
-
-        def get_bias_weights(current_op):
-            if current_op.name() == "builtin.parameter":
-                bias_name = current_op.attrs()["parameter_name"]
-            elif current_op.name() == "builtin.constant":
-                bias_name = current_op.attrs()["value"]
-            else:
-                raise ValueError(
-                    f"Unsupported bias source operation: {current_op.name()}"
-                )
-
-            bias_np = constant_manager.get_constant_value(bias_name)
-            return trt.Weights(bias_np)
-
-        if bias_source_op.name() in ["builtin.parameter", "builtin.constant"]:
-            bias_weights = get_bias_weights(bias_source_op)
+        if bias_source_op.name() == "builtin.parameter":
+            bias_name = bias_source_op.attrs()['parameter_name']
+        elif bias_source_op.name() == "builtin.constant":
+            bias_name = bias_source_op.attrs()['value']
         else:
-            while bias_source_op.name() == "pd_op.reshape":
-                bias_source_op = (
-                    bias_source_op.operands()[0].source().get_defining_op()
-                )
-                if bias_source_op.name() in [
-                    "builtin.parameter",
-                    "builtin.constant",
-                ]:
-                    bias_weights = get_bias_weights(bias_source_op)
-                    break
-                else:
-                    raise ValueError(
-                        f"Unsupported bias source operation: {bias_source_op.name()}"
-                    )
-
+            raise ValueError(
+                f"Unsupported bias source op: {bias_source_op.name()}"
+            )
+        bias_np = constant_manager.get_constant_value(bias_name)
+        bias_weights = trt.Weights(bias_np)
         layer = network.add_convolution_nd(
             input=input_tensor,
             num_output_maps=n_output,
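
Note: the rewritten branch resolves the bias by name and wraps the host array in trt.Weights, which is the form add_convolution_nd expects for its bias argument. A minimal sketch of that pattern, with a plain dict standing in for the constant lookup (names here are illustrative, not the converter's API):

    import numpy as np
    import tensorrt as trt  # assumes the TensorRT Python bindings are installed

    # Hypothetical constant table; the real converter resolves names through
    # TensorRTConstantManager.get_constant_value() instead.
    constants = {"conv2d_0.b_0": np.zeros((16,), dtype=np.float32)}

    bias_np = constants["conv2d_0.b_0"]
    bias_weights = trt.Weights(bias_np)  # host buffer handed to add_convolution_nd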
@@ -897,27 +875,32 @@ def add_cast_reduce_layer(network, paddle_op, inputs, op_type):

     axis = paddle_op.attrs().get("axis")
     input_shape = paddle_op.operands()[0].source().shape
-    keepdim = paddle_op.attrs()["keepdim"]
-    if network.has_implicit_batch_dimension:
-        assert (
-            axis != 0
-        ), "can't reduce on axis == 0 when network has implicit batch dimension"
-    output_shape = []
+    input_dims = len(input_shape)
+    keepdim = paddle_op.attrs().get("keepdim")
+
     if len(axis) == 0:
-        axis = list(range(len(input_shape)))
-    for i in range(len(axis)):
-        if axis[i] < 0:
-            axis[i] = len(input_shape) + axis[i]
-    layer = network.add_reduce(
+        axes = 0
+        for i in range(input_dims):
+            axes |= 1 << i
+    else:
+        for i in range(len(axis)):
+            if axis[i] < 0:
+                axis[i] += input_dims
+
+        axes = get_axes_for_reduce_op(axis)
+
+    reduce_layer = network.add_reduce(
         cast_layer.get_output(0),
         op_type,
-        axes=get_axes_for_reduce_op(axis),
+        axes=axes,
         keep_dims=keepdim,
     )
-    set_layer_name(layer, paddle_op)
-    layer.set_output_type(0, trt.bool)
-    layer.get_output(0).dtype = cast_layer.get_output(0).dtype
-    return layer.get_output(0)
+    set_layer_name(reduce_layer, paddle_op)
+    bool_layer = network.add_identity(reduce_layer.get_output(0))
+    set_layer_name(bool_layer, paddle_op)
+    bool_layer.set_output_type(0, trt.bool)
+    bool_layer.get_output(0).dtype = trt.bool
+    return bool_layer.get_output(0)


 def fix_negative_indices(network, input_shape, indices, name=None):
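
Note: TensorRT's add_reduce takes its axes argument as a bitmask in which bit i selects dimension i. The new branch builds the full-rank mask by hand when axis is empty and otherwise normalizes negative axes before calling get_axes_for_reduce_op. A standalone sketch of that encoding (the helper name is illustrative):

    def axes_bitmask(axis, rank):
        # Bit i set -> reduce dimension i, mirroring the logic above.
        if len(axis) == 0:  # empty axis list means "reduce every dimension"
            return (1 << rank) - 1
        mask = 0
        for a in axis:
            mask |= 1 << (a + rank if a < 0 else a)  # normalize negative axes
        return mask

    # pd_op.any with axis=[-1] on a rank-3 input reduces only the last dimension.
    assert axes_bitmask([-1], rank=3) == 0b100
    assert axes_bitmask([], rank=3) == 0b111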

python/paddle/tensorrt/impls/activation.py

+1 -1
@@ -150,7 +150,7 @@ def gelu_converter(network, paddle_op, inputs):
     )
     constant_layer_sqrt = add_constant_layer(
         network,
-        [0.7978845608028654],
+        [0.79788456080286535587989211986876],
         const_shape,
         np.float32,
         name=[paddle_op.name(), "constant_layer_sqrt"],
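
Note: both literals are the tanh-GELU constant sqrt(2/π); the longer one simply spells out more digits than np.float32 (or float64) can hold, so the stored constant should be unchanged. A quick check, not part of the patch:

    import math
    import numpy as np

    print(math.sqrt(2.0 / math.pi))  # 0.7978845608028654
    # The two literals collapse to the same float32 value that
    # add_constant_layer stores via np.float32.
    print(
        np.float32(0.7978845608028654)
        == np.float32(0.79788456080286535587989211986876)
    )  # True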

test/tensorrt/CMakeLists.txt

+2 -2
@@ -16,8 +16,8 @@ if(NOT WIN32 AND TENSORRT_FOUND)
   set_tests_properties(test_converter_norm PROPERTIES TIMEOUT "300")
   set_tests_properties(test_converter_ops PROPERTIES TIMEOUT "600")
   set_tests_properties(test_converter_stat PROPERTIES TIMEOUT "300")
-  set_tests_properties(test_converter_math PROPERTIES TIMEOUT "600")
-  set_tests_properties(test_converter_activation PROPERTIES TIMEOUT "600")
+  set_tests_properties(test_converter_math PROPERTIES TIMEOUT "900")
+  set_tests_properties(test_converter_activation PROPERTIES TIMEOUT "900")
   set_tests_properties(test_converter_others PROPERTIES TIMEOUT "300")
   set_tests_properties(test_converter_manipulation PROPERTIES TIMEOUT "600")
   set_tests_properties(test_converter_creation PROPERTIES TIMEOUT "300")

test/tensorrt/test_converter_math.py

+22 -2
@@ -260,7 +260,7 @@ def setUp(self):
         self.python_api = paddle.any
         self.api_args = {
             "x": np.random.randn(2, 3, 2).astype("bool"),
-            "axis": [1, 1],
+            "axis": [1],
             "keepdim": True,
         }
         self.program_config = {"feed_list": ["x"]}
@@ -277,7 +277,24 @@ def setUp(self):
         self.python_api = paddle.any
         self.api_args = {
             "x": np.random.randn(2, 3, 2).astype("bool"),
-            "axis": [1, 1],
+            "axis": [1],
+            "keepdim": False,
+        }
+        self.program_config = {"feed_list": ["x"]}
+        self.min_shape = {"x": [1, 3, 2]}
+        self.opt_shape = {"x": [2, 3, 2]}
+        self.max_shape = {"x": [5, 3, 2]}
+
+    def test_trt_result(self):
+        self.check_trt_result()
+
+
+class TestAny2TRTPattern(TensorRTBaseTest):
+    def setUp(self):
+        self.python_api = paddle.any
+        self.api_args = {
+            "x": np.random.randn(2, 3, 2).astype("bool"),
+            "axis": [-1],
             "keepdim": False,
         }
         self.program_config = {"feed_list": ["x"]}
@@ -288,6 +305,9 @@ def setUp(self):
     def test_trt_result(self):
         self.check_trt_result()

+    def test_trt_result_fp16(self):
+        self.check_trt_result(precision_mode="fp16")
+

 class TestAllTRTPattern(TensorRTBaseTest):
     def setUp(self):
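
Note: the reworked cases each reduce a single axis (including a negative one) with and without keepdim; the reductions they exercise match NumPy's any. A reference sketch of the expected shapes, not part of the test file:

    import numpy as np

    x = np.random.randn(2, 3, 2) > 0          # bool input, same shape as the tests

    out_keep = x.any(axis=1, keepdims=True)   # axis=[1], keepdim=True  -> (2, 1, 2)
    out_drop = x.any(axis=1)                  # axis=[1], keepdim=False -> (2, 2)
    out_neg = x.any(axis=-1)                  # axis=[-1]               -> (2, 3)

    print(out_keep.shape, out_drop.shape, out_neg.shape)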
