Commit 09961b0

【Paddle TensorRT】add Bool output type support for fill_any_like with tensorrt > 8.5 (#71718)

Commit message:
* add_fill_any_like_bool
* fix codestyle
* add bool test
* fix
* fix codestyle
* Update test_trt_convert_fill_any_like.py
* Update test_trt_convert_fill_any_like.py
* Update CMakeLists.txt
* fix codestyle
* ban fill_any_like in win32

1 parent: da36481
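
As a quick illustration of what the commit enables (the snippet below is illustrative, not part of the commit): fill_any_like is the operator behind paddle.full_like, and with this change its bool output can be lowered to a TensorRT constant on TensorRT newer than 8.5 instead of falling back to Paddle.

# Illustrative only, not from the commit. fill_any_like is the op behind
# paddle.full_like; dtype code 0 is BOOL in Paddle's VarType enum.
import paddle

x = paddle.randn([1, 1, 4, 6])
y = paddle.full_like(x, 1, dtype='bool')  # an all-True tensor shaped like x
print(y.dtype)  # paddle.bool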

File tree

4 files changed: +170 −2 lines

paddle/fluid/inference/tensorrt/convert/fill_any_like_op.cc (5 additions, 0 deletions)

@@ -40,6 +40,11 @@ class FillAnyLikeOpConverter : public OpConverter {
                        "will be cast to int32.";
       value_tensor = Add1DConstantLayer(static_cast<int32_t>(value),
                                         output_name + "_value_tensor_");
+    } else if (dtype == 0) {
+      LOG(WARNING) << "the fill_any_like has int32 dtype and 0 dtype, it "
+                      "will be cast to bool.";
+      value_tensor = Add1DConstantLayer(static_cast<bool>(value),
+                                        output_name + "_value_tensor_");
     } else {
       value_tensor = Add1DConstantLayer(value, output_name + "_value_tensor_");
     }
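
Context for the dtype check (an inference from Paddle's VarType codes, not stated in the diff): dtype == 0 is BOOL, so the new branch builds the 1-D fill-value constant as a bool. A hypothetical Python mirror of the branching, with illustrative names:

# Hypothetical mirror of the converter's fill-value handling; VARTYPE_BOOL
# and the function name are illustrative, not Paddle API.
VARTYPE_BOOL = 0  # the code the converter tests with `dtype == 0`

def fill_value_for(dtype_code: int, value: float):
    if dtype_code == VARTYPE_BOOL:
        return bool(value)  # new branch: emit the 1-D constant as a bool
    return value            # other dtypes keep their existing paths

Note that the LOG(WARNING) text in the new branch ("has int32 dtype and 0 dtype ... cast to bool") reads like a leftover from the int32 branch above it.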

paddle/fluid/inference/tensorrt/convert/op_converter.h (4 additions, 2 deletions)

@@ -734,7 +734,7 @@ class OpConverter {
                          bool scalar = false) {
     if (!(std::is_same<T, float>::value ||
           std::is_same<T, phi::dtype::float16>::value ||
-          std::is_same<T, int32_t>::value)) {
+          std::is_same<T, int32_t>::value || std::is_same<T, bool>::value)) {
       PADDLE_THROW(common::errors::InvalidArgument(
           "Unsupported data type (%s) for TensorRT AddConstantLayer, only "
           "supports float, half or int32_t."));
@@ -750,7 +750,9 @@ class OpConverter {
     engine_->SetWeights(weight_name, std::move(tmp_tensor));

     nvinfer1::DataType trt_dtype = nvinfer1::DataType::kFLOAT;
-    if (std::is_integral<T>::value) {
+    if (std::is_same<T, bool>::value) {
+      trt_dtype = nvinfer1::DataType::kBOOL;
+    } else if (std::is_integral<T>::value) {
       trt_dtype = nvinfer1::DataType::kINT32;
     }
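
Two details worth noting in this hunk. First, bool is an integral type in C++ (std::is_integral<bool>::value is true), so the new kBOOL case must be tested before the integral check, or bool weights would silently map to kINT32. Second, the PADDLE_THROW message still says "only supports float, half or int32_t" even though bool is now accepted. A sketch of the resulting dispatch, mirrored in Python (not Paddle code):

import numpy as np

# Sketch of the dtype dispatch AddConstantLayer now performs; the bool test
# comes first, mirroring the ordering the C++ code depends on.
def trt_dtype_for(dtype) -> str:
    if dtype == np.bool_:                 # new mapping from this commit
        return "kBOOL"
    if np.issubdtype(dtype, np.integer):  # all other integral types
        return "kINT32"
    return "kFLOAT"                       # default

assert trt_dtype_for(np.bool_) == "kBOOL"
assert trt_dtype_for(np.int32) == "kINT32"
assert trt_dtype_for(np.float32) == "kFLOAT"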

test/ir/inference/CMakeLists.txt (3 additions, 0 deletions)

@@ -73,6 +73,9 @@ if(WIN32)
                   "test_trt_explicit_quantization_mobilenet")
   list(REMOVE_ITEM TEST_INFERENCE_IR_PASSES
        "test_trt_explicit_quantization_mobilenet")
+  list(REMOVE_ITEM TEST_TRT_IR_PASSES "test_trt_convert_fill_any_like")
+  list(REMOVE_ITEM TEST_INFERENCE_IR_PASSES "test_trt_convert_fill_any_like")
+  list(REMOVE_ITEM TEST_TRT_CONVERTER "test_trt_convert_fill_any_like")
 endif()

 foreach(TEST_INFERENCE_IR_PASS ${TEST_TRT_IR_PASSES})
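
This is the "ban fill_any_like in win32" item from the commit message: inside the WIN32 branch, the new test is removed from all three test lists, so it runs only on the other CI platforms.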

test/ir/inference/test_trt_convert_fill_any_like.py (158 additions, 0 deletions)

@@ -192,5 +192,163 @@ def test(self):
         self.run_test(run_pir=True)


+class TrtConvertExpandV2BoolTest(TrtLayerAutoScanTest):
+    def is_program_valid(self, program_config: ProgramConfig) -> bool:
+        if self.dtype in [1, 4]:
+            return False
+        if self.dims != 4 and self.dtype != 2:
+            return False
+        return True
+
+    def sample_program_configs(self):
+        def generate_input1(attrs: list[dict[str, Any]]):
+            if self.dims == 4:
+                self.input_shape = [1, 1, 4, 6]
+                if self.dtype == 0:
+                    return np.random.random([1, 1, 4, 6]).astype(np.bool_)
+            elif self.dims == 3:
+                self.input_shape = [1, 8, 6]
+                return np.random.random([1, 8, 6]).astype(np.int32)
+            elif self.dims == 2:
+                self.input_shape = [1, 48]
+                return np.random.random([1, 48]).astype(np.int32)
+            elif self.dims == 1:
+                self.input_shape = [48]
+                return np.random.random([48]).astype(np.int32)
+
+        def generate_weight1(attrs: list[dict[str, Any]]):
+            return np.array([1, 48]).astype(np.int32)
+
+        def generate_shapeT1_data(attrs: list[dict[str, Any]]):
+            return np.array([2]).astype(np.int32)
+
+        def generate_shapeT2_data(attrs: list[dict[str, Any]]):
+            return np.array([24]).astype(np.int32)
+
+        for dims in [1, 2, 3, 4]:
+            for value in [0, 1]:
+                for dtype in [0]:
+                    dics = [
+                        {
+                            "value": value,
+                            "dtype": dtype,
+                        },
+                    ]
+                    self.dims = dims
+                    self.dtype = dtype
+                    dics_input = [{"X": ["fill_any_like_input"]}]
+
+                    ops_config = [
+                        {
+                            "op_type": "fill_any_like",
+                            "op_inputs": dics_input[0],
+                            "op_outputs": {"Out": ["fill_any_like_out"]},
+                            "op_attrs": dics[0],
+                        }
+                    ]
+                    ops = self.generate_op_config(ops_config)
+                    program_config = ProgramConfig(
+                        ops=ops,
+                        weights={},
+                        inputs={
+                            "fill_any_like_input": TensorConfig(
+                                data_gen=partial(generate_input1, dics)
+                            )
+                        },
+                        outputs=["fill_any_like_out"],
+                    )
+
+                    yield program_config
+
+    def sample_predictor_configs(
+        self, program_config
+    ) -> tuple[paddle_infer.Config, list[int], int]:
+
+        def generate_dynamic_shape(attrs):
+            if self.dims == 4:
+                self.dynamic_shape.min_input_shape = {
+                    "fill_any_like_input": [1, 1, 4, 6]
+                }
+                self.dynamic_shape.max_input_shape = {
+                    "fill_any_like_input": [10, 1, 4, 6]
+                }
+                self.dynamic_shape.opt_input_shape = {
+                    "fill_any_like_input": [1, 1, 4, 6]
+                }
+            elif self.dims == 3:
+                self.dynamic_shape.min_input_shape = {
+                    "fill_any_like_input": [1, 8, 6]
+                }
+                self.dynamic_shape.max_input_shape = {
+                    "fill_any_like_input": [4, 8, 6]
+                }
+                self.dynamic_shape.opt_input_shape = {
+                    "fill_any_like_input": [1, 8, 6]
+                }
+            elif self.dims == 2:
+                self.dynamic_shape.min_input_shape = {
+                    "fill_any_like_input": [1, 48]
+                }
+                self.dynamic_shape.max_input_shape = {
+                    "fill_any_like_input": [4, 48]
+                }
+                self.dynamic_shape.opt_input_shape = {
+                    "fill_any_like_input": [1, 48]
+                }
+            elif self.dims == 1:
+                self.dynamic_shape.min_input_shape = {
+                    "fill_any_like_input": [48]
+                }
+                self.dynamic_shape.max_input_shape = {
+                    "fill_any_like_input": [48]
+                }
+                self.dynamic_shape.opt_input_shape = {
+                    "fill_any_like_input": [48]
+                }
+
+        def clear_dynamic_shape():
+            self.dynamic_shape.min_input_shape = {}
+            self.dynamic_shape.max_input_shape = {}
+            self.dynamic_shape.opt_input_shape = {}
+
+        def generate_trt_nodes_num(attrs, dynamic_shape):
+            if not dynamic_shape:
+                return 0, 3
+            else:
+                return 1, 2
+
+        attrs = [
+            program_config.ops[i].attrs for i in range(len(program_config.ops))
+        ]
+
+        clear_dynamic_shape()
+        self.trt_param.precision = paddle_infer.PrecisionType.Float32
+        yield self.create_inference_config(), generate_trt_nodes_num(
+            attrs, False
+        ), 1e-5
+        self.trt_param.precision = paddle_infer.PrecisionType.Half
+        yield self.create_inference_config(), generate_trt_nodes_num(
+            attrs, False
+        ), 1e-5
+
+        # for dynamic_shape
+        generate_dynamic_shape(attrs)
+        self.trt_param.precision = paddle_infer.PrecisionType.Float32
+        yield self.create_inference_config(), generate_trt_nodes_num(
+            attrs, True
+        ), 1e-5
+        self.trt_param.precision = paddle_infer.PrecisionType.Half
+        yield self.create_inference_config(), generate_trt_nodes_num(
+            attrs, True
+        ), 1e-5
+
+    def add_skip_trt_case(self):
+        pass
+
+    def test(self):
+        self.add_skip_trt_case()
+        self.run_test()
+
+
 if __name__ == "__main__":
     unittest.main()
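
A note on the new test class: the name TrtConvertExpandV2BoolTest looks carried over from the expand_v2 test this file was adapted from, and the generate_weight1 and generate_shapeT*_data helpers are defined but unused, another sign of the copy origin; what it actually exercises is fill_any_like with dtype 0 (bool). To run just this case locally, a sketch (assumes a Paddle build with TensorRT and the test file's directory on sys.path):

# Sketch: load and run only the new test case.
import unittest

from test_trt_convert_fill_any_like import TrtConvertExpandV2BoolTest

suite = unittest.defaultTestLoader.loadTestsFromTestCase(
    TrtConvertExpandV2BoolTest
)
unittest.TextTestRunner(verbosity=2).run(suite)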
