
Commit 803909e

[CINN] Clean some code (#69520)
* fused_attention
* Fix compile
* refine code
* refine code
* clean useless code
* clean useless code
* use const && some todo
1 parent ea2bc4d commit 803909e

4 files changed: +29 −202 lines changed


paddle/fluid/pir/dialect/operator/interface/infer_symbolic_shape/binary_infer_sym.cc

Lines changed: 3 additions & 2 deletions
@@ -2385,8 +2385,9 @@ bool WeightDequantizeOpInferSymbolicShape(
       common::errors::InvalidArgument(
           "The x tensor of dequantize op must be 2D, but got[%d]",
           x_shape.size()));
-  int group_size = op->attribute<pir::Int32Attribute>("group_size").data();
-  std::string algo = op->attribute<pir::StrAttribute>("algo").AsString();
+  const int group_size =
+      op->attribute<pir::Int32Attribute>("group_size").data();
+  const std::string algo = op->attribute<pir::StrAttribute>("algo").AsString();
   PADDLE_ENFORCE_EQ(
       (group_size == -1 || group_size == 64 || group_size == 128),
       true,
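
Across the three infer_symbolic_shape files touched here, the C++ changes follow one pattern: each attribute is read once into a const local and then validated. A minimal, self-contained sketch of that pattern follows; FakeOp and its accessors are hypothetical stand-ins for illustration, not the real pir::Operation API.

// Minimal sketch of the "const attribute read + validation" pattern used in
// this commit. FakeOp is a hypothetical stand-in, not the real pir API.
#include <cassert>
#include <iostream>
#include <map>
#include <string>

struct FakeOp {
  std::map<std::string, int> int_attrs;
  std::map<std::string, std::string> str_attrs;
  int int_attr(const std::string &name) const { return int_attrs.at(name); }
  const std::string &str_attr(const std::string &name) const {
    return str_attrs.at(name);
  }
};

bool InferWeightQuantizeLike(const FakeOp &op) {
  // Mirrors: const int group_size =
  //     op->attribute<pir::Int32Attribute>("group_size").data();
  const int group_size = op.int_attr("group_size");
  const std::string algo = op.str_attr("algo");

  // Same check as the PADDLE_ENFORCE_EQ in the diff:
  // group_size must be -1, 64, or 128.
  if (!(group_size == -1 || group_size == 64 || group_size == 128)) {
    std::cerr << "unsupported group_size: " << group_size << "\n";
    return false;
  }
  std::cout << "algo=" << algo << ", group_size=" << group_size << "\n";
  return true;
}

int main() {
  const FakeOp op{{{"group_size", 64}}, {{"algo", "weight_only_int8"}}};
  assert(InferWeightQuantizeLike(op));
  return 0;
}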

paddle/fluid/pir/dialect/operator/interface/infer_symbolic_shape/multiary_infer_sym.cc

Lines changed: 23 additions & 24 deletions
@@ -1676,14 +1676,14 @@ bool FusedAttentionOpInferSymbolicShape(
   symbol::DimExpr dim_head = 0;
   symbol::DimExpr hidden_size = 0;
   symbol::DimExpr nranks = 1;
-  bool transpose_qkv_wb =
+  const bool transpose_qkv_wb =
       op->attribute<pir::BoolAttribute>("transpose_qkv_wb").data();
-  int num_heads_ = op->attribute<pir::Int32Attribute>("num_heads").data();
+  const int num_heads_ = op->attribute<pir::Int32Attribute>("num_heads").data();
   symbol::DimExpr num_heads = symbol::DimExpr(num_heads_);
-  int ring_id = op->attribute<pir::Int32Attribute>("ring_id").data();
-  bool pre_layer_norm =
+  const int ring_id = op->attribute<pir::Int32Attribute>("ring_id").data();
+  const bool pre_layer_norm =
       op->attribute<pir::BoolAttribute>("pre_layer_norm").data();
-  bool is_test = op->attribute<pir::BoolAttribute>("is_test").data();
+  const bool is_test = op->attribute<pir::BoolAttribute>("is_test").data();
   if (transpose_qkv_wb) {
     PADDLE_ENFORCE_EQ(qkv_weight_shape.size(),
                       2,
@@ -1747,7 +1747,7 @@ bool FusedAttentionOpInferSymbolicShape(
           symbol::ShapeOrDataDimExprs{
               symbol::TensorShapeOrDataDimExprs(x_shape)});
     } else {
-      // The follwing three code used to set unoptional output value.
+      // The following three code used to set unoptional output value.
       // Now it's result related to the infermeta.
       infer_context->SetSymbolForValueByStaticShape(op->result(0));
       infer_context->SetSymbolForValueByStaticShape(op->result(1));
@@ -1793,6 +1793,8 @@ bool FusedAttentionOpInferSymbolicShape(
               x_shape[1],
               symbol::DimExpr(3) * num_heads * dim_head})});
     } else {
+      // The following code used to set unoptional output value.
+      // Now it's result related to the infermeta.
       infer_context->SetSymbolForValueByStaticShape(op->result(4));
     }
   } else {
@@ -1815,6 +1817,8 @@ bool FusedAttentionOpInferSymbolicShape(
               num_heads,
               dim_head})});
     } else {
+      // The following code used to set unoptional output value.
+      // Now it's result related to the infermeta.
       infer_context->SetSymbolForValueByStaticShape(op->result(4));
     }
   }
@@ -1863,7 +1867,7 @@ bool FusedAttentionOpInferSymbolicShape(
         symbol::ShapeOrDataDimExprs{symbol::TensorShapeOrDataDimExprs(
             {x_shape[0], num_heads, x_shape[1], out_seq_len})});
   } else {
-    // The follwing code used to set unoptional output value.
+    // The following code used to set unoptional output value.
     // Now it's result related to the infermeta.
     infer_context->SetSymbolForValueByStaticShape(op->result(11));
   }
@@ -1878,7 +1882,7 @@ bool FusedAttentionOpInferSymbolicShape(
         symbol::ShapeOrDataDimExprs{symbol::TensorShapeOrDataDimExprs(
             {x_shape[0], num_heads, x_shape[1], out_seq_len})});
   } else {
-    // The follwing code used to set unoptional output value.
+    // The following code used to set unoptional output value.
     // Now it's result related to the infermeta.
     infer_context->SetSymbolForValueByStaticShape(op->result(9));
   }
@@ -1910,7 +1914,7 @@ bool FusedAttentionOpInferSymbolicShape(
         symbol::ShapeOrDataDimExprs{
             symbol::TensorShapeOrDataDimExprs(x_shape)});
   } else {
-    // The follwing code used to set unoptional output value.
+    // The following code used to set unoptional output value.
     // Now it's result related to the infermeta.
     infer_context->SetSymbolForValueByStaticShape(op->result(14));
   }
@@ -3350,9 +3354,8 @@ bool LstmOpInferSymbolicShape(pir::Operation *op,
   const symbol::ShapeOrDataDimExprs &bias_shape_or_data =
       infer_context->GetShapeOrDataForValue(op->operand_source(4));
   const auto &bias_shape = bias_shape_or_data.shape();
-  bool use_peepholes =
+  const bool use_peepholes =
       op->attribute<pir::BoolAttribute>("use_peepholes").data();
-  bool is_test = op->attribute<pir::BoolAttribute>("is_test").data();
   PADDLE_ENFORCE_EQ(
       input_shape.size(),
       2,
@@ -3394,19 +3397,15 @@ bool LstmOpInferSymbolicShape(pir::Operation *op,
       symbol::ShapeOrDataDimExprs{symbol::TensorShapeOrDataDimExprs(out_shape)};
   infer_context->SetShapeOrDataForValue(op->result(0), out_shape_or_data);
   infer_context->SetShapeOrDataForValue(op->result(1), out_shape_or_data);
-  if (!is_test) {
-    infer_context->SetShapeOrDataForValue(
-        op->result(2),
-        symbol::ShapeOrDataDimExprs{
-            symbol::TensorShapeOrDataDimExprs(input_shape)});
-    infer_context->SetShapeOrDataForValue(op->result(3), out_shape_or_data);
-  } else {
-    infer_context->SetShapeOrDataForValue(
-        op->result(2),
-        symbol::ShapeOrDataDimExprs{
-            symbol::TensorShapeOrDataDimExprs(input_shape)});
-    infer_context->SetShapeOrDataForValue(op->result(3), out_shape_or_data);
-  }
+
+  // Based on the kernel and infermeta, the inferred results are the same
+  // regardless of whether is_test is true or false.
+  infer_context->SetShapeOrDataForValue(
+      op->result(2),
+      symbol::ShapeOrDataDimExprs{
+          symbol::TensorShapeOrDataDimExprs(input_shape)});
+  infer_context->SetShapeOrDataForValue(op->result(3), out_shape_or_data);
+
   return true;
 }
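
In the LstmOp hunk above, the removed if (!is_test) branch had two identical arms, so the conditional carried no information; the new comment records that the inference does not depend on is_test. A small, compilable illustration of that simplification, with stand-in types and only suggestive output names (not the Paddle source):

// Toy illustration of the LstmOp cleanup: when both arms of a conditional
// perform exactly the same assignments, the branch can be removed without
// changing behavior. Shape/Results are stand-ins, not pir/Paddle types.
#include <cassert>
#include <vector>

using Shape = std::vector<int>;

struct Results {
  Shape result2;  // e.g. the shape set for op->result(2)
  Shape result3;  // e.g. the shape set for op->result(3)
};

// Before: is_test selected between two identical arms.
Results InferBefore(bool is_test, const Shape &input_shape,
                    const Shape &out_shape) {
  Results r;
  if (!is_test) {
    r.result2 = input_shape;
    r.result3 = out_shape;
  } else {
    r.result2 = input_shape;
    r.result3 = out_shape;
  }
  return r;
}

// After: the inferred shapes do not depend on is_test, so the flag (and the
// branch) are gone.
Results InferAfter(const Shape &input_shape, const Shape &out_shape) {
  return Results{input_shape, out_shape};
}

int main() {
  const Shape input{64, 28};
  const Shape out{64, 7};
  for (bool is_test : {false, true}) {
    const Results before = InferBefore(is_test, input, out);
    const Results after = InferAfter(input, out);
    assert(before.result2 == after.result2);
    assert(before.result3 == after.result3);
  }
  return 0;
}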

paddle/fluid/pir/dialect/operator/interface/infer_symbolic_shape/unary_infer_sym.cc

Lines changed: 3 additions & 2 deletions
@@ -4454,8 +4454,9 @@ bool WeightQuantizeOpInferSymbolicShape(
                         x_shape_1));
   }
 
-  int group_size = op->attribute<pir::Int32Attribute>("group_size").data();
-  std::string algo = op->attribute<pir::StrAttribute>("algo").AsString();
+  const int group_size =
+      op->attribute<pir::Int32Attribute>("group_size").data();
+  const std::string algo = op->attribute<pir::StrAttribute>("algo").AsString();
   PADDLE_ENFORCE_EQ(
       ((group_size == -1) || (group_size == 64) || (group_size == 128)),
       true,

test/legacy_test/test_fused_attention_op_api.py

Lines changed: 0 additions & 174 deletions
@@ -20,24 +20,6 @@
 from paddle.incubate.nn.layer.fused_transformer import FusedMultiHeadAttention
 
 
-def check_symbolic_result(program, fetch_vars, outs, op_type):
-    if paddle.base.libpaddle.pir.all_ops_defined_symbol_infer(program):
-        shape_analysis = (
-            paddle.base.libpaddle.pir.get_shape_constraint_ir_analysis(program)
-        )
-        for i, var in enumerate(fetch_vars):
-            if var.is_dense_tensor_type() or var.is_selected_row_type():
-                shape_or_data = shape_analysis.get_shape_or_data_for_var(var)
-                expect_shape = outs[i].shape
-                expect_data = []
-                if not shape_or_data.is_equal(expect_shape, expect_data):
-                    raise AssertionError(
-                        f"The shape or data of Operator {op_type}'s result is different from expected."
-                    )
-            else:
-                pass
-
-
 def fc(x, weight):
     return np.matmul(x, weight)

@@ -425,20 +407,6 @@ def run_static(self):
                         fused_attn.pre_ln_scale,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.linear_weight,
-                        fused_attn.pre_ln_scale,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [out, qkv_weight, out_linear_weight, ln_scale],
-                    'fused_attention',
-                )
             else:
                 out, qkv_weight, out_linear_weight, ln_2_scale = exe.run(
                     paddle.static.default_main_program(),
@@ -450,20 +418,6 @@ def run_static(self):
                         fused_attn.ln_scale,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.linear_weight,
-                        fused_attn.ln_scale,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [out, qkv_weight, out_linear_weight, ln_2_scale],
-                    'fused_attention',
-                )
         else:
             if self.pre_layer_norm:
                 (
@@ -487,31 +441,6 @@ def run_static(self):
                         fused_attn.pre_ln_bias,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.qkv_bias,
-                        fused_attn.linear_weight,
-                        fused_attn.linear_bias,
-                        fused_attn.pre_ln_scale,
-                        fused_attn.pre_ln_bias,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [
-                        out,
-                        qkv_weight,
-                        qkv_bias,
-                        out_linear_weight,
-                        linear_bias,
-                        ln_scale,
-                        ln_bias,
-                    ],
-                    'fused_attention',
-                )
             else:
                 (
                     out,
@@ -534,31 +463,6 @@ def run_static(self):
                         fused_attn.ln_bias,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.qkv_bias,
-                        fused_attn.linear_weight,
-                        fused_attn.linear_bias,
-                        fused_attn.ln_scale,
-                        fused_attn.ln_bias,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [
-                        out,
-                        qkv_weight,
-                        qkv_bias,
-                        out_linear_weight,
-                        linear_bias,
-                        ln_2_scale,
-                        ln_2_bias,
-                    ],
-                    'fused_attention',
-                )
     else:
         if self.bias_attr is False:
             if self.pre_layer_norm:
@@ -574,20 +478,6 @@ def run_static(self):
                         fused_attn.pre_ln_scale,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.linear_weight,
-                        fused_attn.pre_ln_scale,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [out, qkv_weight, out_linear_weight, ln_scale],
-                    'fused_attention',
-                )
             else:
                 out, qkv_weight, out_linear_weight, ln_2_scale = exe.run(
                     paddle.static.default_main_program(),
@@ -601,20 +491,6 @@ def run_static(self):
                         fused_attn.ln_scale,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.linear_weight,
-                        fused_attn.ln_scale,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [out, qkv_weight, out_linear_weight, ln_2_scale],
-                    'fused_attention',
-                )
         else:
             if self.pre_layer_norm:
                 (
@@ -640,31 +516,6 @@ def run_static(self):
                         fused_attn.pre_ln_bias,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.qkv_bias,
-                        fused_attn.linear_weight,
-                        fused_attn.linear_bias,
-                        fused_attn.pre_ln_scale,
-                        fused_attn.pre_ln_bias,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [
-                        out,
-                        qkv_weight,
-                        qkv_bias,
-                        out_linear_weight,
-                        linear_bias,
-                        ln_scale,
-                        ln_bias,
-                    ],
-                    'fused_attention',
-                )
             else:
                 (
                     out,
@@ -689,31 +540,6 @@ def run_static(self):
                         fused_attn.ln_bias,
                     ],
                 )
-                fetch_list = exe._check_fetch_list(
-                    [
-                        final_out,
-                        fused_attn.qkv_weight,
-                        fused_attn.qkv_bias,
-                        fused_attn.linear_weight,
-                        fused_attn.linear_bias,
-                        fused_attn.ln_scale,
-                        fused_attn.ln_bias,
-                    ]
-                )
-                check_symbolic_result(
-                    paddle.static.default_main_program(),
-                    fetch_list,
-                    [
-                        out,
-                        qkv_weight,
-                        qkv_bias,
-                        out_linear_weight,
-                        linear_bias,
-                        ln_2_scale,
-                        ln_2_bias,
-                    ],
-                    'fused_attention',
-                )
         return (
             out,
             qkv_weight,
