Skip to content

Commit 5edb171

Browse files
修复 groupwise weight-only bug (#72710)
1 parent dc813e5 commit 5edb171

File tree

1 file changed

+2
-1
lines changed
  • paddle/phi/kernels/fusion/cutlass/cutlass_extensions/gemm/threadblock

1 file changed

+2
-1
lines changed

paddle/phi/kernels/fusion/cutlass/cutlass_extensions/gemm/threadblock/dq_mma_base.h

+2-1
Original file line number | Diff line number | Diff line change
@@ -169,7 +169,8 @@ class DqMmaBase {
169169
AlignedBuffer<typename Operator::ElementB, ShapeB::kCount> operand_B;
170170

171171
/// Buffer to hold scales for threadblock
172-
AlignedBuffer<ElementScale, Shape::kN> operand_scale;
172+
/// Note(zkk): allocate kStages times more scale storage (Shape::kN * kStages); the extra space is used by group-wise weight-only.
173+
AlignedBuffer<ElementScale, Shape::kN * kStages> operand_scale;
173174

174175
public:
175176
//

0 commit comments

Comments
 (0)