Skip to content

Commit 3d507f6

Browse files
authored
update moe ffn tune config (#72583)
1 parent cefc437 commit 3d507f6

File tree

2 files changed

+8
-1
lines changed

2 files changed

+8
-1
lines changed

paddle/phi/kernels/fusion/cutlass/cutlass_extensions/ft_gemm_configs.h

+3-1
Original file line number | Diff line number | Diff line change
@@ -48,16 +48,18 @@ enum class CutlassTileConfig {
4848
// Warp configs for M=16
4949
CtaShape16x128x64_WarpShape16x32x64,
5050
CtaShape16x256x64_WarpShape16x64x64,
51-
51+
CtaShape16x256x64_WarpShape64x16x128,
5252
// Warp configs for M=32
5353
CtaShape32x128x64_WarpShape32x32x64,
5454

5555
// Warp configs for M=64
56+
CtaShape64x64x64_WarpShape32x32x64,
5657
CtaShape64x128x64_WarpShape32x64x64,
5758
CtaShape64x128x64_WarpShape64x32x64,
5859
CtaShape64x128x64_WarpShape64x64x64,
5960

6061
// Warp configs for M=128
62+
CtaShape128x64x64_WarpShape64x32x64,
6163
CtaShape128x128x64_WarpShape64x32x64,
6264
CtaShape128x128x64_WarpShape64x64x64,
6365
CtaShape128x128x64_WarpShape128x32x64,

paddle/phi/kernels/fusion/cutlass/cutlass_kernels/cutlass_heuristic.h

+5
Original file line number | Diff line number | Diff line change
@@ -60,9 +60,14 @@ static std::vector<CutlassTileConfig> get_candidate_tiles(
6060
};
6161
std::vector<CutlassTileConfig> quant_B_configs_sm80{
6262
CutlassTileConfig::CtaShape16x128x64_WarpShape16x32x64,
63+
CutlassTileConfig::CtaShape16x256x64_WarpShape16x64x64,
6364
CutlassTileConfig::CtaShape32x128x64_WarpShape32x32x64,
65+
CutlassTileConfig::CtaShape64x64x64_WarpShape32x32x64,
66+
CutlassTileConfig::CtaShape64x128x64_WarpShape64x32x64,
6467
CutlassTileConfig::CtaShape64x128x64_WarpShape64x64x64,
68+
CutlassTileConfig::CtaShape128x64x64_WarpShape64x32x64,
6569
CutlassTileConfig::CtaShape128x128x64_WarpShape64x64x64,
70+
CutlassTileConfig::CtaShape128x128x64_WarpShape128x32x64,
6671
CutlassTileConfig::CtaShape128x256x64_WarpShape64x64x64,
6772
};
6873
if (is_moe) {

0 commit comments

Comments
 (0)