Skip to content

Commit f060ab9

Browse files
committed
fix typo
Signed-off-by: Siyuan Fu <[email protected]>
1 parent 7995977 commit f060ab9

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

csrc/trtllm_fused_moe_kernel_launcher.cu

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -369,7 +369,7 @@ void trtllm_fp8_per_tensor_scale_moe(
369369
auto const hidden_size = hidden_states.size(1);
370370
bool mUseDeepSeekFp8{false}; // FP8 per-tensor doesn't use DeepSeek FP8
371371

372-
std::vector<int32_t> mSupportedTileN = {8, 16, 32, 64, 128, 192, 256};
372+
std::vector<int32_t> mSupportedTileN = {8, 16, 32, 64, 128};
373373
std::set<int32_t> selected_tile_nums =
374374
computeSelectedTileN(mSupportedTileN, num_tokens, top_k, local_num_experts);
375375

@@ -1314,8 +1314,8 @@ Array<Array<int64_t>> trtllm_get_valid_moe_configs(
13141314
supported_tile_nums.push_back(128);
13151315
} else if (is_fp8_per_tensor) {
13161316
supported_tile_nums.push_back(128);
1317-
supported_tile_nums.push_back(192);
1318-
supported_tile_nums.push_back(256);
1317+
// supported_tile_nums.push_back(192);
1318+
// supported_tile_nums.push_back(256);
13191319
} else if (is_fp4_without_bf16_act) {
13201320
supported_tile_nums.push_back(128);
13211321
}

0 commit comments

Comments
 (0)