Skip to content

Commit 7217db5

Browse files
committed
Disable useSingleBlock
1 parent 903591c commit 7217db5

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

csrc/trtllm_fused_moe_routing_renormalize.cu

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -434,7 +434,9 @@ void run(Data const& data, void* stream) {
434434
TVM_FFI_ICHECK_EQ(data.mNumExperts % 4, 0)
435435
<< "Routing kernel expects #experts " << data.mNumExperts << " to be a multiple of 4.";
436436

437-
bool const useSingleBlock = data.mNumTokens <= BlockKernelMaxNumTokens;
437+
// FIXME: routingIndicesBlockKernel breaks the vllm + gpt-oss DeepEP
438+
// bool const useSingleBlock = data.mNumTokens <= BlockKernelMaxNumTokens;
439+
bool const useSingleBlock = false;
438440

439441
bool const useSingleCluster =
440442
data.mNumTokens <= ((data.mPtrScores != nullptr || data.mPtrTopKIds != nullptr)

0 commit comments

Comments
 (0)