Skip to content

Commit 0f33230

Browse files
committed
lint and revert some change
Signed-off-by: jiahanc <[email protected]>
1 parent 83dfa85 commit 0f33230

File tree

3 files changed

+3 -2 lines changed

3 files changed

+3 -2 lines changed

csrc/trtllm_batched_gemm_runner.cu

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -169,6 +169,7 @@ void TrtllmGenBatchedGemmRunner::run(
169 169   auto const configs = bmm.getBatchedGemmConfigs();
170 170
171 171   auto const& config = configs[configIndex];
    172 +
172 173   FLASHINFER_CHECK(numBatches > 0, "Batched GEMM requires numBatches > 0");
173 174   if (!mOptions.staticBatch) {
174 175   FLASHINFER_CHECK(totalNumPaddedTokens,

include/flashinfer/trtllm/fused_moe/RoutingKernelTopK.cuh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -217,7 +217,7 @@ __forceinline__ __device__ void reduceTopK(cg::thread_block_tile<WarpSize> const
217 217
218 218   for (int ii = 0; ii < numResults; ++ii) {
219 219   topKBufferValue[ii] = minValue;
220     - topKBufferIdx[ii] = ii * WarpSize - 1; //@todo: check if this is correct
    220 + topKBufferIdx[ii] = ii * WarpSize - 1;
221 221   }
222 222   for (int loop = 0; loop < numLoops; ++loop) {
223 223   int start = loop * 4;

tests/moe/test_trtllm_gen_fused_moe.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1914,7 +1914,7 @@ def cache_permute_indices():
1914 1914   "routed_scaling": None,
1915 1915   "has_routing_bias": False,
1916 1916   "routing_method_type": RoutingMethodType.Renormalize,
1917      - "compatible_moe_impls": [FP8BlockScaleMoe, FP4Moe],
     1917 + "compatible_moe_impls": [FP8BlockScaleMoe, FP8PerTensorMoe, FP4Moe],
1918 1918   },
1919 1919   id="Renorm",
1920 1920   marks=pytest.mark.skip(

0 commit comments

Comments
 (0)