Lint and revert some changes

jiahanc · jiahanc · commit 0f332304716b · 2025-10-18T13:39:41.000-07:00
Signed-off-by: jiahanc <173873397+jiahanc@users.noreply.github.com>
diff --git a/csrc/trtllm_batched_gemm_runner.cu b/csrc/trtllm_batched_gemm_runner.cu
@@ -169,6 +169,7 @@ void TrtllmGenBatchedGemmRunner::run(
   auto const configs = bmm.getBatchedGemmConfigs();
 
   auto const& config = configs[configIndex];
+
   FLASHINFER_CHECK(numBatches > 0, "Batched GEMM requires numBatches > 0");
   if (!mOptions.staticBatch) {
     FLASHINFER_CHECK(totalNumPaddedTokens,
diff --git a/include/flashinfer/trtllm/fused_moe/RoutingKernelTopK.cuh b/include/flashinfer/trtllm/fused_moe/RoutingKernelTopK.cuh
@@ -217,7 +217,7 @@ __forceinline__ __device__ void reduceTopK(cg::thread_block_tile<WarpSize> const
 
     for (int ii = 0; ii < numResults; ++ii) {
       topKBufferValue[ii] = minValue;
-      topKBufferIdx[ii] = ii * WarpSize - 1;  //@todo: check if this is correct
+      topKBufferIdx[ii] = ii * WarpSize - 1;
     }
     for (int loop = 0; loop < numLoops; ++loop) {
       int start = loop * 4;
diff --git a/tests/moe/test_trtllm_gen_fused_moe.py b/tests/moe/test_trtllm_gen_fused_moe.py
@@ -1914,7 +1914,7 @@ def cache_permute_indices():
                 "routed_scaling": None,
                 "has_routing_bias": False,
                 "routing_method_type": RoutingMethodType.Renormalize,
-                "compatible_moe_impls": [FP8BlockScaleMoe, FP4Moe],
+                "compatible_moe_impls": [FP8BlockScaleMoe, FP8PerTensorMoe, FP4Moe],
             },
             id="Renorm",
             marks=pytest.mark.skip(

Original file line number	Diff line number	Diff line change
`@@ -217,7 +217,7 @@ __forceinline__ __device__ void reduceTopK(cg::thread_block_tile<WarpSize> const`
`217`	`217`
`218`	`218`	`for (int ii = 0; ii < numResults; ++ii) {`
`219`	`219`	`topKBufferValue[ii] = minValue;`
`220`		`- topKBufferIdx[ii] = ii * WarpSize - 1; //@todo: check if this is correct`
	`220`	`+ topKBufferIdx[ii] = ii * WarpSize - 1;`
`221`	`221`	`}`
`222`	`222`	`for (int loop = 0; loop < numLoops; ++loop) {`
`223`	`223`	`int start = loop * 4;`