NVIDIA · hyukn · Nov 26, 2025 · Nov 24, 2025 · Nov 26, 2025
@@ -66,7 +66,7 @@ repos:
         additional_dependencies:
         - tomli
         # add ignore words list
-        args: ["-L", "Mor,ans,thirdparty"]
+        args: ["-L", "Mor,ans,thirdparty", "--skip", "security_scanning/*"]
 -   repo: https://github.com/astral-sh/ruff-pre-commit
     rev: v0.9.4
     hooks:

@@ -300,9 +300,9 @@ def create_output(self, q: torch.Tensor, out_dtype: torch.dtype):
                  size_per_token // num_nvfp4_elements_per_container),
                 dtype=torch.uint8)
             # Create an SF (scaling factors) tensor for NVFP4 (use UINT8 as the container dtype).
-            output_sf = q.new_empty(compute_swizzled_sf_shape(
-                num_tokens, size_per_token // scaling_vector_size),
-                                    dtype=torch.uint8)
+            padded_row, padded_col = compute_swizzled_sf_shape(
+                num_tokens, size_per_token // scaling_vector_size)
+            output_sf = q.new_empty(padded_row * padded_col, dtype=torch.uint8)
         else:
             output = q.new_empty((num_tokens, self.num_heads * v_head_size),
                                  dtype=out_dtype)