vllm-project · bitborne · May 18, 2026 · hsliuustc0106 · May 19, 2026
@@ -291,8 +291,7 @@ def test_sp_correctness(model_name: str):
     print("=" * 70)
 
 
-# TODO: After PR#1272 is merged, add markers
-# @pytest.mark.advanced_model
+@pytest.mark.advanced_model
 @pytest.mark.diffusion
 @pytest.mark.parallel
 @hardware_test(res={"cuda": "L4", "rocm": "MI325"}, num_cards={"cuda": 4, "rocm": 2})

@@ -54,7 +54,7 @@ def weights_iterator(self) -> Generator[tuple[str, torch.Tensor], None, None]:
         raise NotImplementedError
 
 
-# FIXME(Isotr0py): Sync implemnentation with upstream vLLM?
+# FIXME(Isotr0py): Sync implementation with upstream vLLM?
 def gguf_quant_weights_iterator(gguf_file: str) -> Generator[tuple[str, torch.Tensor]]:
     """
     Iterate over the quant weights in the model gguf files and convert