diff --git a/tests/diffusion/distributed/test_sequence_parallel.py b/tests/diffusion/distributed/test_sequence_parallel.py index 9f76b3b75c5..f39bfd82a94 100644 --- a/tests/diffusion/distributed/test_sequence_parallel.py +++ b/tests/diffusion/distributed/test_sequence_parallel.py @@ -291,8 +291,7 @@ def test_sp_correctness(model_name: str): print("=" * 70) -# TODO: After PR#1272 is merged, add markers -# @pytest.mark.advanced_model +@pytest.mark.advanced_model @pytest.mark.diffusion @pytest.mark.parallel @hardware_test(res={"cuda": "L4", "rocm": "MI325"}, num_cards={"cuda": 4, "rocm": 2}) diff --git a/vllm_omni/diffusion/model_loader/gguf_adapters/base.py b/vllm_omni/diffusion/model_loader/gguf_adapters/base.py index 3bc38f16d96..5dc48f9a4c3 100644 --- a/vllm_omni/diffusion/model_loader/gguf_adapters/base.py +++ b/vllm_omni/diffusion/model_loader/gguf_adapters/base.py @@ -54,7 +54,7 @@ def weights_iterator(self) -> Generator[tuple[str, torch.Tensor], None, None]: raise NotImplementedError -# FIXME(Isotr0py): Sync implemnentation with upstream vLLM? +# FIXME(Isotr0py): Sync implementation with upstream vLLM? def gguf_quant_weights_iterator(gguf_file: str) -> Generator[tuple[str, torch.Tensor]]: """ Iterate over the quant weights in the model gguf files and convert