[Spyre-Next] Custom fixtures for upstream tests #884

tjohnson31415 · 2026-04-01T17:04:36Z

My AI questioning tells me that torch.device is a native C++ type defined by torch and that is why it is not possible to monkeypatch (some code using torch.device may even resolve fully at import time):
https://github.com/pytorch/pytorch/blob/main/torch/csrc/Device.cpp#L242

Yup, that's what I was running into. For some cases it's possible to patch it with a simple function, but there are a lot of usages likeisinstance(thing, torch.device) that expect torch.device to still be a class which I couldn't find a way to work around :/

-Original file line number
+Diff line change
@@ Expand Up / @@ -51,6 +51,8 @@ class AllowEntry: @@
             param_allows:    Parameter combinations to allow (whitelist). If specified,
                              only these parameter values will run.
             param_overrides: Parameter values to replace upstream defaults with.
+            fixture_names:   Fixture names to inject for this test (e.g. "foo" for a
+                             custom fixture that prints "hello world").
         """
         test: str
@@ Expand All / @@ -59,6 +61,7 @@ class AllowEntry: @@
         param_skips: tuple[ParamSkip, ...] = ()
         param_allows: tuple[ParamAllow, ...] = ()
         param_overrides: tuple[ParamOverride, ...] = ()
+        fixture_names: tuple[str, ...] = ()
     @dataclass(frozen=True)
@@ Expand Down @@

-Original file line number
+Diff line change
@@ Expand Up / @@ -43,6 +43,7 @@ @@
     from pathlib import Path
     import pytest
+    from vllm.v1.attention.backends.registry import AttentionBackendEnum
     import yaml
     from vllm_spyre_next.testing.models import (
@@ Expand Down Expand Up / @@ -119,6 +120,7 @@ def _parse_config(raw_tests: dict) -> UpstreamTestConfig: @@
                         param_skips=tuple(param_skips),
                         param_allows=tuple(param_allows),
                         param_overrides=tuple(param_overrides),
+                        fixture_names=tuple(allow.get("fixture_names", ())),
                     )
                 )
             block_list = [BlockEntry(test=b["test"]) for b in file_entry.get("block_list", [])]
@@ Expand Down Expand Up / @@ -325,6 +327,26 @@ def _prepare_upstream_tests_dir() -> Path: @@
         return tests_dir
+    def _temp_upstream_code_edits(upstream_tests_dir: Path):
+        """Apply small code edits to the upstream tests directory before importing.
+        These should be _temporary_ edits to source code for vllm tests while we work to make them more
+        portable. This should only be used where mocking is not possible or too cumbersome.
+        """
+        # Mocking out torch.device seems impossible to do (at least multiple rounds of Bob and Claude
+        # were unsuccessful). So we patch the source code to change the hardcoded
+        # `torch.device("cuda:0")` to `torch.device("cpu")`.
+        hardcoded_cuda_test_path = (
+            upstream_tests_dir / "v1" / "attention" / "test_attention_backends.py"
+        )
+        with open(hardcoded_cuda_test_path) as f:
+            content = f.read()
+        content = content.replace('torch.device("cuda:0")', 'torch.device("cpu")')
+        with open(hardcoded_cuda_test_path, "w") as f:
+            f.write(content)
     # ---------------------------------------------------------------------------
     # Pytest Hooks
     # ---------------------------------------------------------------------------
@@ Expand Down Expand Up / @@ -365,6 +387,7 @@ def pytest_configure(config): @@
             try:
                 # Clone vLLM to cache
                 upstream_tests_base = _prepare_upstream_tests_dir()
+                _temp_upstream_code_edits(upstream_tests_base)
                 config._upstream_tests_base = upstream_tests_base
                 # Determine which test paths to inject
@@ Expand Down Expand Up @@
             elif allow_entry.mode == "xfail_strict":
                 item.add_marker(pytest.mark.xfail(strict=True))
+            # Inject fixtures for tests that have fixture_names defined
+            for fixture_name in allow_entry.fixture_names:
+                item.fixturenames.append(fixture_name)
         # Reorder tests so that tests with "model" in the name run first
         _reorder_tests_by_name(items)
@@ Expand Down Expand Up / @@ -597,6 +624,33 @@ def should_do_global_cleanup_after_test(): @@
         return False
+    @pytest.fixture()
+    def patch_backend_list(request, monkeypatch):
+        """This fixture patches things for tests/v1/attention/test_attention_backends.py"""
+        # The BACKENDS_TO_TEST list has to be patched with only our backend
+        our_backend_list = [
+            AttentionBackendEnum.CUSTOM,
+        ]
+        test_module = request.node.module
+        monkeypatch.setattr(test_module, "BACKENDS_TO_TEST", our_backend_list)
+        # _test_backend_correctness may be called with a hardcoded AttentionBackendEnum.FLASH_ATTN,
+        # which we want to ignore
+        orig_tbc = test_module._test_backend_correctness
+        def tbc_wrapper(
+            batch_spec, model, backend_to_test: list[AttentionBackendEnum | str], *args, **kwargs
+        ):
+            if "AttentionBackendEnum.FLEX_ATTENTION" in str(backend_to_test):
+                return
+            return orig_tbc(batch_spec, model, backend_to_test, *args, **kwargs)
+        monkeypatch.setattr(test_module, "_test_backend_correctness", tbc_wrapper)
+        yield
     @pytest.hookimpl(tryfirst=True)
     def pytest_fixture_setup(fixturedef, request):
         """Override fixtures when running upstream vLLM tests."""
@@ Expand Down @@

-Original file line number
+Diff line change
@@ -1,7 +1,7 @@
     # Upstream test filter configuration for vllm-spyre-next.
     #
     # Only tests listed here will run from upstream vLLM. All other upstream
-    # tests are skipped by default (opt-in / whitelist model).
+    # tests are skipped by default (opt-in / allowlist model).
     #
     # block_list entries take precedence over allow_list entries.
     #
@@ Expand All / @@ -14,6 +14,9 @@ @@
     #                     Parameter name -> list of values to skip
     #   allow_list[].params.override
     #                     Parameter name -> replacement values (replaces upstream defaults)
+    #   allow_list[].fixture_names Fixture names to inject for this test.
+    #                              These fixtures are automatically added to the test's
+    #                              fixturenames during collection.
     #   block_list[].test fnmatch glob matched against test function name
     tests:
@@ Expand Down Expand Up / @@ -42,8 +45,18 @@ tests: @@
               tags: [facebook, upstream, uses_subprocess]
               params:
                 allow:  # skip every model except facebook/opt-125m
-                  model:
+                  model:
                   - facebook/opt-125m
-          block_list:
-            - test: "test_fused_rms_norm_quant"
+        - rel_path: tests/v1/attention/test_attention_backends.py
+          allow_list:
+            - test: "test_causal_backend_correctness"
+              mode: mandatory_pass
+              tags: [attention, upstream]
+              params:
+                allow:  # skip TP cases that we don't support
+                  tensor_parallel_size:
+                  - 1
+              fixture_names:
+              - "patch_backend_list"

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

[Spyre-Next] Custom fixtures for upstream tests #884

Diff view

Diff view

There are no files selected for viewing

tjohnson31415 Apr 1, 2026

Uh oh!

joerunde Apr 2, 2026

Uh oh!

Uh oh!

[Spyre-Next] Custom fixtures for upstream tests #884

Are you sure you want to change the base?

[Spyre-Next] Custom fixtures for upstream tests #884

Uh oh!

Uh oh!

Diff view

Diff view

There are no files selected for viewing

tjohnson31415 Apr 1, 2026

Choose a reason for hiding this comment

Uh oh!

joerunde Apr 2, 2026

Choose a reason for hiding this comment

Uh oh!

Uh oh!