diff --git a/onnxruntime/test/python/transformers/test_gqa.py b/onnxruntime/test/python/transformers/test_gqa.py index 9cbe2a01698ae..e800c22f92efb 100644 --- a/onnxruntime/test/python/transformers/test_gqa.py +++ b/onnxruntime/test/python/transformers/test_gqa.py @@ -1775,6 +1775,7 @@ def test_flash_decode_parity(self): del os.environ["ORT_DISABLE_FLASH_DECODE"] +@unittest.skipIf(not has_flash_attention(), "Flash Attention is not available, skipping tests.") class TestGQARegressions(unittest.TestCase): """Specific regression tests for historical bugs."""