diff --git a/tests/conftest.py b/tests/conftest.py index 294805a8164f..27724b9c111a 100644 --- a/tests/conftest.py +++ b/tests/conftest.py @@ -33,6 +33,7 @@ from vllm.logger import init_logger from vllm.outputs import RequestOutput from vllm.sampling_params import BeamSearchParams +from vllm.transformers_utils.utils import maybe_model_redirect from vllm.utils import cuda_device_count_stateless logger = init_logger(__name__) @@ -318,6 +319,7 @@ def __init__( skip_tokenizer_init: bool = False, auto_cls: type[_BaseAutoModelClass] = AutoModelForCausalLM, ) -> None: + model_name = maybe_model_redirect(model_name) self.model_name = model_name self.config = AutoConfig.from_pretrained(