diff --git a/vllm_omni/worker_v2/omni_model_runner.py b/vllm_omni/worker_v2/omni_model_runner.py index 31fb83dc947..e63be5636fc 100644 --- a/vllm_omni/worker_v2/omni_model_runner.py +++ b/vllm_omni/worker_v2/omni_model_runner.py @@ -281,7 +281,7 @@ def execute_model( if hasattr(self.model, "_last_captured_layers"): self.model._last_captured_layers = self._last_aux_output else: - raise TypeError(f"Unexpected model output type: {type(model_output)}") + hidden_states = model_output # ★ POST-FORWARD: per-request postprocess if not dummy_run and isinstance(hidden_states, torch.Tensor):