diff --git a/vllm/model_executor/models/qwen3_vl.py b/vllm/model_executor/models/qwen3_vl.py index 1d3929b936a9..1076dcf2fb56 100644 --- a/vllm/model_executor/models/qwen3_vl.py +++ b/vllm/model_executor/models/qwen3_vl.py @@ -538,6 +538,7 @@ def forward( grid_thw_list = grid_thw grid_thw = np.array(grid_thw, dtype=np.int32) else: + grid_thw = grid_thw.to("cpu") grid_thw_list = grid_thw.tolist() grid_thw = grid_thw.numpy()