diff --git a/vllm/entrypoints/pooling/pooling/serving.py b/vllm/entrypoints/pooling/pooling/serving.py index 5c5d649f67fd..2d04d4e1462e 100644 --- a/vllm/entrypoints/pooling/pooling/serving.py +++ b/vllm/entrypoints/pooling/pooling/serving.py @@ -103,7 +103,7 @@ async def create_pooling( "offline inference example for more details." ) - validated_prompt = self.io_processor.parse_data(request.data) + validated_prompt = self.io_processor.parse_data(request) raw_prompts = await self.io_processor.pre_process_async( prompt=validated_prompt, request_id=request_id