vllm-project · staugust · Feb 12, 2026 · gemini-code-assist · Feb 12, 2026
@@ -103,7 +103,7 @@ async def create_pooling(
                         "offline inference example for more details."
                     )
 
-                validated_prompt = self.io_processor.parse_data(request.data)
+                validated_prompt = self.io_processor.parse_data(request)
 
                 raw_prompts = await self.io_processor.pre_process_async(
                     prompt=validated_prompt, request_id=request_id