Skip to content

Commit c225a90

Browse files
author
Andrew Xia
committed
merge fixes
Signed-off-by: Andrew Xia <[email protected]>
1 parent 1584cb0 commit c225a90

File tree

2 files changed

+15
-20
lines changed

2 files changed

+15
-20
lines changed

vllm/entrypoints/context.py

Lines changed: 13 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -239,24 +239,21 @@ def __init__(
239239
self.chat_template_content_format = chat_template_content_format
240240
self.tool_dicts = tool_dicts
241241

242-
def append_output(
243-
self, output: RequestOutput | list[CustomChatCompletionMessageParam]
244-
) -> None:
242+
def append_output(self, output: RequestOutput) -> None:
245243
self.last_output = output
246-
if isinstance(output, RequestOutput):
247-
self.num_prompt_tokens = len(output.prompt_token_ids or [])
248-
self.num_cached_tokens = output.num_cached_tokens or 0
249-
self.num_output_tokens += len(output.outputs[0].token_ids or [])
250-
251-
# output_token_ids = output.outputs[0].token_ids
252-
# for token_id in output_token_ids:
253-
# self.parser.process(token_id)
254-
self.parser.process(output.outputs[0])
255-
else:
256-
self.parser.chat_completion_messages.extend(output)
244+
self.num_prompt_tokens = len(output.prompt_token_ids or [])
245+
self.num_cached_tokens = output.num_cached_tokens or 0
246+
self.num_output_tokens += len(output.outputs[0].token_ids or [])
257247

258-
def append_tool_output(self, output) -> None:
259-
raise NotImplementedError("Should not be called.")
248+
# output_token_ids = output.outputs[0].token_ids
249+
# for token_id in output_token_ids:
250+
# self.parser.process(token_id)
251+
self.parser.process(output.outputs[0])
252+
253+
def append_tool_output(
254+
self, output: list[CustomChatCompletionMessageParam]
255+
) -> None:
256+
self.parser.chat_completion_messages.extend(output)
260257

261258
def need_builtin_tool_call(self) -> bool:
262259
"""Return true if the last message is a MCP tool call"""

vllm/entrypoints/openai/parser/parser.py

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -54,10 +54,8 @@ def render_for_completion(self):
5454
pass
5555

5656
def process(self, output: CompletionOutput) -> "StreamableParser":
57-
reasoning_content, content = (
58-
self.reasoning_parser_instance.extract_reasoning_content(
59-
output.text, request=None
60-
)
57+
reasoning_content, content = self.reasoning_parser_instance.extract_reasoning(
58+
output.text, request=None
6159
)
6260
if reasoning_content:
6361
new_content = ChatCompletionContentPartTextParam(

0 commit comments

Comments
 (0)