diff --git a/nemo_skills/inference/model/vllm.py b/nemo_skills/inference/model/vllm.py index c055f7c2bc..ad0c0ff1b7 100644 --- a/nemo_skills/inference/model/vllm.py +++ b/nemo_skills/inference/model/vllm.py @@ -76,6 +76,7 @@ def _build_completion_request_params( "logprobs": top_logprobs, "stream": stream, "echo": False, + "skip_special_tokens": False, "n": 1, "logit_bias": None, "frequency_penalty": 0.0, @@ -123,4 +124,3 @@ def _build_chat_request_params( request["allowed_openai_params"] = ["reasoning_effort"] request["reasoning_effort"] = reasoning_effort return request -