From 56a8e8bcbb0a3fae90655d5eff84c9de62bb0413 Mon Sep 17 00:00:00 2001
From: Jishnu Ray Chowdhury
Date: Tue, 27 Jun 2023 23:53:05 -0500
Subject: [PATCH 1/2] Add abstraction for Custom Tokenizer

Related to https://github.com/vllm-project/vllm/issues/111

```
model = LLM(abcd)
model.set_tokenizer(custom_tokenizer)
```
---
 vllm/entrypoints/llm.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/vllm/entrypoints/llm.py b/vllm/entrypoints/llm.py
index d9079cc1a7b9..fb1c1d197c9d 100644
--- a/vllm/entrypoints/llm.py
+++ b/vllm/entrypoints/llm.py
@@ -60,6 +60,11 @@ def get_tokenizer(
     ) -> Union[PreTrainedTokenizer, PreTrainedTokenizerFast]:
         return self.llm_engine.tokenizer
 
+    def set_tokenizer(
+        self, tokenizer: Union[PreTrainedTokenizer, PreTrainedTokenizerFast]
+    ):
+        self.llm_engine.tokenizer = tokenizer
+
     def generate(
         self,
         prompts: Optional[Union[str, List[str]]] = None,

From 582692d4cbe8cea02ea2d889a9fdd1dd5f753179 Mon Sep 17 00:00:00 2001
From: Jishnu Ray Chowdhury
Date: Wed, 28 Jun 2023 01:48:18 -0500
Subject: [PATCH 2/2] Update vllm/entrypoints/llm.py

Co-authored-by: Woosuk Kwon
---
 vllm/entrypoints/llm.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/vllm/entrypoints/llm.py b/vllm/entrypoints/llm.py
index fb1c1d197c9d..1895103b123a 100644
--- a/vllm/entrypoints/llm.py
+++ b/vllm/entrypoints/llm.py
@@ -61,8 +61,9 @@ def get_tokenizer(
         return self.llm_engine.tokenizer
 
     def set_tokenizer(
-        self, tokenizer: Union[PreTrainedTokenizer, PreTrainedTokenizerFast]
-    ):
+        self,
+        tokenizer: Union[PreTrainedTokenizer, PreTrainedTokenizerFast],
+    ) -> None:
         self.llm_engine.tokenizer = tokenizer
 
     def generate(