Skip to content

Commit 95fb025

Browse files
committed
Tokenizer to xpu
1 parent 9ff1cf8 commit 95fb025

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

backend/python/transformers/transformers_server.py

+3 -1
Original file line number | Diff line number | Diff line change
@@ -93,7 +93,7 @@ def LoadModel(self, request, context):
93 93
self.XPU = True
94 94
try:
95 95
print("Optimizing model", model_name, "to XPU.", file=sys.stderr)
96-
self.model = ipex.optimize_transformers(self.model, inplace=True, dtype=torch.float16, woq=True, device="xpu")
96+
self.model = ipex.optimize_transformers(self.model, inplace=True, dtype=torch.float16, device="xpu")
97 97
except Exception as err:
98 98
print("Not using XPU:", err, file=sys.stderr)
99 99

@@ -160,6 +160,8 @@ def Predict(self, request, context):
160 160
inputs = self.tokenizer(request.Prompt, return_tensors="pt").input_ids
161 161
if self.CUDA:
162 162
inputs = inputs.to("cuda")
163+
if XPU:
164+
inputs = inputs.to("xpu")
163 165

164 166
outputs = self.model.generate(inputs,max_new_tokens=max_tokens, temperature=request.Temperature, top_p=request.TopP)
165 167

0 commit comments

Comments
 (0)