vllm-project · wangxiyuan · Jan 5, 2026 · Dec 15, 2025 · Dec 15, 2025 · Dec 15, 2025
diff --git a/pyproject.toml b/pyproject.toml
@@ -27,7 +27,8 @@ requires = [
     "numba",
     "fastapi<0.124.0",
     "opencv-python-headless<=4.11.0.86", # Required to avoid numpy version conflict with vllm
-    "compressed_tensors>=0.11.0"
+    "compressed_tensors>=0.11.0",
+    "arctic-inference==0.1.1", # Keep in sync with the matching pin in the requirements file
 ]
 build-backend = "setuptools.build_meta"
 

@@ -30,5 +30,6 @@ numba
 #--extra-index-url https://mirrors.huaweicloud.com/ascend/repos/pypi
 torch-npu==2.8.0
 
+arctic-inference==0.1.1
 transformers>=4.57.3
 fastapi<0.124.0