recipe for vllm #24710
Closed
Changes from all commits (70 commits)
67a8dc7  recipe for vllm (mediocretech)
a3e6578  fixed ray conda package name ref (mediocretech)
de9e058  moved to ray-core (mediocretech)
ba1d0dd  Update build_steps.sh (mediocretech)
f62f10c  GPU requirement (mediocretech)
68f4f5f  Build compiler deps (mediocretech)
d27b5eb  setting ninja max jobs in attempt to stop build cycling (mediocretech)
4f19559  added overlink requirements (mediocretech)
911519a  libtorch_python overlink (mediocretech)
b932232  latest source version (mediocretech)
e68a28c  sha mismatch (mediocretech)
8c0a076  build test (mediocretech)
b5ae846  lint (mediocretech)
2aeb452  debugging; trying remove build for yaml formating issue (mediocretech)
942f98f  simplified build (mediocretech)
acaf85c  Update build_steps.sh (mediocretech)
a2d33d7  lowered build version due to pytorch version requirement not in conda… (mediocretech)
f9d9e2d  removed pip check due to conda-forge version differences (mediocretech)
000f766  returned pip check, runaway build (mediocretech)
c2d4774  Merge branch 'main' into vllm (mediocretech)
bd0f153  No test for pip check (mediocretech)
4307b81  Merge branch 'main' into vllm (mediocretech)
2b0bce6  updated dependancy list (mediocretech)
6e10d68  the more, the merrier (mediocretech)
bfba786  Merge branch 'main' into vllm (mediocretech)
a5ca474  no noarch (mediocretech)
04064e1  Merge branch 'vllm' of github.com:mediocretech/staged-recipes into vllm (mediocretech)
dc76ebb  torch is needed for build (mediocretech)
33b4b2f  add vllm (iamthebot)
d5ec5f2  Merge branch 'vllm' into al--vllm (iamthebot)
35b4ff9  Merge branch 'main' into vllm (mediocretech)
388a4fa  Merge branch 'vllm' into al--vllm (mediocretech)
ef0472c  Merge pull request #1 from iamthebot/al--vllm (mediocretech)
43e2dbc  whitelist libcuda (mediocretech)
4f5d04b  Merge branch 'main' into vllm (mediocretech)
a6b1e5f  force build (mediocretech)
593f989  Merge branch 'main' into vllm (mediocretech)
42b1ba3  Merge branch 'main' into vllm (mediocretech)
671910b  Merge branch 'main' into vllm (mediocretech)
ae258f4  worth a shot (mediocretech)
7a6e5e5  Merge branch 'main' into vllm (mediocretech)
6e50aa8  Merge branch 'main' into vllm (mediocretech)
6435f40  Merge branch 'main' into vllm (mediocretech)
0a9a043  simplified build deps (mediocretech)
c41c3bf  libcusparse (mediocretech)
2742768  removed libcuseparse from build (mediocretech)
42350b4  libcusparse-dev (mediocretech)
27ea238  versioning for cusparse (mediocretech)
49a3b5e  touchvision dep (mediocretech)
b122ae9  version bump (mediocretech)
2101b09  updated sha for newer version (mediocretech)
eae0ea1  triton runtime req (mediocretech)
6b9c7fc  Merge branch 'main' into vllm (mediocretech)
8738492  latest conda-build is incompatible (mediocretech)
3a0dcdc  update to latest release (mediocretech)
2a25f9b  unpinned dependancies for latest vllm release (mediocretech)
a5a87d9  corrected sha for 0.5.3 (mediocretech)
bf73d7e  Update requirements.txt (mediocretech)
7281d5f  Merge branch 'main' into vllm (mediocretech)
89e18d0  hope for the future...0.6.2 (mediocretech)
2a8254d  hash for 0.6.2 (mediocretech)
c5b616c  Merge branch 'main' into vllm (mediocretech)
ab8ff82  setuptools_scm (mediocretech)
c843952  changes to build (mediocretech)
a4f65c0  0.6.4 bump (mediocretech)
72aa925  hash update (mediocretech)
d8ab547  build is now 3.12 (mediocretech)
328c5bd  Merge branch 'main' into vllm (mediocretech)
aabea76  latest version (mediocretech)
36650d7  hash update (mediocretech)
build_steps.sh (new file):

```bash
#!/bin/bash -e

# Limit parallel compile jobs to keep the CI build from exhausting memory
export MAX_JOBS=1
# needed to find libcrypt headers
export CPATH=${BUILD_PREFIX}/include
export VLLM_TARGET_DEVICE="cuda"

${PYTHON} use_existing_torch.py
${PYTHON} -m pip install . -vv --no-deps --no-build-isolation
```

(The original script passed `--no-deps` twice; the duplicate is dropped here.)
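The `MAX_JOBS=1` export is the knob that PyTorch's C++/CUDA extension builder (and hence vLLM's `setup.py`) reads to cap parallel `ninja` jobs; commit d27b5eb added it to stop the build from cycling. A minimal sketch of that pattern, assuming the standard `MAX_JOBS` fallback behavior (`ninja_cmd` is an illustrative name, not part of vLLM):

```python
import os

# Mirror what the build script exports
os.environ["MAX_JOBS"] = "1"

# torch.utils.cpp_extension-style fallback: use the CPU count when MAX_JOBS is unset
max_jobs = int(os.environ.get("MAX_JOBS", os.cpu_count() or 1))

# The extension builder ultimately invokes ninja with an explicit job cap
ninja_cmd = ["ninja", f"-j{max_jobs}"]
```

With `MAX_JOBS=1` this yields `ninja -j1`, trading build speed for a bounded memory footprint on the CI workers.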
meta.yaml (new file):

```yaml
{% set name = "vllm" %}
{% set version = "0.8.1" %}

package:
  name: {{ name|lower }}
  version: {{ version }}

source:
  url: https://pypi.io/packages/source/{{ name[0] }}/{{ name }}/vllm-{{ version }}.tar.gz
  sha256: 03d641f10d0181b630243c096484da0b5fdf608befe026af831ab87a51c09ab1

build:
  # noarch: python
  rpaths:
    - lib/
  script_env:
    - TORCH_CUDA_ARCH_LIST=3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX      # [cuda_compiler_version == "11.2"]
    - TORCH_CUDA_ARCH_LIST=3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6;8.9+PTX  # [cuda_compiler_version == "11.8"]
    - TORCH_CUDA_ARCH_LIST=5.0;6.0;6.1;7.0;7.5;8.0;8.6;8.9;9.0+PTX  # [(cuda_compiler_version or "").startswith("12")]
  number: 0
  skip: True  # [cuda_compiler_version == "None"]
  skip: True  # [osx or win]
  skip: True  # [py < 312]
  missing_dso_whitelist:
    - '*/libtorch_python.so'
    - '*/libcuda.so.1'

requirements:
  build:
    - cmake
    - make
    - {{ stdlib("c") }}
    - {{ compiler('c') }}
    - {{ compiler('cxx') }}
    - {{ compiler('cuda') }}
  host:
    - cuda-version {{ cuda_compiler_version }}
    - python
    - ninja
    - packaging
    - setuptools
    - setuptools-scm
    - pytorch
    - torchvision
    - wheel
    - pip
    - libxcrypt
  run:
    - python
    - ninja
    - psutil
    # - ray-core >=2.9.0
    - pandas
    - pyarrow
    - sentencepiece
    - numpy
    - einops
    - pytorch
    - transformers >=4.34.0
    - xformers
    - fastapi
    - uvicorn
    - pydantic
    - aioprometheus
    - prometheus_client
    - triton
    # - libtorch
    # - cuda-version {{ cuda_compiler_version }}  # [cuda_compiler_version != "None"]
    # - cuda-cupti-dev   # [(cuda_compiler_version or "").startswith("12")]
    # - cuda-cudart-dev  # [(cuda_compiler_version or "").startswith("12")]
    # - cuda-nvml-dev    # [(cuda_compiler_version or "").startswith("12")]
    # - cuda-nvtx-dev    # [(cuda_compiler_version or "").startswith("12")]
    # - libstdcxx-ng
    # - libgcc-ng
    # - libxcrypt

test:
  imports:
    - vllm
  # commands:
  #   - pip check
  requires:
    - pip

about:
  home: https://github.com/vllm-project/vllm
  summary: A high-throughput and memory-efficient inference and serving engine for LLMs
  license: Apache-2.0
  license_file: LICENSE

extra:
  recipe-maintainers:
    - mediocretech
    - iamthebot
```
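Several commits in the history ("sha mismatch", "hash update", "corrected sha for 0.5.3") were purely about keeping the recipe's `source.sha256` in sync with the Jinja-templated URL as the pinned version moved. A sketch of how that template expands and how a digest is computed with the standard library (the hashed bytes here are a stand-in, not the real vllm tarball):

```python
import hashlib

name = "vllm"
version = "0.8.1"

# Expansion of the recipe's Jinja template:
# https://pypi.io/packages/source/{{ name[0] }}/{{ name }}/vllm-{{ version }}.tar.gz
url = f"https://pypi.io/packages/source/{name[0]}/{name}/{name}-{version}.tar.gz"

# The recipe's sha256 field must equal the digest of the downloaded tarball.
# Stand-in bytes (empty) are hashed here instead of the real archive.
digest = hashlib.sha256(b"").hexdigest()
```

When bumping `version`, re-downloading the tarball and recomputing this digest is what keeps conda-build's source verification from failing.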