Skip to content

Commit 99e67e6

Browse files
authored
chore: update dynamo and nixl versions for 0.3.1 (#1517)
1 parent 50afb81 commit 99e67e6

File tree

10 files changed

+41
-41
lines changed

10 files changed

+41
-41
lines changed

Cargo.lock

Lines changed: 13 additions & 13 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ members = [
2828
resolver = "3"
2929

3030
[workspace.package]
31-
version = "0.3.0"
31+
version = "0.3.1"
3232
edition = "2021"
3333
description = "Dynamo Inference Framework"
3434
authors = ["NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"]
@@ -39,9 +39,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]
3939

4040
[workspace.dependencies]
4141
# Local crates
42-
dynamo-runtime = { path = "lib/runtime", version = "0.3.0" }
43-
dynamo-llm = { path = "lib/llm", version = "0.3.0" }
44-
dynamo-tokens = { path = "lib/tokens", version = "0.3.0" }
42+
dynamo-runtime = { path = "lib/runtime", version = "0.3.1" }
43+
dynamo-llm = { path = "lib/llm", version = "0.3.1" }
44+
dynamo-tokens = { path = "lib/tokens", version = "0.3.1" }
4545

4646
# External dependencies
4747
anyhow = { version = "1" }

container/Dockerfile.vllm

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -178,7 +178,7 @@ RUN uv pip install /workspace/wheels/nixl/*.whl
178178
ARG VLLM_REF="0.8.4"
179179
ARG VLLM_PATCH="vllm_v${VLLM_REF}-dynamo-kv-disagg-patch.patch"
180180
ARG VLLM_PATCHED_PACKAGE_NAME="ai_dynamo_vllm"
181-
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post2"
181+
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post3"
182182
ARG VLLM_MAX_JOBS=4
183183
RUN --mount=type=bind,source=./container/deps/,target=/tmp/deps \
184184
--mount=type=cache,target=/root/.cache/uv \

container/build.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -109,7 +109,7 @@ NONE_BASE_IMAGE_TAG="24.04"
109109
SGLANG_BASE_IMAGE="nvcr.io/nvidia/cuda-dl-base"
110110
SGLANG_BASE_IMAGE_TAG="25.01-cuda12.8-devel-ubuntu24.04"
111111

112-
NIXL_COMMIT=f531404be4866d85ed618b3baf4008c636798d63
112+
NIXL_COMMIT=16348080f5bdeb9fe6058a23be140cec020ef3f3
113113
NIXL_REPO=ai-dynamo/nixl.git
114114

115115
NIXL_UCX_EFA_REF=7ec95b95e524a87e81cac92f5ca8523e3966b16b

docs/support_matrix.md

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -68,24 +68,24 @@ If you are using a **GPU**, the following GPU models and architectures are suppo
6868

6969
### Runtime Dependency
7070

71-
| **Python Package** | **Version** | glibc version | CUDA Version |
72-
| :----------------- | :------------ | :------------------- | :----------- |
73-
| ai-dynamo | 0.3.0 | >=2.28 | |
74-
| ai-dynamo-runtime | 0.3.0 | >=2.28 | |
75-
| ai-dynamo-vllm | 0.8.4.post2¹ | >=2.28 (recommended) | |
76-
| NIXL | 0.3.0 | >=2.27 | >=11.8 |
71+
| **Python Package** | **Version** | glibc version | CUDA Version |
72+
| :----------------- | :------------ | :----------------------------------- | :----------- |
73+
| ai-dynamo | 0.3.1 | >=2.28 | |
74+
| ai-dynamo-runtime | 0.3.1 | >=2.28 (Python 3.12 has known issues) | |
75+
| ai-dynamo-vllm | 0.8.4.post3¹ | >=2.28 (recommended) | |
76+
| NIXL | 0.3.1 | >=2.27 | >=11.8 |
7777

7878
### Build Dependency
7979

8080
| **Build Dependency** | **Version** |
8181
| :------------------- | :------------------------------------------------------------------------------- |
8282
| **Base Container** | [25.03](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda-dl-base/tags) |
83-
| **ai-dynamo-vllm** | 0.8.4.post2¹ |
84-
| **TensorRT-LLM** | 0.19.0² |
85-
| **NIXL** | 0.3.0 |
83+
| **ai-dynamo-vllm** | 0.8.4.post3¹ |
84+
| **TensorRT-LLM** | 0.21.0rc² |
85+
| **NIXL** | 0.3.1 |
8686

8787
> [!Important]
88-
> ¹ ai-dynamo-vllm `v0.8.4.post2` is a customized patch of `v0.8.4` from vLLM.
88+
> ¹ ai-dynamo-vllm `v0.8.4.post3` is a customized patch of `v0.8.4` from vLLM.
8989
>
9090
> ² Specific versions of TensorRT-LLM supported by Dynamo are subject to change.
9191

lib/bindings/python/Cargo.lock

Lines changed: 5 additions & 5 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

lib/bindings/python/Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@
1919

2020
[package]
2121
name = "dynamo-py3"
22-
version = "0.3.0"
22+
version = "0.3.1"
2323
edition = "2021"
2424
authors = ["NVIDIA"]
2525
license = "Apache-2.0"

lib/runtime/examples/Cargo.lock

Lines changed: 3 additions & 3 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

lib/runtime/examples/Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@ members = [
2121
resolver = "3"
2222

2323
[workspace.package]
24-
version = "0.3.0"
24+
version = "0.3.1"
2525
edition = "2021"
2626
authors = ["NVIDIA"]
2727
license = "Apache-2.0"

pyproject.toml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515

1616
[project]
1717
name = "ai-dynamo"
18-
version = "0.3.0"
18+
version = "0.3.1"
1919
description = "Distributed Inference Framework"
2020
readme = "README.md"
2121
authors = [
@@ -28,7 +28,7 @@ dependencies = [
2828
"pytest>=8.3.4",
2929
"types-psutil==7.0.0.20250218",
3030
"kubernetes==32.0.1",
31-
"ai-dynamo-runtime==0.3.0",
31+
"ai-dynamo-runtime==0.3.1",
3232
"fastapi==0.115.6",
3333
"distro",
3434
# filelock: required by planner

0 commit comments

Comments
 (0)