Skip to content

Commit c232339

Browse files
committed
chore: update dynamo and nixl versions for 0.3.1
1 parent b051a21 commit c232339

File tree

11 files changed

+42
-42
lines changed

11 files changed

+42
-42
lines changed

Cargo.lock

Lines changed: 13 additions & 14 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ members = [
2828
resolver = "3"
2929

3030
[workspace.package]
31-
version = "0.3.0"
31+
version = "0.3.1"
3232
edition = "2021"
3333
description = "Dynamo Inference Framework"
3434
authors = ["NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"]
@@ -39,9 +39,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]
3939

4040
[workspace.dependencies]
4141
# Local crates
42-
dynamo-runtime = { path = "lib/runtime", version = "0.3.0" }
43-
dynamo-llm = { path = "lib/llm", version = "0.3.0" }
44-
dynamo-tokens = { path = "lib/tokens", version = "0.3.0" }
42+
dynamo-runtime = { path = "lib/runtime", version = "0.3.1" }
43+
dynamo-llm = { path = "lib/llm", version = "0.3.1" }
44+
dynamo-tokens = { path = "lib/tokens", version = "0.3.1" }
4545

4646
# External dependencies
4747
anyhow = { version = "1" }

container/Dockerfile.vllm

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -178,7 +178,7 @@ RUN uv pip install /workspace/wheels/nixl/*.whl
178178
ARG VLLM_REF="0.8.4"
179179
ARG VLLM_PATCH="vllm_v${VLLM_REF}-dynamo-kv-disagg-patch.patch"
180180
ARG VLLM_PATCHED_PACKAGE_NAME="ai_dynamo_vllm"
181-
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post2"
181+
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post3"
182182
ARG VLLM_MAX_JOBS=4
183183
RUN --mount=type=bind,source=./container/deps/,target=/tmp/deps \
184184
--mount=type=cache,target=/root/.cache/uv \

container/build.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -109,7 +109,7 @@ NONE_BASE_IMAGE_TAG="24.04"
109109
SGLANG_BASE_IMAGE="nvcr.io/nvidia/cuda-dl-base"
110110
SGLANG_BASE_IMAGE_TAG="25.01-cuda12.8-devel-ubuntu24.04"
111111

112-
NIXL_COMMIT=f531404be4866d85ed618b3baf4008c636798d63
112+
NIXL_COMMIT=16348080f5bdeb9fe6058a23be140cec020ef3f3
113113
NIXL_REPO=ai-dynamo/nixl.git
114114

115115
NIXL_UCX_EFA_REF=7ec95b95e524a87e81cac92f5ca8523e3966b16b

docs/support_matrix.md

Lines changed: 9 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -64,21 +64,22 @@ For **Linux**, the **ARM64** support is experimental and may have limitations. W
6464
### Runtime Dependency
6565
| **Python Package** | **Version** | glibc version | CUDA Version |
6666
|--------------------|---------------|----------------------|--------------|
67-
| ai-dynamo | 0.3.0 | >=2.28 | |
68-
| ai-dynamo-runtime | 0.3.0 | >=2.28 | |
69-
| ai-dynamo-vllm | 0.8.4.post2* | >=2.28 (recommended) | |
70-
| NIXL | 0.3.0 | >=2.27 | >=11.8 |
67+
| ai-dynamo | 0.3.1 | >=2.28 | |
68+
| ai-dynamo-runtime | 0.3.1 | >=2.28 (Python 3.12 has known issues) | |
69+
| ai-dynamo-vllm | 0.8.4.post3* | >=2.28 (recommended) | |
70+
| NIXL | 0.3.1 | >=2.27 | >=11.8 |
71+
7172

7273
### Build Dependency
7374
| **Build Dependency** | **Version** |
7475
|----------------------|-------------|
7576
| **Base Container** | [25.03](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda-dl-base/tags) |
76-
| **ai-dynamo-vllm** |0.8.4.post2* |
77-
| **TensorRT-LLM** | 0.19.0** |
78-
| **NIXL** | 0.3.0 |
77+
| **ai-dynamo-vllm** | 0.8.4.post3* |
78+
| **TensorRT-LLM** | 0.21.0rc** |
79+
| **NIXL** | 0.3.1 |
7980

8081
```{note}
81-
*ai-dynamo-vllm v0.8.4.post2 is a customized patch of v0.8.4 from vLLM.
82+
*ai-dynamo-vllm v0.8.4.post3 is a custom-patched build based on vLLM v0.8.4.
8283
8384
**Specific versions of TensorRT-LLM supported by Dynamo are subject to change.
8485
```

lib/bindings/python/Cargo.lock

Lines changed: 5 additions & 6 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

lib/bindings/python/Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@
1919

2020
[package]
2121
name = "dynamo-py3"
22-
version = "0.3.0"
22+
version = "0.3.1"
2323
edition = "2021"
2424
authors = ["NVIDIA"]
2525
license = "Apache-2.0"

lib/llm/Cargo.toml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -81,7 +81,8 @@ regex = "1"
8181
rayon = "1"
8282

8383
# block_manager
84-
nixl-sys = { version = "0.3.0-rc.2", optional = true }
84+
# TODO: switch nixl-sys from the git revision below to the crates.io 0.3.1 release once it is published
85+
nixl-sys = {git = "https://github.com/ai-dynamo/nixl", rev = "16348080f5bdeb9fe6058a23be140cec020ef3f3", optional = true }
8586
cudarc = { version = "0.16.2", features = ["cuda-12020"], optional = true }
8687
ndarray = { version = "0.16", optional = true }
8788
nix = { version = "0.26", optional = true }

lib/runtime/examples/Cargo.lock

Lines changed: 3 additions & 3 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

lib/runtime/examples/Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@ members = [
2121
resolver = "3"
2222

2323
[workspace.package]
24-
version = "0.3.0"
24+
version = "0.3.1"
2525
edition = "2021"
2626
authors = ["NVIDIA"]
2727
license = "Apache-2.0"

0 commit comments

Comments
 (0)