Skip to content
Closed
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Next commit
chore: update dynamo and nixl versions for 0.3.0 (#1240)
  • Loading branch information
nv-anants committed May 29, 2025
commit 50971b7d079a7fe5d44fbf76378ab7826c28d2f1
64 changes: 38 additions & 26 deletions Cargo.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

8 changes: 4 additions & 4 deletions Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@ members = [
resolver = "3"

[workspace.package]
version = "0.2.1"
version = "0.3.0"
edition = "2021"
description = "Dynamo Inference Framework"
authors = ["NVIDIA Inc. <[email protected]>"]
Expand All @@ -39,9 +39,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]

[workspace.dependencies]
# Local crates
dynamo-runtime = { path = "lib/runtime", version = "0.2.1" }
dynamo-llm = { path = "lib/llm", version = "0.2.1" }
dynamo-tokens = { path = "lib/tokens", version = "0.2.1" }
dynamo-runtime = { path = "lib/runtime", version = "0.3.0" }
dynamo-llm = { path = "lib/llm", version = "0.3.0" }
dynamo-tokens = { path = "lib/tokens", version = "0.3.0" }

# External dependencies
anyhow = { version = "1" }
Expand Down
2 changes: 1 addition & 1 deletion container/Dockerfile.vllm
Original file line number Diff line number Diff line change
Expand Up @@ -169,7 +169,7 @@ RUN uv pip install /workspace/wheels/nixl/*.whl
ARG VLLM_REF="0.8.4"
ARG VLLM_PATCH="vllm_v${VLLM_REF}-dynamo-kv-disagg-patch.patch"
ARG VLLM_PATCHED_PACKAGE_NAME="ai_dynamo_vllm"
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post1"
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post2"
ARG VLLM_MAX_JOBS=4
RUN --mount=type=bind,source=./container/deps/,target=/tmp/deps \
--mount=type=cache,target=/root/.cache/uv \
Expand Down
2 changes: 1 addition & 1 deletion container/build.sh
Original file line number Diff line number Diff line change
Expand Up @@ -109,7 +109,7 @@ NONE_BASE_IMAGE_TAG="24.04"
SGLANG_BASE_IMAGE="nvcr.io/nvidia/cuda-dl-base"
SGLANG_BASE_IMAGE_TAG="25.01-cuda12.8-devel-ubuntu24.04"

NIXL_COMMIT=78695c2900cd7fff506764377386592dfc98e87e
NIXL_COMMIT=f531404be4866d85ed618b3baf4008c636798d63
NIXL_REPO=ai-dynamo/nixl.git

NO_CACHE=""
Expand Down
14 changes: 7 additions & 7 deletions docs/support_matrix.md
Original file line number Diff line number Diff line change
Expand Up @@ -62,21 +62,21 @@ For **Linux**, the **ARM64** support is experimental and may have limitations. W
### Runtime Dependency
| **Python Package** | **Version** | glibc version | CUDA Version |
|--------------------|---------------|----------------------|--------------|
| ai-dynamo | 0.2.1 | >=2.28 | |
| ai-dynamo-runtime | 0.2.1 | >=2.28 | |
| ai-dynamo-vllm | 0.8.4.post1* | >=2.28 (recommended) | |
| NIXL | 0.2.1 | >=2.27 | >=11.8 |
| ai-dynamo | 0.3.0 | >=2.28 | |
| ai-dynamo-runtime | 0.3.0 | >=2.28 | |
| ai-dynamo-vllm | 0.8.4.post2* | >=2.28 (recommended) | |
| NIXL | 0.3.0 | >=2.27 | >=11.8 |

### Build Dependency
| **Build Dependency** | **Version** |
|----------------------|-------------|
| **Base Container** | [25.03](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda-dl-base/tags) |
| **ai-dynamo-vllm** |0.8.4.post1* |
| **ai-dynamo-vllm** |0.8.4.post2* |
| **TensorRT-LLM** | 0.19.0** |
| **NIXL** | 0.2.1 |
| **NIXL** | 0.3.0 |

> **Note**:
> - *ai-dynamo-vllm v0.8.4.post1 is a customized patch of v0.8.4 from vLLM.
> - *ai-dynamo-vllm v0.8.4.post2 is a customized patch of v0.8.4 from vLLM.
> - **Specific versions of TensorRT-LLM supported by Dynamo are subject to change.


Expand Down
26 changes: 19 additions & 7 deletions lib/bindings/python/Cargo.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

3 changes: 2 additions & 1 deletion lib/bindings/python/Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@

[package]
name = "dynamo-py3"
version = "0.2.1"
version = "0.3.0"
edition = "2021"
authors = ["NVIDIA"]
license = "Apache-2.0"
Expand Down Expand Up @@ -75,3 +75,4 @@ pyo3-async-runtimes = { version = "0.23.0", default-features = false, features =
pythonize = "0.23"

dlpark = { version = "0.5", features = ["pyo3", "half"], optional = true }

2 changes: 1 addition & 1 deletion lib/llm/Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -81,7 +81,7 @@ regex = "1"
rayon = "1"

# block_manager
nixl-sys = { version = "0.2.1-rc.3", optional = true }
nixl-sys = { version = "0.3.0-rc.2", optional = true }
cudarc = { version = "0.16.2", features = ["cuda-12020"], optional = true }
ndarray = { version = "0.16", optional = true }
nix = { version = "0.26", optional = true }
Expand Down
6 changes: 3 additions & 3 deletions lib/runtime/examples/Cargo.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

2 changes: 1 addition & 1 deletion lib/runtime/examples/Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@ members = [
resolver = "3"

[workspace.package]
version = "0.2.1"
version = "0.3.0"
edition = "2021"
authors = ["NVIDIA"]
license = "Apache-2.0"
Expand Down
4 changes: 2 additions & 2 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@

[project]
name = "ai-dynamo"
version = "0.2.1"
version = "0.3.0"
description = "Distributed Inference Framework"
readme = "README.md"
authors = [
Expand All @@ -29,7 +29,7 @@ dependencies = [
"bentoml==1.4.8",
"types-psutil==7.0.0.20250218",
"kubernetes==32.0.1",
"ai-dynamo-runtime==0.2.1",
"ai-dynamo-runtime==0.3.0",
"fastapi==0.115.6",
"distro",
"typer",
Expand Down