diff --git a/Cargo.lock b/Cargo.lock index 52a3b155fa7..2407585bcf4 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -1996,7 +1996,7 @@ dependencies = [ [[package]] name = "dynamo-async-openai" -version = "0.5.0" +version = "0.5.1" dependencies = [ "async-openai-macros", "backoff", @@ -2024,7 +2024,7 @@ dependencies = [ [[package]] name = "dynamo-engine-llamacpp" -version = "0.5.0" +version = "0.5.1" dependencies = [ "async-stream", "dynamo-llm", @@ -2036,7 +2036,7 @@ dependencies = [ [[package]] name = "dynamo-engine-mistralrs" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "async-stream", @@ -2054,7 +2054,7 @@ dependencies = [ [[package]] name = "dynamo-llm" -version = "0.5.0" +version = "0.5.1" dependencies = [ "ahash", "aho-corasick", @@ -2148,7 +2148,7 @@ dependencies = [ [[package]] name = "dynamo-parsers" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "dynamo-async-openai", @@ -2166,7 +2166,7 @@ dependencies = [ [[package]] name = "dynamo-run" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "async-stream", @@ -2195,7 +2195,7 @@ dependencies = [ [[package]] name = "dynamo-runtime" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "arc-swap", @@ -2253,7 +2253,7 @@ dependencies = [ [[package]] name = "dynamo-tokens" -version = "0.5.0" +version = "0.5.1" dependencies = [ "bytemuck", "derive-getters", @@ -4145,7 +4145,7 @@ checksum = "6a82ae493e598baaea5209805c49bbf2ea7de956d50d7da0da1164f9c6d28543" [[package]] name = "libdynamo_llm" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "async-once-cell", @@ -4544,7 +4544,7 @@ dependencies = [ [[package]] name = "metrics" -version = "0.5.0" +version = "0.5.1" dependencies = [ "axum 0.8.4", "clap 4.5.46", diff --git a/Cargo.toml b/Cargo.toml index a21dafdefff..f3a4a6944a2 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -16,7 +16,7 @@ members = [ resolver = "3" [workspace.package] -version = "0.5.0" +version = "0.5.1" edition = "2024" description = "Dynamo Inference Framework" authors = ["NVIDIA Inc. "] @@ -27,14 +27,15 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed"] [workspace.dependencies] # Local crates -dynamo-runtime = { path = "lib/runtime", version = "0.5.0" } -dynamo-llm = { path = "lib/llm", version = "0.5.0" } -dynamo-tokens = { path = "lib/tokens", version = "0.5.0" } -dynamo-async-openai = { path = "lib/async-openai", version = "0.5.0", features = [ +dynamo-runtime = { path = "lib/runtime", version = "0.5.1" } +dynamo-llm = { path = "lib/llm", version = "0.5.1" } +dynamo-tokens = { path = "lib/tokens", version = "0.5.1" } +dynamo-async-openai = { path = "lib/async-openai", version = "0.5.1", features = [ "byot", "rustls", ] } -dynamo-parsers = { path = "lib/parsers", version = "0.5.0" } +dynamo-parsers = { path = "lib/parsers", version = "0.5.1" } + # External dependencies anyhow = { version = "1" } diff --git a/docs/support_matrix.md b/docs/support_matrix.md index 7fcca6bf5bd..176763c66ef 100644 --- a/docs/support_matrix.md +++ b/docs/support_matrix.md @@ -58,8 +58,8 @@ If you are using a **GPU**, the following GPU models and architectures are suppo | **Python Package** | **Version** | glibc version | CUDA Version | | :----------------- | :------------ | :----------------------------------- | :----------- | -| ai-dynamo | 0.5.0 | >=2.28 | | -| ai-dynamo-runtime | 0.5.0 | >=2.28 (Python 3.12 has known issues)| | +| ai-dynamo | 0.5.1 | >=2.28 | | +| ai-dynamo-runtime | 0.5.1 | >=2.28 (Python 3.12 has known issues)| | | NIXL | 0.4.1 | >=2.27 | >=11.8 | ### Build Dependency diff --git a/lib/bindings/python/Cargo.lock b/lib/bindings/python/Cargo.lock index 6558167725f..66aab658ab4 100644 --- a/lib/bindings/python/Cargo.lock +++ b/lib/bindings/python/Cargo.lock @@ -1353,7 +1353,7 @@ dependencies = [ [[package]] name = "dynamo-async-openai" -version = "0.5.0" +version = "0.5.1" dependencies = [ "async-openai-macros", "backoff", @@ -1379,7 +1379,7 @@ dependencies = [ [[package]] name = "dynamo-llm" -version = "0.5.0" +version = "0.5.1" dependencies = [ "ahash", "aho-corasick", @@ -1459,7 +1459,7 @@ dependencies = [ [[package]] name = "dynamo-parsers" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "dynamo-async-openai", @@ -1477,7 +1477,7 @@ dependencies = [ [[package]] name = "dynamo-py3" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "async-stream", @@ -1513,7 +1513,7 @@ dependencies = [ [[package]] name = "dynamo-runtime" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "arc-swap", diff --git a/lib/bindings/python/Cargo.toml b/lib/bindings/python/Cargo.toml index 8b698fa441b..132d825d358 100644 --- a/lib/bindings/python/Cargo.toml +++ b/lib/bindings/python/Cargo.toml @@ -7,7 +7,7 @@ [package] name = "dynamo-py3" -version = "0.5.0" +version = "0.5.1" edition = "2024" authors = ["NVIDIA"] license = "Apache-2.0" diff --git a/lib/bindings/python/pyproject.toml b/lib/bindings/python/pyproject.toml index 33709891435..f011e336979 100644 --- a/lib/bindings/python/pyproject.toml +++ b/lib/bindings/python/pyproject.toml @@ -16,7 +16,7 @@ [project] name = "ai-dynamo-runtime" -version = "0.5.0" +version = "0.5.1" description = "Dynamo Inference Framework Runtime" readme = "README.md" authors = [ diff --git a/lib/runtime/examples/Cargo.lock b/lib/runtime/examples/Cargo.lock index c096ec7d2ee..03e652577fc 100644 --- a/lib/runtime/examples/Cargo.lock +++ b/lib/runtime/examples/Cargo.lock @@ -657,7 +657,7 @@ dependencies = [ [[package]] name = "dynamo-runtime" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "arc-swap", @@ -1030,7 +1030,7 @@ checksum = "2304e00983f87ffb38b55b444b5e3b60a884b5d30c0fca7d82fe33449bbe55ea" [[package]] name = "hello_world" -version = "0.5.0" +version = "0.5.1" dependencies = [ "dynamo-runtime", ] @@ -2502,7 +2502,7 @@ dependencies = [ [[package]] name = "service_metrics" -version = "0.5.0" +version = "0.5.1" dependencies = [ "dynamo-runtime", "futures", @@ -2678,7 +2678,7 @@ dependencies = [ [[package]] name = "system_metrics" -version = "0.5.0" +version = "0.5.1" dependencies = [ "anyhow", "dynamo-runtime", diff --git a/lib/runtime/examples/Cargo.toml b/lib/runtime/examples/Cargo.toml index 4b8d0881ed9..653b7f0c7a1 100644 --- a/lib/runtime/examples/Cargo.toml +++ b/lib/runtime/examples/Cargo.toml @@ -10,7 +10,7 @@ members = [ resolver = "3" [workspace.package] -version = "0.5.0" +version = "0.5.1" edition = "2024" authors = ["NVIDIA"] license = "Apache-2.0" diff --git a/pyproject.toml b/pyproject.toml index eff8b4f4264..316608a51ed 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -3,7 +3,7 @@ [project] name = "ai-dynamo" -version = "0.5.0" +version = "0.5.1" description = "Distributed Inference Framework" readme = "README.md" authors = [ @@ -13,7 +13,7 @@ license = { text = "Apache-2.0" } license-files = ["LICENSE"] requires-python = ">=3.10" dependencies = [ - "ai-dynamo-runtime==0.5.0", + "ai-dynamo-runtime==0.5.1", "pytest>=8.3.4", "types-psutil>=7.0.0.20250218", "kubernetes>=32.0.1,<33.0.0",