Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
dynamo
Commits
9d9a1d9b
Unverified
Commit
9d9a1d9b
authored
May 29, 2025
by
Anant Sharma
Committed by
GitHub
May 29, 2025
Browse files
chore: update dynamo and nixl versions for 0.3.0 (#1240)
parent
c9eb6a83
Changes
11
Hide whitespace changes
Inline
Side-by-side
Showing
11 changed files
with
79 additions
and
54 deletions
+79
-54
Cargo.lock
Cargo.lock
+38
-26
Cargo.toml
Cargo.toml
+4
-4
container/Dockerfile.vllm
container/Dockerfile.vllm
+1
-1
container/build.sh
container/build.sh
+1
-1
docs/support_matrix.md
docs/support_matrix.md
+7
-7
lib/bindings/python/Cargo.lock
lib/bindings/python/Cargo.lock
+19
-7
lib/bindings/python/Cargo.toml
lib/bindings/python/Cargo.toml
+2
-1
lib/llm/Cargo.toml
lib/llm/Cargo.toml
+1
-1
lib/runtime/examples/Cargo.lock
lib/runtime/examples/Cargo.lock
+3
-3
lib/runtime/examples/Cargo.toml
lib/runtime/examples/Cargo.toml
+1
-1
pyproject.toml
pyproject.toml
+2
-2
No files found.
Cargo.lock
View file @
9d9a1d9b
...
...
@@ -814,9 +814,9 @@ dependencies = [
[[package]]
name = "cc"
version = "1.2.2
0
"
version = "1.2.2
4
"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
04da6a0d40b948dfc4fa8f5bbf402b0fc1a64a28dbf7d12ffd683550f2c1b63a
"
checksum = "
16595d3be041c03b09d08d0858631facccee9221e579704070e6e9e4915d3bc7
"
dependencies = [
"jobserver",
"libc",
...
...
@@ -1555,7 +1555,7 @@ dependencies = [
[[package]]
name = "dynamo-engine-llamacpp"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"async-stream",
"dynamo-llm",
...
...
@@ -1567,7 +1567,7 @@ dependencies = [
[[package]]
name = "dynamo-engine-mistralrs"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"async-openai",
...
...
@@ -1586,7 +1586,7 @@ dependencies = [
[[package]]
name = "dynamo-llm"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"akin",
"aligned-vec",
...
...
@@ -1658,7 +1658,7 @@ dependencies = [
[[package]]
name = "dynamo-run"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"async-openai",
...
...
@@ -1686,7 +1686,7 @@ dependencies = [
[[package]]
name = "dynamo-runtime"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"assert_matches",
...
...
@@ -1735,7 +1735,7 @@ dependencies = [
[[package]]
name = "dynamo-tokens"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"bytemuck",
"derive-getters",
...
...
@@ -2733,18 +2733,6 @@ dependencies = [
"match_token",
]
[[package]]
name = "http"
version = "0.2.1"
dependencies = [
"clap",
"dynamo-llm",
"dynamo-runtime",
"serde",
"serde_json",
"tokio",
]
[[package]]
name = "http"
version = "0.2.12"
...
...
@@ -2756,6 +2744,18 @@ dependencies = [
"itoa",
]
[[package]]
name = "http"
version = "0.3.0"
dependencies = [
"clap",
"dynamo-llm",
"dynamo-runtime",
"serde",
"serde_json",
"tokio",
]
[[package]]
name = "http"
version = "1.3.1"
...
...
@@ -3364,7 +3364,7 @@ checksum = "d750af042f7ef4f724306de029d18836c26c1765a54a6a3f094cbd23a7267ffa"
[[package]]
name = "libdynamo_llm"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"async-once-cell",
...
...
@@ -3477,7 +3477,7 @@ dependencies = [
[[package]]
name = "llmctl"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"clap",
...
...
@@ -3677,7 +3677,7 @@ dependencies = [
[[package]]
name = "metrics"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"axum 0.6.20",
"clap",
...
...
@@ -4084,13 +4084,14 @@ dependencies = [
[[package]]
name = "nixl-sys"
version = "0.
2.1
-rc.
3
"
version = "0.
3.0
-rc.
2
"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
bfeec33e0229249e8688309a70c677f522446f9ac92105a85aad4a5ceef2dd2f
"
checksum = "
6a1727039c315bf41aeadcdbea02522b8a3df69a77bd732996243502a5fb6f07
"
dependencies = [
"bindgen 0.71.1",
"cc",
"libc",
"os_info",
"pkg-config",
"serde",
"thiserror 2.0.12",
...
...
@@ -4387,6 +4388,17 @@ dependencies = [
"num-traits",
]
[[package]]
name = "os_info"
version = "3.11.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "41fc863e2ca13dc2d5c34fb22ea4a588248ac14db929616ba65c45f21744b1e9"
dependencies = [
"log",
"serde",
"windows-sys 0.52.0",
]
[[package]]
name = "overload"
version = "0.1.1"
...
...
@@ -5333,7 +5345,7 @@ dependencies = [
[[package]]
name = "router"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"clap",
"dynamo-llm",
...
...
Cargo.toml
View file @
9d9a1d9b
...
...
@@ -28,7 +28,7 @@ members = [
resolver
=
"3"
[workspace.package]
version
=
"0.
2.1
"
version
=
"0.
3.0
"
edition
=
"2021"
description
=
"Dynamo Inference Framework"
authors
=
[
"NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"
]
...
...
@@ -39,9 +39,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]
[workspace.dependencies]
# Local crates
dynamo-runtime
=
{
path
=
"lib/runtime"
,
version
=
"0.
2.1
"
}
dynamo-llm
=
{
path
=
"lib/llm"
,
version
=
"0.
2.1
"
}
dynamo-tokens
=
{
path
=
"lib/tokens"
,
version
=
"0.
2.1
"
}
dynamo-runtime
=
{
path
=
"lib/runtime"
,
version
=
"0.
3.0
"
}
dynamo-llm
=
{
path
=
"lib/llm"
,
version
=
"0.
3.0
"
}
dynamo-tokens
=
{
path
=
"lib/tokens"
,
version
=
"0.
3.0
"
}
# External dependencies
anyhow
=
{
version
=
"1"
}
...
...
container/Dockerfile.vllm
View file @
9d9a1d9b
...
...
@@ -169,7 +169,7 @@ RUN uv pip install /workspace/wheels/nixl/*.whl
ARG VLLM_REF="0.8.4"
ARG VLLM_PATCH="vllm_v${VLLM_REF}-dynamo-kv-disagg-patch.patch"
ARG VLLM_PATCHED_PACKAGE_NAME="ai_dynamo_vllm"
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post
1
"
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post
2
"
ARG VLLM_MAX_JOBS=4
RUN --mount=type=bind,source=./container/deps/,target=/tmp/deps \
--mount=type=cache,target=/root/.cache/uv \
...
...
container/build.sh
View file @
9d9a1d9b
...
...
@@ -109,7 +109,7 @@ NONE_BASE_IMAGE_TAG="24.04"
SGLANG_BASE_IMAGE
=
"nvcr.io/nvidia/cuda-dl-base"
SGLANG_BASE_IMAGE_TAG
=
"25.01-cuda12.8-devel-ubuntu24.04"
NIXL_COMMIT
=
78695c2900cd7fff506764377386592dfc98e87e
NIXL_COMMIT
=
f531404be4866d85ed618b3baf4008c636798d63
NIXL_REPO
=
ai-dynamo/nixl.git
NO_CACHE
=
""
...
...
docs/support_matrix.md
View file @
9d9a1d9b
...
...
@@ -62,21 +62,21 @@ For **Linux**, the **ARM64** support is experimental and may have limitations. W
### Runtime Dependency
|
**Python Package**
|
**Version**
| glibc version | CUDA Version |
|--------------------|---------------|----------------------|--------------|
| ai-dynamo | 0.
2.1
| >=2.28 | |
| ai-dynamo-runtime | 0.
2.1
| >=2.28 | |
| ai-dynamo-vllm | 0.8.4.post
1
*
| >=2.28 (recommended) | |
| NIXL | 0.
2.1
| >=2.27 | >=11.8 |
| ai-dynamo | 0.
3.0
| >=2.28 | |
| ai-dynamo-runtime | 0.
3.0
| >=2.28 | |
| ai-dynamo-vllm | 0.8.4.post
2
*
| >=2.28 (recommended) | |
| NIXL | 0.
3.0
| >=2.27 | >=11.8 |
### Build Dependency
|
**Build Dependency**
|
**Version**
|
|----------------------|-------------|
|
**Base Container**
|
[
25.03
](
https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda-dl-base/tags
)
|
|
**ai-dynamo-vllm**
|0.8.4.post
1
*
|
|
**ai-dynamo-vllm**
|0.8.4.post
2
*
|
|
**TensorRT-LLM**
| 0.19.0
**
|
|
**NIXL**
| 0.
2.1
|
|
**NIXL**
| 0.
3.0
|
> **Note**:
> - *ai-dynamo-vllm v0.8.4.post
1
is a customized patch of v0.8.4 from vLLM.
> - *ai-dynamo-vllm v0.8.4.post
2
is a customized patch of v0.8.4 from vLLM.
> - **Specific versions of TensorRT-LLM supported by Dynamo are subject to change.
...
...
lib/bindings/python/Cargo.lock
View file @
9d9a1d9b
...
...
@@ -577,9 +577,9 @@ dependencies = [
[[package]]
name = "cc"
version = "1.2.2
0
"
version = "1.2.2
4
"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
04da6a0d40b948dfc4fa8f5bbf402b0fc1a64a28dbf7d12ffd683550f2c1b63a
"
checksum = "
16595d3be041c03b09d08d0858631facccee9221e579704070e6e9e4915d3bc7
"
dependencies = [
"jobserver",
"libc",
...
...
@@ -1092,7 +1092,7 @@ dependencies = [
[[package]]
name = "dynamo-llm"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"akin",
"anyhow",
...
...
@@ -1155,7 +1155,7 @@ dependencies = [
[[package]]
name = "dynamo-py3"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"async-openai",
...
...
@@ -1180,7 +1180,7 @@ dependencies = [
[[package]]
name = "dynamo-runtime"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"async-nats",
...
...
@@ -2810,13 +2810,14 @@ dependencies = [
[[package]]
name = "nixl-sys"
version = "0.
2.1
"
version = "0.
3.0-rc.2
"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
84bf333c75733cad60b29873d84168f841c6bd5207ae9dfbda7490a99c1ebe94
"
checksum = "
6a1727039c315bf41aeadcdbea02522b8a3df69a77bd732996243502a5fb6f07
"
dependencies = [
"bindgen",
"cc",
"libc",
"os_info",
"pkg-config",
"serde",
"thiserror 2.0.12",
...
...
@@ -3065,6 +3066,17 @@ version = "0.2.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "04744f49eae99ab78e0d5c0b603ab218f515ea8cfe5a456d7629ad883a3b6e7d"
[[package]]
name = "os_info"
version = "3.11.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "41fc863e2ca13dc2d5c34fb22ea4a588248ac14db929616ba65c45f21744b1e9"
dependencies = [
"log",
"serde",
"windows-sys 0.52.0",
]
[[package]]
name = "overload"
version = "0.1.1"
...
...
lib/bindings/python/Cargo.toml
View file @
9d9a1d9b
...
...
@@ -19,7 +19,7 @@
[package]
name
=
"dynamo-py3"
version
=
"0.
2.1
"
version
=
"0.
3.0
"
edition
=
"2021"
authors
=
["NVIDIA"]
license
=
"Apache-2.0"
...
...
@@ -75,3 +75,4 @@ pyo3-async-runtimes = { version = "0.23.0", default-features = false, features =
pythonize
=
"0.23"
dlpark
=
{
version
=
"0.5"
,
features
=
[
"pyo3"
,
"half"
],
optional
=
true
}
lib/llm/Cargo.toml
View file @
9d9a1d9b
...
...
@@ -81,7 +81,7 @@ regex = "1"
rayon
=
"1"
# block_manager
nixl-sys
=
{
version
=
"0.
2.1
-rc.
3
"
,
optional
=
true
}
nixl-sys
=
{
version
=
"0.
3.0
-rc.
2
"
,
optional
=
true
}
cudarc
=
{
version
=
"0.16.2"
,
features
=
["cuda-12020"]
,
optional
=
true
}
ndarray
=
{
version
=
"0.16"
,
optional
=
true
}
nix
=
{
version
=
"0.26"
,
optional
=
true
}
...
...
lib/runtime/examples/Cargo.lock
View file @
9d9a1d9b
...
...
@@ -623,7 +623,7 @@ dependencies = [
[[package]]
name = "dynamo-runtime"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"anyhow",
"async-nats",
...
...
@@ -994,7 +994,7 @@ checksum = "2304e00983f87ffb38b55b444b5e3b60a884b5d30c0fca7d82fe33449bbe55ea"
[[package]]
name = "hello_world"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"dynamo-runtime",
]
...
...
@@ -2306,7 +2306,7 @@ dependencies = [
[[package]]
name = "service_metrics"
version = "0.
2.1
"
version = "0.
3.0
"
dependencies = [
"dynamo-runtime",
"futures",
...
...
lib/runtime/examples/Cargo.toml
View file @
9d9a1d9b
...
...
@@ -21,7 +21,7 @@ members = [
resolver
=
"3"
[workspace.package]
version
=
"0.
2.1
"
version
=
"0.
3.0
"
edition
=
"2021"
authors
=
["NVIDIA"]
license
=
"Apache-2.0"
...
...
pyproject.toml
View file @
9d9a1d9b
...
...
@@ -15,7 +15,7 @@
[project]
name
=
"ai-dynamo"
version
=
"0.
2.1
"
version
=
"0.
3.0
"
description
=
"Distributed Inference Framework"
readme
=
"README.md"
authors
=
[
...
...
@@ -29,7 +29,7 @@ dependencies = [
"bentoml==1.4.8"
,
"types-psutil==7.0.0.20250218"
,
"kubernetes==32.0.1"
,
"ai-dynamo-runtime==0.
2.1
"
,
"ai-dynamo-runtime==0.
3.0
"
,
"fastapi==0.115.6"
,
"distro"
,
"typer"
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment