Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
dynamo
Commits
c4935b34
Unverified
Commit
c4935b34
authored
Jul 07, 2025
by
Anant Sharma
Committed by
GitHub
Jul 07, 2025
Browse files
chore: update versions for 0.3.2 release (#1793)
parent
533b8cee
Changes
9
Hide whitespace changes
Inline
Side-by-side
Showing
9 changed files
with
32 additions
and
32 deletions
+32
-32
Cargo.lock
Cargo.lock
+11
-11
Cargo.toml
Cargo.toml
+4
-4
container/Dockerfile.vllm
container/Dockerfile.vllm
+1
-1
docs/support_matrix.md
docs/support_matrix.md
+6
-6
lib/bindings/python/Cargo.lock
lib/bindings/python/Cargo.lock
+3
-3
lib/bindings/python/Cargo.toml
lib/bindings/python/Cargo.toml
+1
-1
lib/runtime/examples/Cargo.lock
lib/runtime/examples/Cargo.lock
+3
-3
lib/runtime/examples/Cargo.toml
lib/runtime/examples/Cargo.toml
+1
-1
pyproject.toml
pyproject.toml
+2
-2
No files found.
Cargo.lock
View file @
c4935b34
...
@@ -1674,7 +1674,7 @@ dependencies = [
...
@@ -1674,7 +1674,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-engine-llamacpp"
name = "dynamo-engine-llamacpp"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"async-stream",
"async-stream",
"dynamo-llm",
"dynamo-llm",
...
@@ -1686,7 +1686,7 @@ dependencies = [
...
@@ -1686,7 +1686,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-engine-mistralrs"
name = "dynamo-engine-mistralrs"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"async-openai",
"async-openai",
...
@@ -1704,7 +1704,7 @@ dependencies = [
...
@@ -1704,7 +1704,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-llm"
name = "dynamo-llm"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"akin",
"akin",
"aligned-vec",
"aligned-vec",
...
@@ -1778,7 +1778,7 @@ dependencies = [
...
@@ -1778,7 +1778,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-run"
name = "dynamo-run"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"async-openai",
"async-openai",
...
@@ -1806,7 +1806,7 @@ dependencies = [
...
@@ -1806,7 +1806,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-runtime"
name = "dynamo-runtime"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"assert_matches",
"assert_matches",
...
@@ -1855,7 +1855,7 @@ dependencies = [
...
@@ -1855,7 +1855,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-tokens"
name = "dynamo-tokens"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"bytemuck",
"bytemuck",
"derive-getters",
"derive-getters",
...
@@ -2893,7 +2893,7 @@ dependencies = [
...
@@ -2893,7 +2893,7 @@ dependencies = [
[[package]]
[[package]]
name = "http"
name = "http"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"clap",
"clap",
"dynamo-llm",
"dynamo-llm",
...
@@ -3538,7 +3538,7 @@ checksum = "d750af042f7ef4f724306de029d18836c26c1765a54a6a3f094cbd23a7267ffa"
...
@@ -3538,7 +3538,7 @@ checksum = "d750af042f7ef4f724306de029d18836c26c1765a54a6a3f094cbd23a7267ffa"
[[package]]
[[package]]
name = "libdynamo_llm"
name = "libdynamo_llm"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"async-once-cell",
"async-once-cell",
...
@@ -3650,7 +3650,7 @@ dependencies = [
...
@@ -3650,7 +3650,7 @@ dependencies = [
[[package]]
[[package]]
name = "llmctl"
name = "llmctl"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"clap",
"clap",
...
@@ -3850,7 +3850,7 @@ dependencies = [
...
@@ -3850,7 +3850,7 @@ dependencies = [
[[package]]
[[package]]
name = "metrics"
name = "metrics"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"axum 0.6.20",
"axum 0.6.20",
"clap",
"clap",
...
@@ -5592,7 +5592,7 @@ dependencies = [
...
@@ -5592,7 +5592,7 @@ dependencies = [
[[package]]
[[package]]
name = "router"
name = "router"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"clap",
"clap",
"dynamo-llm",
"dynamo-llm",
...
...
Cargo.toml
View file @
c4935b34
...
@@ -28,7 +28,7 @@ members = [
...
@@ -28,7 +28,7 @@ members = [
resolver
=
"3"
resolver
=
"3"
[workspace.package]
[workspace.package]
version
=
"0.3.
1
"
version
=
"0.3.
2
"
edition
=
"2021"
edition
=
"2021"
description
=
"Dynamo Inference Framework"
description
=
"Dynamo Inference Framework"
authors
=
[
"NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"
]
authors
=
[
"NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"
]
...
@@ -39,9 +39,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]
...
@@ -39,9 +39,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]
[workspace.dependencies]
[workspace.dependencies]
# Local crates
# Local crates
dynamo-runtime
=
{
path
=
"lib/runtime"
,
version
=
"0.3.
1
"
}
dynamo-runtime
=
{
path
=
"lib/runtime"
,
version
=
"0.3.
2
"
}
dynamo-llm
=
{
path
=
"lib/llm"
,
version
=
"0.3.
1
"
}
dynamo-llm
=
{
path
=
"lib/llm"
,
version
=
"0.3.
2
"
}
dynamo-tokens
=
{
path
=
"lib/tokens"
,
version
=
"0.3.
1
"
}
dynamo-tokens
=
{
path
=
"lib/tokens"
,
version
=
"0.3.
2
"
}
# External dependencies
# External dependencies
anyhow
=
{
version
=
"1"
}
anyhow
=
{
version
=
"1"
}
...
...
container/Dockerfile.vllm
View file @
c4935b34
...
@@ -163,7 +163,7 @@ RUN uv pip install /workspace/wheels/nixl/*.whl
...
@@ -163,7 +163,7 @@ RUN uv pip install /workspace/wheels/nixl/*.whl
ARG VLLM_REF="0.8.4"
ARG VLLM_REF="0.8.4"
ARG VLLM_PATCH="vllm_v${VLLM_REF}-dynamo-kv-disagg-patch.patch"
ARG VLLM_PATCH="vllm_v${VLLM_REF}-dynamo-kv-disagg-patch.patch"
ARG VLLM_PATCHED_PACKAGE_NAME="ai_dynamo_vllm"
ARG VLLM_PATCHED_PACKAGE_NAME="ai_dynamo_vllm"
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post
3
"
ARG VLLM_PATCHED_PACKAGE_VERSION="0.8.4.post
4
"
ARG VLLM_MAX_JOBS=4
ARG VLLM_MAX_JOBS=4
RUN --mount=type=bind,source=./container/deps/,target=/tmp/deps \
RUN --mount=type=bind,source=./container/deps/,target=/tmp/deps \
--mount=type=cache,target=/root/.cache/uv \
--mount=type=cache,target=/root/.cache/uv \
...
...
docs/support_matrix.md
View file @
c4935b34
...
@@ -70,9 +70,9 @@ If you are using a **GPU**, the following GPU models and architectures are suppo
...
@@ -70,9 +70,9 @@ If you are using a **GPU**, the following GPU models and architectures are suppo
| **Python Package** | **Version** | glibc version | CUDA Version |
| **Python Package** | **Version** | glibc version | CUDA Version |
| :----------------- | :------------ | :----------------------------------- | :----------- |
| :----------------- | :------------ | :----------------------------------- | :----------- |
| ai-dynamo | 0.3.1 | >=2.28 | |
| ai-dynamo | 0.3.2 | >=2.28 | |
| ai-dynamo-runtime | 0.3.1 | >=2.28 (Python 3.12 has known issues)| |
| ai-dynamo-runtime | 0.3.2 | >=2.28 (Python 3.12 has known issues)| |
| ai-dynamo-vllm | 0.8.4.post3¹ | >=2.28 (recommended) | |
| ai-dynamo-vllm | 0.8.4.post4¹ | >=2.28 (recommended) | |
| NIXL | 0.3.1 | >=2.27 | >=11.8 |
| NIXL | 0.3.1 | >=2.27 | >=11.8 |
### Build Dependency
### Build Dependency
...
@@ -80,12 +80,12 @@ If you are using a **GPU**, the following GPU models and architectures are suppo
...
@@ -80,12 +80,12 @@ If you are using a **GPU**, the following GPU models and architectures are suppo
| **Build Dependency** | **Version** |
| **Build Dependency** | **Version** |
| :------------------- | :------------------------------------------------------------------------------- |
| :------------------- | :------------------------------------------------------------------------------- |
| **Base Container** | [25.03](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda-dl-base/tags) |
| **Base Container** | [25.03](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/cuda-dl-base/tags) |
| **ai-dynamo-vllm** | 0.8.4.post3¹ |
| **ai-dynamo-vllm** | 0.8.4.post4¹ |
| **TensorRT-LLM** | 0.21.0rc² |
| **TensorRT-LLM** | 1.0.0rc² |
| **NIXL** | 0.3.1 |
| **NIXL** | 0.3.1 |
> [!Important]
> [!Important]
> ¹ ai-dynamo-vllm `v0.8.4.post3` is a customized patch of `v0.8.4` from vLLM.
> ¹ ai-dynamo-vllm `v0.8.4.post4` is a customized patch of `v0.8.4` from vLLM.
>
>
> ² Specific versions of TensorRT-LLM supported by Dynamo are subject to change.
> ² Specific versions of TensorRT-LLM supported by Dynamo are subject to change.
...
...
lib/bindings/python/Cargo.lock
View file @
c4935b34
...
@@ -1116,7 +1116,7 @@ dependencies = [
...
@@ -1116,7 +1116,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-llm"
name = "dynamo-llm"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"akin",
"akin",
"anyhow",
"anyhow",
...
@@ -1181,7 +1181,7 @@ dependencies = [
...
@@ -1181,7 +1181,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-py3"
name = "dynamo-py3"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"async-openai",
"async-openai",
...
@@ -1207,7 +1207,7 @@ dependencies = [
...
@@ -1207,7 +1207,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-runtime"
name = "dynamo-runtime"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"async-nats",
"async-nats",
...
...
lib/bindings/python/Cargo.toml
View file @
c4935b34
...
@@ -19,7 +19,7 @@
...
@@ -19,7 +19,7 @@
[package]
[package]
name
=
"dynamo-py3"
name
=
"dynamo-py3"
version
=
"0.3.
1
"
version
=
"0.3.
2
"
edition
=
"2021"
edition
=
"2021"
authors
=
["NVIDIA"]
authors
=
["NVIDIA"]
license
=
"Apache-2.0"
license
=
"Apache-2.0"
...
...
lib/runtime/examples/Cargo.lock
View file @
c4935b34
...
@@ -623,7 +623,7 @@ dependencies = [
...
@@ -623,7 +623,7 @@ dependencies = [
[[package]]
[[package]]
name = "dynamo-runtime"
name = "dynamo-runtime"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"anyhow",
"anyhow",
"async-nats",
"async-nats",
...
@@ -994,7 +994,7 @@ checksum = "2304e00983f87ffb38b55b444b5e3b60a884b5d30c0fca7d82fe33449bbe55ea"
...
@@ -994,7 +994,7 @@ checksum = "2304e00983f87ffb38b55b444b5e3b60a884b5d30c0fca7d82fe33449bbe55ea"
[[package]]
[[package]]
name = "hello_world"
name = "hello_world"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"dynamo-runtime",
"dynamo-runtime",
]
]
...
@@ -2306,7 +2306,7 @@ dependencies = [
...
@@ -2306,7 +2306,7 @@ dependencies = [
[[package]]
[[package]]
name = "service_metrics"
name = "service_metrics"
version = "0.3.
1
"
version = "0.3.
2
"
dependencies = [
dependencies = [
"dynamo-runtime",
"dynamo-runtime",
"futures",
"futures",
...
...
lib/runtime/examples/Cargo.toml
View file @
c4935b34
...
@@ -21,7 +21,7 @@ members = [
...
@@ -21,7 +21,7 @@ members = [
resolver
=
"3"
resolver
=
"3"
[workspace.package]
[workspace.package]
version
=
"0.3.
1
"
version
=
"0.3.
2
"
edition
=
"2021"
edition
=
"2021"
authors
=
["NVIDIA"]
authors
=
["NVIDIA"]
license
=
"Apache-2.0"
license
=
"Apache-2.0"
...
...
pyproject.toml
View file @
c4935b34
...
@@ -15,7 +15,7 @@
...
@@ -15,7 +15,7 @@
[project]
[project]
name
=
"ai-dynamo"
name
=
"ai-dynamo"
version
=
"0.3.
1
"
version
=
"0.3.
2
"
description
=
"Distributed Inference Framework"
description
=
"Distributed Inference Framework"
readme
=
"README.md"
readme
=
"README.md"
authors
=
[
authors
=
[
...
@@ -28,7 +28,7 @@ dependencies = [
...
@@ -28,7 +28,7 @@ dependencies = [
"pytest>=8.3.4"
,
"pytest>=8.3.4"
,
"types-psutil==7.0.0.20250218"
,
"types-psutil==7.0.0.20250218"
,
"kubernetes==32.0.1"
,
"kubernetes==32.0.1"
,
"ai-dynamo-runtime==0.3.
1
"
,
"ai-dynamo-runtime==0.3.
2
"
,
"fastapi==0.115.6"
,
"fastapi==0.115.6"
,
"distro"
,
"distro"
,
# filelock: required by planner
# filelock: required by planner
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment