Cargo.toml 5.32 KB
Newer Older
1
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
3
4
5
# SPDX-License-Identifier: Apache-2.0

[workspace]
members = [
6
7
    "lib/llm",
    "lib/runtime",
8
    "lib/config",
9
    "lib/tokenizers",
10
    "lib/tokens",
11
    "lib/mocker",
12
    "lib/kv-router",
13
    "lib/memory",
Ryan Olson's avatar
Ryan Olson committed
14
    "lib/kvbm-common",
Ryan Olson's avatar
Ryan Olson committed
15
16
    "lib/kvbm-config",
    "lib/kvbm-engine",
17
    "lib/kvbm-kernels",
Ryan Olson's avatar
Ryan Olson committed
18
    "lib/kvbm-logical",
Ryan Olson's avatar
Ryan Olson committed
19
    "lib/kvbm-physical",
20
    "lib/protocols",
21
    "lib/parsers",
Yan Ru Pei's avatar
Yan Ru Pei committed
22
    "lib/bench",
23
    "lib/bindings/c",
24
    "lib/bindings/python/codegen",
25
]
26
resolver = "3"
27
28

[workspace.package]
29
version = "1.1.0"
30
edition = "2024"
31
32
description = "Dynamo Inference Framework"
authors = ["NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"]
33
license = "Apache-2.0"
Neelay Shah's avatar
Neelay Shah committed
34
35
homepage = "https://github.com/ai-dynamo/dynamo"
repository = "https://github.com/ai-dynamo/dynamo.git"
36
keywords = ["llm", "genai", "inference", "nvidia", "distributed"]
37
38

[workspace.dependencies]
39
# Local crates
40
41
42
dynamo-runtime = { path = "lib/runtime", version = "1.1.0" }
dynamo-llm = { path = "lib/llm", version = "1.1.0" }
dynamo-config = { path = "lib/config", version = "1.1.0" }
43
dynamo-tokenizers = { path = "lib/tokenizers", version = "1.1.0" }
44
45
46
47
48
49
dynamo-tokens = { path = "lib/tokens", version = "1.1.0" }
dynamo-memory = { path = "lib/memory", version = "1.1.0" }
dynamo-mocker = { path = "lib/mocker", version = "1.1.0" }
dynamo-kv-router = { path = "lib/kv-router", version = "1.1.0", features = ["metrics", "runtime-protocols"] }
dynamo-protocols = { path = "lib/protocols", version = "1.1.0" }
dynamo-parsers = { path = "lib/parsers", version = "1.1.0" }
50
fastokens = { version = "0.1.0" }
51

Ryan Olson's avatar
Ryan Olson committed
52

53
# kvbm
54
55
56
57
58
59
kvbm-common = { path = "lib/kvbm-common", version = "1.1.0" }
kvbm-config = { path = "lib/kvbm-config", version = "1.1.0" }
kvbm-engine = { path = "lib/kvbm-engine", version = "1.1.0" }
kvbm-kernels = { path = "lib/kvbm-kernels", version = "1.1.0" }
kvbm-logical = { path = "lib/kvbm-logical", version = "1.1.0" }
kvbm-physical = { path = "lib/kvbm-physical", version = "1.1.0" }
60
61

# velo
Ryan Olson's avatar
Ryan Olson committed
62
velo = { version = "0.1.0" }
63

64
# External dependencies
65
anyhow = { version = "1" }
66
async-nats = { version = "0.45.0", features = ["service"] }
67
68
async-stream = { version = "0.3" }
async-trait = { version = "0.1" }
69
70
blake3 = { version = "1" }
bytes = { version = "1" }
71
72
73
74
75
76
77
chrono = { version = "0.4", default-features = false, features = [
    "alloc",
    "std",
    "clock",
    "now",
    "serde",
] }
78
cudarc = { version = "=0.19.3", features = ["cuda-version-from-build-system", "fallback-latest"] }
79
dashmap = { version = "6.1" }
80
81
82
derive_builder = { version = "0.20" }
derive-getters = { version = "0.5" }
either = { version = "1.13", features = ["serde"] }
83
etcd-client = { version = "0.17.0", features = ["tls"] }
84
futures = { version = "0.3" }
85
futures-util = { version = "0.3.32" }
86
87
88
89
90
91
92
hf-hub = { version = "0.4.2", default-features = false, features = [
    "tokio",
    "rustls-tls",
    "ureq",
] }

# ModelExpress for model downloading
93
94
modelexpress-client = { version = "0.3.0" }
modelexpress-common = { version = "0.3.0" }
95

96
humantime = { version = "2.2.0" }
97
indexmap = { version = "2" }
98
libc = { version = "0.2" }
99
oneshot = { version = "0.1.13", features = ["std", "async"] }
100
ordered-float = "4"
101
parking_lot = "0.12.5"
Ryan Olson's avatar
Ryan Olson committed
102
prometheus = { version = "0.14"}
103
104
rand = { version = "0.9.2" }
reqwest = { version = "0.12.24", default-features = false, features = [
105
    "multipart",
106
107
108
109
    "json",
    "stream",
    "rustls-tls",
] }
110
rmp-serde = { version = "1" }
Ryan Olson's avatar
Ryan Olson committed
111
serde_bytes = { version = "0.11" }
112
113
# "rc" is for async-openai. Allows serializing Rc and Arc. Generally avoid doing that.
serde = { version = "1", features = ["derive", "rc"] }
114
serde_json = { version = "1" }
115
strum = { version = "0.27", features = ["derive"] }
116
tempfile = "3"
117
thiserror = { version = "2.0.17" }
118
tmq = { version = "0.5.0" }
Ryan Olson's avatar
Ryan Olson committed
119
tokio = { version = "=1.48.0", features = ["full"] }
120
tokio-stream = { version = "0.1" }
Ryan Olson's avatar
Ryan Olson committed
121
tokio-util = { version = "0.7.17", features = ["codec", "net", "rt", "io-util"] }
122
tower-http = { version = "0.6", features = ["trace"] }
123
axum = { version = "=0.8.4", features = ["macros"] }
124
axum-core = { version = "0.5.2" }
125
126
hyper = { version = "=1.7.0" }
hyper-util = { version = "=0.1.17" }
127
mio = { version = "=1.1.1" }
128
tracing = { version = "0.1" }
129
130
131
132
133
tracing-subscriber = { version = "0.3", features = [
    "env-filter",
    "local-time",
    "json",
] }
134
tracing-opentelemetry = { version = "0.32.0" }
135
136
137
138
opentelemetry = { version = "0.31.0", features = ["trace", "logs"] }
opentelemetry_sdk = { version = "0.31.0", features = ["trace", "logs", "rt-tokio"] }
opentelemetry-otlp = { version = "0.31.0", features = ["trace", "logs", "grpc-tonic"] }
opentelemetry-appender-tracing = { version = "0.31.0" }
139
validator = { version = "0.20.0", features = ["derive"] }
140
uuid = { version = "1.18.1", features = ["v4", "serde"] }
141
url = { version = "2.5", features = ["serde"] }
142
xxhash-rust = { version = "0.8", features = ["xxh3", "const_xxh3"] }
Graham King's avatar
Graham King committed
143
144
145

[profile.dev.package]
insta.opt-level = 3
146

147
148
[profile.dev]
# release level optimizations otherwise everything feels slow
149
# opt-level = 3
150

151
[profile.release]
152
# These make the build much slower but shrink the binary, and could help performance
153
codegen-units = 1
154
lto = "thin"
155
156
157
158
159
160
161

# Profiling profile: release-like but retains debug symbols for perf/flamegraph/Nsight.
# Build: cargo build --profile profiling --features nvtx
[profile.profiling]
inherits = "release"
debug = true
strip = false