"lib/vscode:/vscode.git/clone" did not exist on "6634f33f2768d9ef5ed74aca56fa744c02f6d0a5"
Cargo.toml 6.14 KB
Newer Older
1
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
3
4
# SPDX-License-Identifier: Apache-2.0

[package]
Neelay Shah's avatar
Neelay Shah committed
5
name = "dynamo-llm"
6
7
8
9
10
version.workspace = true
edition.workspace = true
authors.workspace = true
license.workspace = true
homepage.workspace = true
11
12
13
repository.workspace = true
readme.workspace = true
description = "Dynamo LLM Library"
14

15
[features]
16
default = []
Ryan Olson's avatar
Ryan Olson committed
17
# todo(ops): get this working in CI as a default.
18
19
# default = ["block-manager", "testing-full"]

20
21
22
testing-full = ["testing-cuda", "testing-nixl"]
testing-cuda = ["dep:cudarc"]
testing-nixl = ["dep:nixl-sys"]
Ryan Olson's avatar
Ryan Olson committed
23
testing-etcd = []
24
block-manager = ["dep:nixl-sys", "dep:cudarc", "dep:nix", "dep:aligned-vec", "dep:dynamo-memory"]
25
block-manager-bench = ["block-manager", "testing-full", "dep:clap", "dep:indicatif"]
26
27
cuda = ["dep:cudarc"]
integration = ["dynamo-runtime/integration"]
28
media-nixl = ["dep:nixl-sys", "dep:dynamo-memory"]
29
media-ffmpeg = ["dep:video-rs", "dep:ffmpeg-next", "dep:memfile", "media-nixl"]
30
kv-router-stress = ["dep:clap", "dep:indicatif"]
31

32
33
34
35
[[bench]]
name = "tokenizer"
harness = false

36
37
38
39
[[bench]]
name = "transfer_context_v2"
harness = false
required-features = ["block-manager", "testing-cuda"]
40

41
42
[dependencies]
# repo
Neelay Shah's avatar
Neelay Shah committed
43
dynamo-runtime = { workspace = true }
44
dynamo-memory = { path = "../memory", optional = true }
45
46

# workspace
Ryan Olson's avatar
Ryan Olson committed
47
aho-corasick = "1.1"
48
anyhow = { workspace = true }
49
dynamo-async-openai = { workspace = true }
50
dynamo-parsers = { workspace = true }
51
52
async-stream = { workspace = true }
async-trait = { workspace = true }
53
async-nats = { workspace = true }
54
async_zmq = { workspace = true }
55
bytes = { workspace = true }
56
chrono = { workspace = true }
57
derive_builder = { workspace = true }
58
either = { workspace = true }
59
etcd-client = { workspace = true }
60
futures = { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
61
futures-util = "0.3.31"
62
hf-hub = { workspace = true }
63
humantime = { workspace = true }                           # input/batch
64
rand = { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
65
oneshot = { workspace = true }
66
parking_lot = { workspace = true }
67
prometheus = { workspace = true }
68
serde = { workspace = true }
69
serde_json = { workspace = true }
70
strum = { workspace = true }
71
tempfile = { workspace = true }
72
thiserror = { workspace = true }
73
tmq = { workspace = true }
74
75
76
77
78
tokio = { workspace = true }
tokio-stream = { workspace = true }
tokio-util = { workspace = true }
tracing = { workspace = true }
validator = { workspace = true }
79
url = { workspace = true }
80
uuid = { workspace = true }
81
xxhash-rust = { workspace = true }
82
83
modelexpress-client = { workspace = true }
modelexpress-common = { workspace = true }
84
akin = "0.4.0"
85
bitflags = { version = "2.4", features = ["serde"] }
86
blake3 = { version = "1.8", features = ["mmap", "rayon"] }
87
bytemuck = "1.22"
88
candle-core = { version = "0.9.1" }
89
derive-getters = "0.5"
90
offset-allocator = "0.2"
91
regex = "1"
92
rayon = "1"
93
dashmap = { version = "5.5.3" }
94
bincode = { version = "2.0.1", features = ["serde", "derive"] }
95

96
97
98
# lora
object_store = { version = "0.12.4", features = ["aws", "gcp", "azure", "http"] }

99
# input/text
100
101
102
103
dialoguer = { version = "0.11", default-features = false, features = [
  "editor",
  "history",
] }
104

Ryan Olson's avatar
Ryan Olson committed
105
# block_manager
106
aligned-vec = { version = "0.6.4", optional = true }
107
nixl-sys = { version = "=0.9.0", optional = true }
108
cudarc = { workspace = true, optional = true }
109
nix = { version = "0.26", optional = true }
110

111
112
113
114
# block_manager_bench
clap = { version = "4.5.49", features = ["derive"], optional = true }
indicatif = { version = "0.18.0", optional = true }

115

116
117
118
119
# protocols
unicode-segmentation = "1.12"

# http-service
120
axum = { workspace = true }
Graham King's avatar
Graham King committed
121
axum-server = { version = "0.7", features = ["tls-rustls"] }
122
123
hyper = { version = "1.5", features = ["http2", "server"] }
hyper-util = { version = "0.1", features = ["tokio", "server", "server-auto"] }
124
tower-http = { workspace = true }
Graham King's avatar
Graham King committed
125
rustls = { version = "0.23" }
126
tower = { version = "0.5", features = ["util", "make"] }
127
128
utoipa = { version = "5.3", features = ["axum_extras"] }
utoipa-swagger-ui = { version = "9.0", features = ["axum"] }
129

130

GuanLuo's avatar
GuanLuo committed
131
132
133
134
135
136
137
# grpc-service
# ping version to 0.13.1 so it depends on prost 0.13.5
# which is used across other libraries
tonic = { version = "0.13.1" }
# Request prost specifically so tonic-build properly compiles protobuf message
prost = { version = "0.13.5" }

Biswa Panda's avatar
Biswa Panda committed
138
# tokenizers
139
tokenizers = { version = "0.21.4", default-features = false, features = [
Biswa Panda's avatar
Biswa Panda committed
140
141
  "onig",
  "esaxx_fast",
142
  "rustls-tls",
Biswa Panda's avatar
Biswa Panda committed
143
144
145
146
] }

# backend
galil-seiferas = { version = "0.1" }
147
toktrie = { version = "1.1" }
148
toktrie_hf_tokenizers = { version = "1.1" }
Biswa Panda's avatar
Biswa Panda committed
149
150
151
152
153

# preprocessor
bs62 = { version = "0.1" }
erased-serde = { version = "0.4" }
itertools = { version = "0.14.0" }
154
155
minijinja = { version = "2.14.0", features = ["loader"] }
minijinja-contrib = { version = "2.14.0", features = ["pycompat"] }
156
json-five = { version = "0.3" }
157

158
159
160
# media loading in the preprocessor
reqwest = { workspace = true }
base64 = { version = "0.22" }
161
image = { version = "0.25", features = ["serde"] }
162
163
164
video-rs = { version = "0.10.5", optional = true }
ffmpeg-next = { version = "7.1.0", optional = true }
memfile = { version = "0.3.2", optional = true }
165
166
tokio-rayon = {version = "2" }
ndarray = { version = "0.16" }
167
168
ndarray-npy = { version = "0.9" }
ndarray-interp = { version = "0.5" }
169

170
171
172
# Publishers
zeromq = "0.4.1"
rmp-serde = "1.3"
173
ahash = "0.8.12"
174

175
[dev-dependencies]
176
approx = "0.5"
177
assert_matches = "1.5"
178
criterion = { version = "0.3", features = ["html_reports"] }
179
hf-hub = { workspace = true }
180
181
modelexpress-client = { workspace = true }
modelexpress-common = { workspace = true }
182
proptest = "1.5.0"
183
reqwest = { workspace = true }
184
rstest = "0.18.2"
185
rstest_reuse = "0.7.0"
186
serial_test = "3"
187
temp-env = { version = "0.3.6", features = ["async_closure"] }
188
tempfile = "3.17.1"
Biswa Panda's avatar
Biswa Panda committed
189
190
191
192
193
194
insta = { version = "1.41", features = [
  "glob",
  "json",
  "redactions",
  "filters",
] }
195

196
lazy_static = "1.4"
197
mockito = "1.7.0"
GuanLuo's avatar
GuanLuo committed
198

199
200
201
202
[[bin]]
name = "generate-frontend-openapi"
path = "src/bin/generate_frontend_openapi.rs"

GuanLuo's avatar
GuanLuo committed
203
[build-dependencies]
204
tonic-build = { version = "0.13.1" }
205
206
207
208
209

[[bin]]
name = "bench_local_transfer_v2"
path = "bin/bench_local_transfer_v2.rs"
required-features = ["block-manager-bench"]
210
211
212
213
214
215

[[bench]]
name = "radix_tree_microbench"
path = "benches/radix_tree_microbench.rs"
harness = false
required-features = ["kv-router-stress"]