Cargo.toml 5.2 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

[package]
Neelay Shah's avatar
Neelay Shah committed
17
name = "dynamo-llm"
18
19
20
21
22
version.workspace = true
edition.workspace = true
authors.workspace = true
license.workspace = true
homepage.workspace = true
23
24
25
repository.workspace = true
readme.workspace = true
description = "Dynamo LLM Library"
26

27
[features]
28
default = []
Ryan Olson's avatar
Ryan Olson committed
29
# todo(ops): get this working in CI as a default.
30
31
# default = ["block-manager", "testing-full"]

Ryan Olson's avatar
Ryan Olson committed
32
33
34
testing-full  = ["testing-cuda", "testing-nixl"]
testing-cuda  = ["dep:cudarc"]
testing-nixl  = ["dep:nixl-sys"]
Ryan Olson's avatar
Ryan Olson committed
35
testing-etcd = []
36
block-manager = ["dep:nixl-sys", "dep:cudarc", "dep:ndarray", "dep:nix"]
37
cuda          = ["dep:cudarc"]
38
integration   = ["dynamo-runtime/integration"]
39
40
# NOTE: This feature will be enabled once ModelExpress packages are published
# model-express = ["dep:model_express_client", "dep:model_express_common"]
41

42
43
44
45
[[bench]]
name = "tokenizer"
harness = false

46
47
48
49
[[bench]]
name = "transfer_context_v2"
harness = false
required-features = ["block-manager", "testing-cuda"]
50
51
[dependencies]
# repo
Neelay Shah's avatar
Neelay Shah committed
52
dynamo-runtime = { workspace = true }
53
54

# workspace
Ryan Olson's avatar
Ryan Olson committed
55
aho-corasick = "1.1"
56
anyhow = { workspace = true }
57
dynamo-async-openai = { workspace = true }
58
dynamo-parsers = { workspace = true}
59
60
async-stream = { workspace = true }
async-trait = { workspace = true }
61
async-nats = { workspace = true }
62
async_zmq = { workspace = true }
63
bytes = { workspace = true }
64
chrono = { workspace = true }
65
derive_builder = {workspace = true }
66
either = { workspace = true }
67
etcd-client = { workspace = true }
68
futures =  { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
69
futures-util = "0.3.31"
70
hf-hub = { workspace = true }
71
humantime = { workspace = true } # input/batch
72
rand = { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
73
oneshot = { workspace = true }
74
parking_lot = "0.12.4"
75
prometheus = { workspace = true }
76
serde = { workspace = true }
77
serde_json = { workspace = true }
78
strum = { workspace = true }
79
tempfile = { workspace = true }
80
thiserror = { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
81
tmq = "0.5.0"
82
83
84
85
86
tokio = { workspace = true }
tokio-stream = { workspace = true }
tokio-util = { workspace = true }
tracing = { workspace = true }
validator = { workspace = true }
87
url = { workspace = true }
88
uuid = { workspace = true }
89
xxhash-rust = { workspace = true }
90

91
92
93
94
95
# ModelExpress client for model downloading
# NOTE: These will be uncommented once the packages are published to crates.io
# model_express_client = { version = "0.1.0", optional = true }
# model_express_common = { version = "0.1.0", optional = true }

96
akin = "0.4.0"
97
bitflags = { version = "2.4", features = ["serde"] }
98
blake3 = { version = "1.8", features=["mmap", "rayon"] }
99
bytemuck = "1.22"
100
candle-core = { version = "0.9.1" }
101
derive-getters = "0.5"
102
offset-allocator = "0.2"
103
regex = "1"
104
rayon = "1"
105
dashmap = { version = "5.5.3" }
106

107
108
109
# input/text
dialoguer = { version = "0.11", default-features = false, features = ["editor", "history"] }

Ryan Olson's avatar
Ryan Olson committed
110
# block_manager
111
nixl-sys = {version = "0.4.1", optional = true }
112
cudarc = { version = "0.17.1", features = ["cuda-12020"], optional = true }
113
ndarray = { version = "0.16", optional = true }
114
nix = { version = "0.26", optional = true }
115

116
117
118
119
# protocols
unicode-segmentation = "1.12"

# http-service
120
axum = { workspace = true }
Graham King's avatar
Graham King committed
121
axum-server = { version = "0.7", features = ["tls-rustls"] }
122
tower-http = {workspace = true}
Graham King's avatar
Graham King committed
123
rustls = { version = "0.23" }
124

125

GuanLuo's avatar
GuanLuo committed
126
127
128
129
130
131
132
# grpc-service
# ping version to 0.13.1 so it depends on prost 0.13.5
# which is used across other libraries
tonic = { version = "0.13.1" }
# Request prost specifically so tonic-build properly compiles protobuf message
prost = { version = "0.13.5" }

Biswa Panda's avatar
Biswa Panda committed
133
# tokenizers
134
tokenizers = { version = "0.21.4", default-features = false, features = [
Biswa Panda's avatar
Biswa Panda committed
135
136
  "onig",
  "esaxx_fast",
137
  "rustls-tls",
Biswa Panda's avatar
Biswa Panda committed
138
139
140
141
] }

# backend
galil-seiferas = { version = "0.1" }
142
143
toktrie = { version = "1.1" }
toktrie_hf_tokenizers =  { version = "1.1" }
Biswa Panda's avatar
Biswa Panda committed
144
145
146
147
148

# preprocessor
bs62 = { version = "0.1" }
erased-serde = { version = "0.4" }
itertools = { version = "0.14.0" }
149
150
minijinja = { version = "2.10.2", features = ["loader"] }
minijinja-contrib = { version = "2.10.2", features = ["pycompat"] }
151
json-five = { version = "0.3" }
152

153
154
155
# GGUF
ggus = "0.4.0"
memmap2 = "0.9.5"
156

157
158
159
# Publishers
zeromq = "0.4.1"
rmp-serde = "1.3"
160
ahash = "0.8.12"
161

162
[dev-dependencies]
163
approx = "0.5"
164
assert_matches = "1.5"
165
criterion = { version = "0.3", features = ["html_reports"] }
166
hf-hub = { workspace = true }
167
proptest = "1.5.0"
168
reqwest = { workspace = true }
169
rstest = "0.18.2"
170
rstest_reuse = "0.7.0"
171
serial_test = "3"
172
temp-env = { version = "0.3.6", features = ["async_closure"] }
173
tempfile = "3.17.1"
Biswa Panda's avatar
Biswa Panda committed
174
175
176
177
178
179
insta = { version = "1.41", features = [
  "glob",
  "json",
  "redactions",
  "filters",
] }
180
181
aligned-vec = "0.6.4"
lazy_static = "1.4"
GuanLuo's avatar
GuanLuo committed
182
183

[build-dependencies]
184
tonic-build = { version = "0.13.1"}