Cargo.toml 4.1 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

[package]
Neelay Shah's avatar
Neelay Shah committed
17
name = "dynamo-llm"
18
19
20
21
22
version.workspace = true
edition.workspace = true
authors.workspace = true
license.workspace = true
homepage.workspace = true
23
24
25
repository.workspace = true
readme.workspace = true
description = "Dynamo LLM Library"
26

27
[features]
28
default = []
Ryan Olson's avatar
Ryan Olson committed
29
# todo(ops): get this working in CI as a default.
30
31
# default = ["block-manager", "testing-full"]

Ryan Olson's avatar
Ryan Olson committed
32
33
34
testing-full  = ["testing-cuda", "testing-nixl"]
testing-cuda  = ["dep:cudarc"]
testing-nixl  = ["dep:nixl-sys"]
Ryan Olson's avatar
Ryan Olson committed
35
testing-etcd = []
36
block-manager = ["dep:nixl-sys", "dep:cudarc", "dep:ndarray", "dep:nix"]
37
cuda          = ["dep:cudarc"]
38
integration = []
39

40
41
42
43
[[bench]]
name = "tokenizer"
harness = false

44
45
[dependencies]
# repo
Neelay Shah's avatar
Neelay Shah committed
46
dynamo-runtime = { workspace = true }
47
48
49

# workspace
anyhow = { workspace = true }
50
dynamo-async-openai = { workspace = true }
51
52
async-stream = { workspace = true }
async-trait = { workspace = true }
53
async-nats = { workspace = true }
54
async_zmq = { workspace = true }
55
bytes = { workspace = true }
56
chrono = { workspace = true }
57
derive_builder = {workspace = true }
58
either = { workspace = true }
59
etcd-client = { workspace = true }
60
futures =  { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
61
futures-util = "0.3.31"
62
hf-hub = { workspace = true }
63
humantime = { workspace = true } # input/batch
64
rand = { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
65
oneshot = { workspace = true }
66
prometheus = { workspace = true }
67
serde = { workspace = true }
68
serde_json = { workspace = true }
69
strum = { workspace = true }
70
tempfile = { workspace = true }
71
thiserror = { workspace = true }
Ryan Olson's avatar
Ryan Olson committed
72
tmq = "0.5.0"
73
74
75
76
77
tokio = { workspace = true }
tokio-stream = { workspace = true }
tokio-util = { workspace = true }
tracing = { workspace = true }
validator = { workspace = true }
78
url = { workspace = true }
79
uuid = { workspace = true }
80
xxhash-rust = { workspace = true }
81

82
akin = "0.4.0"
83
blake3 = "1"
84
bytemuck = "1.22"
85
candle-core = { version = "0.9.1" }
86
derive-getters = "0.5"
87
offset-allocator = "0.2"
88
regex = "1"
89
rayon = "1"
90
dashmap = { version = "5.5.3" }
91

92
93
94
# input/text
dialoguer = { version = "0.11", default-features = false, features = ["editor", "history"] }

Ryan Olson's avatar
Ryan Olson committed
95
# block_manager
96
nixl-sys = {version = "0.4.1", optional = true }
97
cudarc = { version = "0.17.1", features = ["cuda-12020"], optional = true }
98
ndarray = { version = "0.16", optional = true }
99
nix = { version = "0.26", optional = true }
100

101
102
103
104
# protocols
unicode-segmentation = "1.12"

# http-service
105
axum = { workspace = true }
Graham King's avatar
Graham King committed
106
axum-server = { version = "0.7", features = ["tls-rustls"] }
107
tower-http = {workspace = true}
Graham King's avatar
Graham King committed
108
rustls = { version = "0.23" }
109

110

Biswa Panda's avatar
Biswa Panda committed
111
# tokenizers
112
tokenizers = { version = "0.21.4", default-features = false, features = [
Biswa Panda's avatar
Biswa Panda committed
113
114
  "onig",
  "esaxx_fast",
115
  "rustls-tls",
Biswa Panda's avatar
Biswa Panda committed
116
117
118
119
] }

# backend
galil-seiferas = { version = "0.1" }
120
121
toktrie = { version = "1.1" }
toktrie_hf_tokenizers =  { version = "1.1" }
Biswa Panda's avatar
Biswa Panda committed
122
123
124
125
126

# preprocessor
bs62 = { version = "0.1" }
erased-serde = { version = "0.4" }
itertools = { version = "0.14.0" }
127
128
minijinja = { version = "2.10.2", features = ["loader"] }
minijinja-contrib = { version = "2.10.2", features = ["pycompat"] }
129

130
131
132
# GGUF
ggus = "0.4.0"
memmap2 = "0.9.5"
133

134
135
136
# Publishers
zeromq = "0.4.1"
rmp-serde = "1.3"
137
ahash = "0.8.12"
138

139
[dev-dependencies]
140
approx = "0.5"
141
assert_matches = "1.5"
142
criterion = { version = "0.3", features = ["html_reports"] }
143
hf-hub = { workspace = true }
144
proptest = "1.5.0"
145
reqwest = { workspace = true }
146
rstest = "0.18.2"
147
rstest_reuse = "0.7.0"
148
serial_test = "3"
149
tempfile = "3.17.1"
Biswa Panda's avatar
Biswa Panda committed
150
151
152
153
154
155
insta = { version = "1.41", features = [
  "glob",
  "json",
  "redactions",
  "filters",
] }
156
157
aligned-vec = "0.6.4"
lazy_static = "1.4"