Cargo.toml 3.16 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

[package]
Neelay Shah's avatar
Neelay Shah committed
17
name = "dynamo-llm"
18
19
20
21
22
version.workspace = true
edition.workspace = true
authors.workspace = true
license.workspace = true
homepage.workspace = true
23
24
25
repository.workspace = true
readme.workspace = true
description = "Dynamo LLM Library"
26

27
[features]
28
default = []
29
30
31

cuda_kv = ["dep:cudarc", "dep:ndarray"]
sentencepiece = ["dep:sentencepiece"]
32

33
34
[dependencies]
# repo
Neelay Shah's avatar
Neelay Shah committed
35
dynamo-runtime = { workspace = true }
36
37
38
39
40

# workspace
anyhow = { workspace = true }
async-stream = { workspace = true }
async-trait = { workspace = true }
41
async-nats = { workspace = true }
42
async_zmq = { workspace = true }
43
bytes = { workspace = true }
44
chrono = { workspace = true }
45
derive_builder = {workspace = true }
46
either = { workspace = true }
47
futures =  { workspace = true }
48
49
rand = { workspace = true }
prometheus = { workspace = true }
50
serde = { workspace = true }
51
serde_json = { workspace = true }
52
53
54
55
56
57
thiserror = { workspace = true }
tokio = { workspace = true }
tokio-stream = { workspace = true }
tokio-util = { workspace = true }
tracing = { workspace = true }
validator = { workspace = true }
58
url = { workspace = true }
59
uuid = { workspace = true }
60
xxhash-rust = { workspace = true }
61
strum = { workspace = true }
62

63
akin = "0.4.0"
Paul Hendricks's avatar
Paul Hendricks committed
64
async-openai = "0.27.2"
65
blake3 = "1"
66
bytemuck = "1.22"
67
candle-core = { version = "0.8.0" }
68
derive-getters = "0.5"
69
regex = "1"
70
71
72
73
74
rayon = "1"

# kv_cuda
cudarc = { git = "https://github.com/coreylowman/cudarc.git", rev = "8c52e735b55bf8e979e1a16bd85e3dfe4f87c9fe", features = ["cuda-12040"], optional = true }
ndarray = { version = "0.16", optional = true }
75

76
77
78
79
80
81
# protocols
unicode-segmentation = "1.12"

# http-service
axum = "0.8"

Biswa Panda's avatar
Biswa Panda committed
82
# tokenizers
83
tokenizers = { version = "0.21.1", default-features = false, features = [
Biswa Panda's avatar
Biswa Panda committed
84
85
  "onig",
  "esaxx_fast",
86
  "rustls-tls",
Biswa Panda's avatar
Biswa Panda committed
87
88
89
90
91
] }
sentencepiece = { version = "0.11.2", optional = true }

# backend
galil-seiferas = { version = "0.1" }
92
toktrie = { version = "0.6.28" }
Biswa Panda's avatar
Biswa Panda committed
93
94
95
96
97
98
99
100
toktrie_hf_tokenizers =  { version = "0.6.28" }

# preprocessor
bs62 = { version = "0.1" }
erased-serde = { version = "0.4" }
itertools = { version = "0.14.0" }
minijinja = { version = "2.3.1", features = ["loader"] }
minijinja-contrib = { version = "2.3.1", features = ["pycompat"] }
101

102
103
104
# GGUF
ggus = "0.4.0"
memmap2 = "0.9.5"
105

106
[dev-dependencies]
107
hf-hub = { workspace = true }
108
109
proptest = "1.5.0"
reqwest = { version = "0.12", default-features = false, features = ["json", "stream", "rustls-tls"] }
110
rstest = "0.18.2"
111
rstest_reuse = "0.7.0"
112
tempfile = "3.17.1"
Biswa Panda's avatar
Biswa Panda committed
113
114
115
116
117
118
insta = { version = "1.41", features = [
  "glob",
  "json",
  "redactions",
  "filters",
] }