Cargo.toml 3.9 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

Neelay Shah's avatar
Neelay Shah committed
16
17
18
19
20
21
22
23
[workspace.package]
version = "0.2.0"
edition = "2021"
authors = ["NVIDIA"]
license = "Apache-2.0"
homepage = "https://github.com/triton-inference-server/triton_distributed"
repository = "https://github.com/triton-inference-server/triton_distributed"

24
[package]
Neelay Shah's avatar
Neelay Shah committed
25
name = "triton-distributed-llm"
26
27
28
29
30
31
version.workspace = true
edition.workspace = true
authors.workspace = true
license.workspace = true
homepage.workspace = true

32
33
34
35
[features]
mistralrs = ["dep:mistralrs"]
metal = ["mistralrs/metal"]
cuda = ["mistralrs/cuda"]
Biswa Panda's avatar
Biswa Panda committed
36
sentencepiece = ["dep:sentencepiece"]
37

Neelay Shah's avatar
Neelay Shah committed
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
[workspace.dependencies]
# local or crates.io
triton-distributed-runtime = { version = "0.2.0", path = "../runtime" }

# crates.io
anyhow = { version = "1" }
async-stream = { version = "0.3" }
async-trait = { version = "0.1" }
bytes = "1"
derive_builder = "0.20"
futures = "0.3"
serde = { version = "1", features = ["derive"] }
thiserror = { version = "2.0.11" }
tokio = { version = "1", features = ["full"] }
tokio-stream = { version = "0.1" }
tokio-util = { version = "0.7", features = ["codec", "net"] }
tracing = { version = "0.1" }
validator = { version = "0.20.0", features = ["derive"] }
uuid = { version = "1", features = ["v4", "serde"] }
xxhash-rust = { version = "0.8", features = ["xxh3", "const_xxh3"] }
58
strum = { version = "0.27", features = ["derive"] }
Neelay Shah's avatar
Neelay Shah committed
59

60
61
62
[dependencies]

# repo
Neelay Shah's avatar
Neelay Shah committed
63
triton-distributed-runtime = { workspace = true }
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79

# workspace
anyhow = { workspace = true }
async-stream = { workspace = true }
async-trait = { workspace = true }
bytes = { workspace = true }
derive_builder = {workspace = true }
futures =  { workspace = true }
serde = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tokio-stream = { workspace = true }
tokio-util = { workspace = true }
tracing = { workspace = true }
validator = { workspace = true }
uuid = { workspace = true }
80
xxhash-rust = { workspace = true }
81
strum = { workspace = true }
82

83
84
blake3 = "1"

85
# protocols
86
87
88
89
90
91
92
chrono = { version = "0.4", default-features = false, features = [
  "alloc",
  "std",
  "clock",
  "now",
  "serde",
] }
93
94
95
96
97
98
99
100
serde_json = { version = "1" }
regex = "1"
unicode-segmentation = "1.12"

# http-service
axum = "0.8"
prometheus = { version = "0.13" }

101
102
103
# mistralrs
either = { version = "1.13" }
indexmap = { version = "2.6" }
104
mistralrs = { git = "https://github.com/EricLBuehler/mistral.rs.git", rev = "5e689c9", optional = true }
105

Biswa Panda's avatar
Biswa Panda committed
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
# tokenizers
tokenizers = { version = "0.21.0", default-features = false, features = [
  "onig",
  "esaxx_fast",
] }
sentencepiece = { version = "0.11.2", optional = true }

# backend
galil-seiferas = { version = "0.1" }
toktrie = {version = "0.6.28" }
toktrie_hf_tokenizers =  { version = "0.6.28" }

# preprocessor
bs62 = { version = "0.1" }
erased-serde = { version = "0.4" }
itertools = { version = "0.14.0" }
minijinja = { version = "2.3.1", features = ["loader"] }
minijinja-contrib = { version = "2.3.1", features = ["pycompat"] }
semver = { version = "1", features = ["serde"] }

126
127
128
[dev-dependencies]
proptest = "1.5.0"
reqwest = { version = "0.12", default-features = false, features = ["json", "stream", "rustls-tls"] }
129
rstest = "0.18.2"
130
tempfile = "3.17.1"
Biswa Panda's avatar
Biswa Panda committed
131
132
133
134
135
136
137
138
139
140
hf-hub = "0.4.1"
insta = { version = "1.41", features = [
  "glob",
  "json",
  "redactions",
  "filters",
] }

[profile.dev.package]
insta.opt-level = 3