# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Workspace root. Entries ending in `/*` are globs over the crate directories
# beneath that path; the remaining entries name a single crate each.
[workspace]
members = [
    "components/*",
    "launch/*",
    "lib/llm",
    "lib/runtime",
    "lib/tokens",
    "lib/bindings/c",
    "lib/engines/*",
]
# Set explicitly here in the workspace table; see the Cargo resolver
# documentation for the toolchain version this value requires.
resolver = "3"

# Package metadata defined once for the workspace. Member crates can opt in
# per field with `<field>.workspace = true`.
[workspace.package]
version = "0.1.1"
edition = "2021"
description = "Dynamo Inference Framework"
authors = ["NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"]
license = "Apache-2.0"
homepage = "https://github.com/ai-dynamo/dynamo"
repository = "https://github.com/ai-dynamo/dynamo.git"
keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]

# Dependency versions and features declared once for the whole workspace.
# Member crates reference an entry with `<name> = { workspace = true }`.
[workspace.dependencies]
# Local crates
# The `version` values match the `version` in [workspace.package]; bump them together.
dynamo-runtime = { path = "lib/runtime", version = "0.1.1" }
dynamo-llm = { path = "lib/llm", version = "0.1.1" }
dynamo-tokens = { path = "lib/tokens", version = "0.1.1" }

# External dependencies
anyhow = { version = "1" }
async-nats = { version = "0.40", features = ["service"] }
async-stream = { version = "0.3" }
async-trait = { version = "0.1" }
async_zmq = { version = "0.4.0" }
blake3 = { version = "1" }
bytes = { version = "1" }
chrono = { version = "0.4", default-features = false, features = ["alloc", "std", "clock", "now", "serde"] }
derive_builder = { version = "0.20" }
derive-getters = { version = "0.5" }
either = { version = "1.13", features = ["serde"] }
futures = { version = "0.3" }
hf-hub = { version = "0.4.2", default-features = false, features = ["tokio", "rustls-tls"] }
humantime = { version = "2.2.0" }
prometheus = { version = "0.14" }
rand = { version = "0.9.0" }
serde = { version = "1", features = ["derive"] }
serde_json = { version = "1" }
strum = { version = "0.27", features = ["derive"] }
thiserror = { version = "2.0.11" }
tokio = { version = "1", features = ["full"] }
tokio-stream = { version = "0.1" }
tokio-util = { version = "0.7", features = ["codec", "net"] }
tracing = { version = "0.1" }
tracing-subscriber = { version = "0.3", features = ["env-filter", "local-time", "json"] }
url = { version = "2.5", features = ["serde"] }
uuid = { version = "1", features = ["v4", "serde"] }
validator = { version = "0.20.0", features = ["derive"] }
xxhash-rust = { version = "0.8", features = ["xxh3", "const_xxh3"] }

[profile.dev]
# Release-level optimizations; otherwise everything feels slow.
opt-level = 3

# Per-package override for dev builds. The value currently matches the
# profile-wide `opt-level` above.
# NOTE(review): `insta` is not listed in [workspace.dependencies]; presumably a
# member crate depends on it directly — confirm.
[profile.dev.package]
insta.opt-level = 3

[profile.release]
# These make the build much slower but shrink the binary, and could help
# performance: a single codegen unit plus link-time optimization.
codegen-units = 1
lto = true