# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0

[workspace]
# Crate directories (and glob patterns over crate directories) that make up
# this workspace.
members = [
    "components/metrics",
    "launch/*",
    "lib/llm",
    "lib/runtime",
    "lib/tokens",
    "lib/async-openai",
    "lib/parsers",
    "lib/bindings/c",
    "lib/engines/*",
]
resolver = "3"

# Package metadata that member crates can inherit with `<key>.workspace = true`.
[workspace.package]
version = "0.4.1"
edition = "2024"
description = "Dynamo Inference Framework"
authors = ["NVIDIA Inc. <sw-dl-dynamo@nvidia.com>"]
license = "Apache-2.0"
homepage = "https://github.com/ai-dynamo/dynamo"
repository = "https://github.com/ai-dynamo/dynamo.git"
keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]

# Dependency versions shared across the workspace; member crates opt in with
# `<dep>.workspace = true`.
[workspace.dependencies]
# Local crates
# Each entry carries both a `path` and a `version`; the versions listed here
# are all "0.4.1".
dynamo-runtime = { path = "lib/runtime", version = "0.4.1" }
dynamo-llm = { path = "lib/llm", version = "0.4.1" }
dynamo-tokens = { path = "lib/tokens", version = "0.4.1" }
dynamo-async-openai = { path = "lib/async-openai", version = "0.4.1", features = ["byot", "rustls"] }
dynamo-parsers = { path = "lib/parsers", version = "0.4.1" }

# External dependencies
anyhow = { version = "1" }
async-nats = { version = "0.40", features = ["service"] }
async-stream = { version = "0.3" }
async-trait = { version = "0.1" }
async_zmq = { version = "0.4.0" }
axum = { version = "0.8", features = ["macros"] }
blake3 = { version = "1" }
bytes = { version = "1" }
chrono = { version = "0.4", default-features = false, features = ["alloc", "std", "clock", "now", "serde"] }
derive_builder = { version = "0.20" }
derive-getters = { version = "0.5" }
either = { version = "1.13", features = ["serde"] }
etcd-client = { version = "0.16", features = ["tls"] }
futures = { version = "0.3" }
hf-hub = { version = "0.4.2", default-features = false, features = ["tokio", "rustls-tls", "ureq"] }
humantime = { version = "2.2.0" }
libc = { version = "0.2" }
oneshot = { version = "0.1.11", features = ["std", "async"] }
prometheus = { version = "0.14" }
rand = { version = "0.9.0" }
reqwest = { version = "0.12.22", default-features = false, features = ["json", "stream", "rustls-tls"] }
serde = { version = "1", features = ["derive"] }
serde_json = { version = "1" }
strum = { version = "0.27", features = ["derive"] }
tempfile = "3"
thiserror = { version = "2.0.11" }
tokio = { version = "1", features = ["full"] }
tokio-stream = { version = "0.1" }
tokio-util = { version = "0.7", features = ["codec", "net", "rt"] }
tower-http = { version = "0.6", features = ["trace"] }
tracing = { version = "0.1" }
tracing-subscriber = { version = "0.3", features = ["env-filter", "local-time", "json"] }
url = { version = "2.5", features = ["serde"] }
uuid = { version = "1.17", features = ["v4", "serde"] }
validator = { version = "0.20.0", features = ["derive"] }
xxhash-rust = { version = "0.8", features = ["xxh3", "const_xxh3"] }

[profile.dev]
# release level optimizations otherwise everything feels slow
opt-level = 3

# Per-package override applied within the dev profile.
[profile.dev.package]
insta.opt-level = 3

[profile.release]
# These make the build much slower but shrink the binary, and could help performance
codegen-units = 1
lto = true