# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved. # SPDX-License-Identifier: Apache-2.0 # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. [project] name = "ai-dynamo" version = "0.3.2" description = "Distributed Inference Framework" readme = "README.md" authors = [ { name = "NVIDIA Inc.", email = "sw-dl-dynamo@nvidia.com" }, ] license = { text = "Apache-2.0" } license-files = ["LICENSE"] requires-python = ">=3.10" dependencies = [ "ai-dynamo-runtime==0.3.2", "pytest>=8.3.4", "types-psutil>=7.0.0.20250218", "kubernetes>=32.0.1,<33.0.0", "fastapi>=0.115.0", "distro", # filelock: required by planner "filelock", "typer", "circus>=0.19.0", "click<8.2.0", "setuptools", ] classifiers = [ "Development Status :: 4 - Beta", "Intended Audience :: Developers", "Intended Audience :: Science/Research", "Intended Audience :: Information Technology", "License :: OSI Approved :: Apache Software License", "Programming Language :: Python :: 3", "Programming Language :: Python :: 3.10", "Programming Language :: Python :: 3.11", "Programming Language :: Python :: 3.12", "Topic :: Scientific/Engineering", "Topic :: Scientific/Engineering :: Artificial Intelligence", "Operating System :: POSIX :: Linux", ] keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"] [project.urls] Repository = "https://github.com/ai-dynamo/dynamo.git" [project.optional-dependencies] trtllm =[ "uvloop", "tensorrt-llm==1.0.0rc4" ] vllm = [ "uvloop", "nixl", "vllm==0.10.0", ] sglang = [ "uvloop", "nixl", "sglang[runtime_common]==0.4.9.post1", "einops", "sgl-kernel==0.2.4", "sentencepiece", ] llama_cpp = [ "uvloop", "llama-cpp-python", ] [build-system] requires = ["hatchling"] build-backend = "hatchling.build" [tool.hatch.build.targets.wheel] packages = [ "components/frontend/src/dynamo", "components/planner/src/dynamo", "components/backends/llama_cpp/src/dynamo", "components/backends/mocker/src/dynamo", "components/backends/trtllm/src/dynamo", "components/backends/sglang/src/dynamo", "components/backends/vllm/src/dynamo" ] [tool.hatch.metadata] allow-direct-references = true [tool.codespell] # note: pre-commit passes explicit lists of files here, which this skip file list doesn't override - # this is only to allow you to run codespell interactively # this also overrides the grpc_generated folder, since it is generated # Ignore data files and auto-generated files skip = "./.git,./.github,./lib/llm/tests/data,*.lock,*.sum" # ignore allowed words used in code ignore-words-list = "afterall,ser,ende" # use the 'clear' dictionary for unambiguous spelling mistakes builtin = "clear" # use custom dictionary in addition to the built-in one dictionary = "./codespell.txt" # disable warnings about binary files and wrong encoding quiet-level = 3 [tool.isort] profile = "black" use_parentheses = true multi_line_output = 3 include_trailing_comma = true force_grid_wrap = 0 ensure_newline_before_comments = true line_length = 88 balanced_wrapping = true indent = " " skip = ["build"] known_first_party = ["dynamo"] [tool.pytest.ini_options] minversion = "8.0" tmp_path_retention_policy = "failed" # NOTE # We ignore model.py explcitly here to avoid mypy errors with duplicate modules # pytest overrides the default mypy exclude configuration and so we exclude here as well addopts = [ "-ra", "--showlocals", "--strict-markers", "--strict-config", "--mypy", "--ignore-glob=*model.py", "--ignore-glob=*_inc.py", "--ignore-glob=*/llm/tensorrtllm*", "--ignore-glob=docs/*", # FIXME: Get relative/generic blob paths to work here ] xfail_strict = true log_cli_level = "INFO" filterwarnings = [ "error", "ignore:.*cuda*:DeprecationWarning", # Need this to avoid deprecation warnings from CUDA in tensorrt_llm. "ignore:.*pkg_resources.*:DeprecationWarning", "ignore:.*pkg_resources.*:UserWarning", "ignore:.*multipart.*:PendingDeprecationWarning", "ignore:.*PyType_Spec.*custom tp_new.*:DeprecationWarning", # Ignore protobuf deprecation warning "ignore:.*unclosed.*socket.*:ResourceWarning", # Ignore unclosed socket warnings "ignore:.*unclosed event loop.*:ResourceWarning", # Ignore unclosed event loop warnings "ignore:.*Exception ignored in.*:pytest.PytestUnraisableExceptionWarning", # Ignore unraisable exception warnings ] # NOTE: Can also manually mark tests with @pytest.mark.asyncio asyncio_mode = "auto" markers = [ "pre_merge: marks tests to run before merging", "nightly: marks tests to run nightly", "weekly: marks tests to run weekly", "gpu_1: marks tests to run on GPU", "gpu_2: marks tests to run on 2GPUs", "gpu_4: marks tests to run on 4GPUs", "gpu_8: marks tests to run on 8GPUs", "e2e: marks tests as end-to-end tests", "integration: marks tests as integration tests", "unit: marks tests as unit tests", "stress: marks tests as stress tests", "vllm: marks tests as requiring vllm", "tensorrtllm: marks tests as requiring tensorrtllm", "sglang: marks tests as requiring sglang", "slow: marks tests as known to be slow" ] # Linting/formatting [tool.ruff] # Same as Black. line-length = 88 indent-width = 4 [tool.ruff.lint.extend-per-file-ignores] "icp/tests/**/test_*.py" = ["F811", "F401"] "*_inc.py" = ["F821"] [tool.mypy] # --disable-error-code: WAR large set of errors due to mypy not being run # previously. We can slowly enable sets of errors to fix over time. # disable_error_code = [] # --explicit-package-bases: WAR errors about duplicate module names used # throughout the llm examples. For example, the common module in # tensorrt_llm and vllm are both named common. explicit_package_bases = true # --ignore-missing-imports: WAR too many errors when developing outside # of container environment with PYTHONPATH set and packages installed. # NOTE: Can possibly move mypy from pre-commit to a github action run only in # a container with the expected environment and PYTHONPATH setup. ignore_missing_imports = true check_untyped_defs = true [[tool.mypy.overrides]] # Skip mypy analysis on internal dependencies of vllm module = ["vllm.*"] follow_imports = "skip" ignore_missing_imports = true [tool.sphinx] # extra-content-head extra_content_head = [ ''' ''', ] #extra-content-footer extra_content_footer = [ ''' ''', ]