generate_argparse.py 8.38 KB
Newer Older
1
2
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
3
import importlib
4
5
import logging
import sys
6
import traceback
7
8
9
10
11
from argparse import SUPPRESS, HelpFormatter
from pathlib import Path
from typing import Literal
from unittest.mock import MagicMock, patch

12
13
14
15
from pydantic_core import core_schema

logger = logging.getLogger("mkdocs")

16
17
18
19
ROOT_DIR = Path(__file__).parent.parent.parent.parent
ARGPARSE_DOC_DIR = ROOT_DIR / "docs/argparse"

sys.path.insert(0, str(ROOT_DIR))
20
21
22
23
24
25
26
27
28
29
30
31
32


# Mock custom op code
class MockCustomOp:
    @staticmethod
    def register(name):
        def decorator(cls):
            return cls

        return decorator


noop = lambda *a, **k: None
33
sys.modules["vllm._C"] = MagicMock()
34
35
36
37
38
39
40
41
42
43
sys.modules["vllm.model_executor.custom_op"] = MagicMock(CustomOp=MockCustomOp)
sys.modules["vllm.utils.torch_utils"] = MagicMock(direct_register_custom_op=noop)

# Mock any version checks by reading from compiled CI requirements
with open(ROOT_DIR / "requirements/test.txt") as f:
    VERSIONS = dict(line.strip().split("==") for line in f if "==" in line)
importlib.metadata.version = lambda name: VERSIONS.get(name) or "0.0.0"

# Make torch.nn.Parameter safe to inherit from
sys.modules["torch.nn"] = MagicMock(Parameter=object)
44
45


46
47
48
class PydanticMagicMock(MagicMock):
    """`MagicMock` that's able to generate pydantic-core schemas."""

49
50
51
52
53
    def __init__(self, *args, **kwargs):
        name = kwargs.pop("name", None)
        super().__init__(*args, **kwargs)
        self.__spec__ = importlib.machinery.ModuleSpec(name, None)

54
55
56
57
    def __get_pydantic_core_schema__(self, source_type, handler):
        return core_schema.any_schema()


58
def auto_mock(module, attr, max_mocks=100):
59
60
61
62
63
    """Function that automatically mocks missing modules during imports."""
    logger.info("Importing %s from %s", attr, module)
    for _ in range(max_mocks):
        try:
            # First treat attr as an attr, then as a submodule
64
65
66
67
68
            return getattr(
                importlib.import_module(module),
                attr,
                importlib.import_module(f"{module}.{attr}"),
            )
69
70
        except ModuleNotFoundError as e:
            logger.info("Mocking %s for argparse doc generation", e.name)
71
72
73
            sys.modules[e.name] = PydanticMagicMock(name=e.name)
        except Exception as e:
            logger.warning("Failed to import %s.%s: %s", module, attr, e)
74
75

    raise ImportError(
76
77
        f"Failed to import {module}.{attr} after mocking {max_mocks} imports"
    )
78
79


80
81
82
83
84
85
86
87
bench_latency = auto_mock("vllm.benchmarks", "latency")
bench_serve = auto_mock("vllm.benchmarks", "serve")
bench_sweep_plot = auto_mock("vllm.benchmarks.sweep.plot", "SweepPlotArgs")
bench_sweep_serve = auto_mock("vllm.benchmarks.sweep.serve", "SweepServeArgs")
bench_sweep_serve_sla = auto_mock(
    "vllm.benchmarks.sweep.serve_sla", "SweepServeSLAArgs"
)
bench_throughput = auto_mock("vllm.benchmarks", "throughput")
88
89
90
91
AsyncEngineArgs = auto_mock("vllm.engine.arg_utils", "AsyncEngineArgs")
EngineArgs = auto_mock("vllm.engine.arg_utils", "EngineArgs")
ChatCommand = auto_mock("vllm.entrypoints.cli.openai", "ChatCommand")
CompleteCommand = auto_mock("vllm.entrypoints.cli.openai", "CompleteCommand")
92
93
openai_cli_args = auto_mock("vllm.entrypoints.openai", "cli_args")
openai_run_batch = auto_mock("vllm.entrypoints.openai", "run_batch")
Cyrus Leung's avatar
Cyrus Leung committed
94
95
96
FlexibleArgumentParser = auto_mock(
    "vllm.utils.argparse_utils", "FlexibleArgumentParser"
)
97
98
99
100
101


class MarkdownFormatter(HelpFormatter):
    """Custom formatter that generates markdown for argument groups."""

102
    def __init__(self, prog, starting_heading_level=3):
103
        super().__init__(prog, max_help_position=float("inf"), width=float("inf"))
104
105
        self._section_heading_prefix = "#" * starting_heading_level
        self._argument_heading_prefix = "#" * (starting_heading_level + 1)
106
107
108
109
        self._markdown_output = []

    def start_section(self, heading):
        if heading not in {"positional arguments", "options"}:
110
111
            heading_md = f"\n{self._section_heading_prefix} {heading}\n\n"
            self._markdown_output.append(heading_md)
112
113
114
115
116
117
118
119
120
121
122
123
124

    def end_section(self):
        pass

    def add_text(self, text):
        if text:
            self._markdown_output.append(f"{text.strip()}\n\n")

    def add_usage(self, usage, actions, groups, prefix=None):
        pass

    def add_arguments(self, actions):
        for action in actions:
125
            if len(action.option_strings) == 0 or "--help" in action.option_strings:
126
                continue
127

128
            option_strings = f"`{'`, `'.join(action.option_strings)}`"
129
130
            heading_md = f"{self._argument_heading_prefix} {option_strings}\n\n"
            self._markdown_output.append(heading_md)
131
132

            if choices := action.choices:
133
134
135
136
137
                choices = f"`{'`, `'.join(str(c) for c in choices)}`"
                self._markdown_output.append(f"Possible choices: {choices}\n\n")
            elif (metavar := action.metavar) and isinstance(metavar, (list, tuple)):
                metavar = f"`{'`, `'.join(str(m) for m in metavar)}`"
                self._markdown_output.append(f"Possible choices: {metavar}\n\n")
138

139
140
            if action.help:
                self._markdown_output.append(f"{action.help}\n\n")
141
142

            if (default := action.default) != SUPPRESS:
143
144
145
                # Make empty string defaults visible
                if default == "":
                    default = '""'
146
147
148
149
150
151
152
                self._markdown_output.append(f"Default: `{default}`\n\n")

    def format_help(self):
        """Return the formatted help as markdown."""
        return "".join(self._markdown_output)


153
def create_parser(add_cli_args, **kwargs) -> FlexibleArgumentParser:
154
    """Create a parser for the given class with markdown formatting.
155

156
157
158
159
160
161
162
    Args:
        cls: The class to create a parser for
        **kwargs: Additional keyword arguments to pass to `cls.add_cli_args`.

    Returns:
        FlexibleArgumentParser: A parser with markdown formatting for the class.
    """
163
164
165
166
167
168
169
170
171
172
173
174
175
    try:
        parser = FlexibleArgumentParser(add_json_tip=False)
        parser.formatter_class = MarkdownFormatter
        with patch("vllm.config.DeviceConfig.__post_init__"):
            _parser = add_cli_args(parser, **kwargs)
    except ModuleNotFoundError as e:
        # Auto-mock runtime imports
        if tb_list := traceback.extract_tb(e.__traceback__):
            path = Path(tb_list[-1].filename).relative_to(ROOT_DIR)
            auto_mock(module=".".join(path.parent.parts), attr=path.stem)
            return create_parser(add_cli_args, **kwargs)
        else:
            raise e
176
177
    # add_cli_args might be in-place so return parser if _parser is None
    return _parser or parser
178
179


180
181
182
183
184
185
186
187
188
189
190
def on_startup(command: Literal["build", "gh-deploy", "serve"], dirty: bool):
    logger.info("Generating argparse documentation")
    logger.debug("Root directory: %s", ROOT_DIR.resolve())
    logger.debug("Output directory: %s", ARGPARSE_DOC_DIR.resolve())

    # Create the ARGPARSE_DOC_DIR if it doesn't exist
    if not ARGPARSE_DOC_DIR.exists():
        ARGPARSE_DOC_DIR.mkdir(parents=True)

    # Create parsers to document
    parsers = {
191
        # Engine args
192
193
194
195
        "engine_args": create_parser(EngineArgs.add_cli_args),
        "async_engine_args": create_parser(
            AsyncEngineArgs.add_cli_args, async_args_only=True
        ),
196
197
        # CLI
        "serve": create_parser(openai_cli_args.make_arg_parser),
198
199
        "chat": create_parser(ChatCommand.add_cli_args),
        "complete": create_parser(CompleteCommand.add_cli_args),
200
201
202
203
204
205
206
207
        "run-batch": create_parser(openai_run_batch.make_arg_parser),
        # Benchmark CLI
        "bench_latency": create_parser(bench_latency.add_cli_args),
        "bench_serve": create_parser(bench_serve.add_cli_args),
        "bench_sweep_plot": create_parser(bench_sweep_plot.add_cli_args),
        "bench_sweep_serve": create_parser(bench_sweep_serve.add_cli_args),
        "bench_sweep_serve_sla": create_parser(bench_sweep_serve_sla.add_cli_args),
        "bench_throughput": create_parser(bench_throughput.add_cli_args),
208
209
210
211
212
    }

    # Generate documentation for each parser
    for stem, parser in parsers.items():
        doc_path = ARGPARSE_DOC_DIR / f"{stem}.md"
213
214
        # Specify encoding for building on Windows
        with open(doc_path, "w", encoding="utf-8") as f:
215
            f.write(super(type(parser), parser).format_help())
216
        logger.info("Argparse generated: %s", doc_path.relative_to(ROOT_DIR))
217
218
219
220


if __name__ == "__main__":
    on_startup("build", False)