"""vLLM: a high-throughput and memory-efficient inference engine for LLMs"""

from vllm.engine.arg_utils import AsyncEngineArgs, EngineArgs
from vllm.engine.async_llm_engine import AsyncLLMEngine
from vllm.engine.llm_engine import LLMEngine
from vllm.entrypoints.llm import LLM
from vllm.executor.ray_utils import initialize_ray_cluster
from vllm.model_executor.models import ModelRegistry
from vllm.outputs import CompletionOutput, RequestOutput
from vllm.sampling_params import SamplingParams
from vllm.version import __dcu_version__

# Version string of this package.
__version__ = "0.4.2"

# Names exported by a star-import of this package. Every entry is bound by
# one of the import statements at the top of this module.
__all__ = [
    "LLM",
    "ModelRegistry",
    "SamplingParams",
    "RequestOutput",
    "CompletionOutput",
    "LLMEngine",
    "EngineArgs",
    "AsyncLLMEngine",
    "AsyncEngineArgs",
    "initialize_ray_cluster",
]