Unverified commit 2f99f2f5, authored by Harry Mellor, committed by GitHub
Browse files

Tidy `vllm/config/__init__.py` to only add classes and functions (#26405)


Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
parent 338b1bf0
...@@ -15,7 +15,7 @@ from typing import Literal, NamedTuple, Optional ...@@ -15,7 +15,7 @@ from typing import Literal, NamedTuple, Optional
import pytest import pytest
from vllm.config import RunnerOption from vllm.config.model import RunnerOption
from vllm.logger import init_logger from vllm.logger import init_logger
from ..models.registry import HF_EXAMPLE_MODELS from ..models.registry import HF_EXAMPLE_MODELS
......
...@@ -6,7 +6,7 @@ from typing import Literal, NamedTuple, Optional ...@@ -6,7 +6,7 @@ from typing import Literal, NamedTuple, Optional
import pytest import pytest
from vllm.config import RunnerOption from vllm.config.model import RunnerOption
from vllm.logger import init_logger from vllm.logger import init_logger
from ..utils import compare_two_settings, create_new_process_for_each_test from ..utils import compare_two_settings, create_new_process_for_each_test
......
...@@ -15,7 +15,7 @@ from typing import Literal, NamedTuple, Optional ...@@ -15,7 +15,7 @@ from typing import Literal, NamedTuple, Optional
import pytest import pytest
from vllm.config import RunnerOption from vllm.config.model import RunnerOption
from vllm.logger import init_logger from vllm.logger import init_logger
from ..models.registry import HF_EXAMPLE_MODELS from ..models.registry import HF_EXAMPLE_MODELS
......
...@@ -7,7 +7,7 @@ from typing import Any, Callable, Optional ...@@ -7,7 +7,7 @@ from typing import Any, Callable, Optional
import torch import torch
from transformers.models.auto.auto_factory import _BaseAutoModelClass from transformers.models.auto.auto_factory import _BaseAutoModelClass
from vllm.config import RunnerOption from vllm.config.model import RunnerOption
from vllm.transformers_utils.tokenizer import AnyTokenizer from vllm.transformers_utils.tokenizer import AnyTokenizer
from .....conftest import HfRunner, VllmRunner from .....conftest import HfRunner, VllmRunner
......
...@@ -12,7 +12,7 @@ from pytest import MarkDecorator ...@@ -12,7 +12,7 @@ from pytest import MarkDecorator
from transformers import AutoModelForCausalLM from transformers import AutoModelForCausalLM
from transformers.models.auto.auto_factory import _BaseAutoModelClass from transformers.models.auto.auto_factory import _BaseAutoModelClass
from vllm.config import RunnerOption from vllm.config.model import RunnerOption
from vllm.logprobs import SampleLogprobs from vllm.logprobs import SampleLogprobs
from vllm.transformers_utils.tokenizer import AnyTokenizer from vllm.transformers_utils.tokenizer import AnyTokenizer
......
...@@ -10,7 +10,7 @@ import torch ...@@ -10,7 +10,7 @@ import torch
from packaging.version import Version from packaging.version import Version
from transformers import __version__ as TRANSFORMERS_VERSION from transformers import __version__ as TRANSFORMERS_VERSION
from vllm.config import ModelDType, TokenizerMode from vllm.config.model import ModelDType, TokenizerMode
@dataclass(frozen=True) @dataclass(frozen=True)
......
...@@ -10,7 +10,7 @@ import torch ...@@ -10,7 +10,7 @@ import torch
import torch.nn.functional as F import torch.nn.functional as F
from transformers import PretrainedConfig from transformers import PretrainedConfig
from vllm.config import ModelConfig, ModelDType, RunnerOption from vllm.config.model import ModelConfig, ModelDType, RunnerOption
from vllm.logprobs import Logprob, PromptLogprobs, SampleLogprobs from vllm.logprobs import Logprob, PromptLogprobs, SampleLogprobs
from vllm.multimodal.processing import InputProcessingContext from vllm.multimodal.processing import InputProcessingContext
from vllm.transformers_utils.tokenizer import cached_tokenizer_from_config from vllm.transformers_utils.tokenizer import cached_tokenizer_from_config
......
...@@ -15,11 +15,11 @@ from vllm.config import ( ...@@ -15,11 +15,11 @@ from vllm.config import (
DeviceConfig, DeviceConfig,
LoadConfig, LoadConfig,
ModelConfig, ModelConfig,
ModelDType,
ParallelConfig, ParallelConfig,
SchedulerConfig, SchedulerConfig,
VllmConfig, VllmConfig,
) )
from vllm.config.model import ModelDType
from vllm.platforms import current_platform from vllm.platforms import current_platform
from vllm.utils import resolve_obj_by_qualname from vllm.utils import resolve_obj_by_qualname
from vllm.v1.attention.backends.utils import CommonAttentionMetadata from vllm.v1.attention.backends.utils import CommonAttentionMetadata
......
...@@ -29,7 +29,7 @@ from vllm.sampling_params import ( ...@@ -29,7 +29,7 @@ from vllm.sampling_params import (
) )
if TYPE_CHECKING: if TYPE_CHECKING:
from vllm.config import TokenizerMode from vllm.config.model import TokenizerMode
NGRAM_SPEC_CONFIG = { NGRAM_SPEC_CONFIG = {
"model": "[ngram]", "model": "[ngram]",
......
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
import pytest import pytest
import ray import ray
from vllm.config import ModelDType from vllm.config.model import ModelDType
from vllm.sampling_params import SamplingParams from vllm.sampling_params import SamplingParams
from vllm.v1.engine.async_llm import AsyncEngineArgs, AsyncLLM from vllm.v1.engine.async_llm import AsyncEngineArgs, AsyncLLM
from vllm.v1.metrics.ray_wrappers import RayPrometheusMetric, RayPrometheusStatLogger from vllm.v1.metrics.ray_wrappers import RayPrometheusMetric, RayPrometheusStatLogger
......
...@@ -16,7 +16,7 @@ from tests.v1.sample.utils import ( ...@@ -16,7 +16,7 @@ from tests.v1.sample.utils import (
get_test_batch, get_test_batch,
) )
from vllm import SamplingParams from vllm import SamplingParams
from vllm.config import LogprobsMode from vllm.config.model import LogprobsMode
from ...conftest import HfRunner, VllmRunner from ...conftest import HfRunner, VllmRunner
......
# SPDX-License-Identifier: Apache-2.0 # SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project # SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from vllm.config.cache import ( from vllm.config.cache import CacheConfig
BlockSize,
CacheConfig,
CacheDType,
MambaDType,
PrefixCachingHashAlgo,
)
from vllm.config.compilation import ( from vllm.config.compilation import (
CompilationConfig, CompilationConfig,
CompilationLevel, CompilationLevel,
CUDAGraphMode, CUDAGraphMode,
PassConfig, PassConfig,
) )
from vllm.config.device import Device, DeviceConfig from vllm.config.device import DeviceConfig
from vllm.config.kv_events import KVEventsConfig from vllm.config.kv_events import KVEventsConfig
from vllm.config.kv_transfer import KVTransferConfig from vllm.config.kv_transfer import KVTransferConfig
from vllm.config.load import LoadConfig from vllm.config.load import LoadConfig
from vllm.config.lora import LoRAConfig from vllm.config.lora import LoRAConfig
from vllm.config.model import ( from vllm.config.model import (
ConvertOption,
HfOverrides,
LogprobsMode,
ModelConfig, ModelConfig,
ModelDType,
ModelImpl,
RunnerOption,
TaskOption,
TokenizerMode,
iter_architecture_defaults, iter_architecture_defaults,
try_match_architecture_defaults, try_match_architecture_defaults,
) )
from vllm.config.multimodal import MMCacheType, MMEncoderTPMode, MultiModalConfig from vllm.config.multimodal import MultiModalConfig
from vllm.config.observability import DetailedTraceModules, ObservabilityConfig from vllm.config.observability import ObservabilityConfig
from vllm.config.parallel import DistributedExecutorBackend, EPLBConfig, ParallelConfig from vllm.config.parallel import EPLBConfig, ParallelConfig
from vllm.config.pooler import PoolerConfig from vllm.config.pooler import PoolerConfig
from vllm.config.scheduler import RunnerType, SchedulerConfig, SchedulerPolicy from vllm.config.scheduler import SchedulerConfig
from vllm.config.speculative import SpeculativeConfig from vllm.config.speculative import SpeculativeConfig
from vllm.config.speech_to_text import SpeechToTextConfig from vllm.config.speech_to_text import SpeechToTextConfig
from vllm.config.structured_outputs import StructuredOutputsConfig from vllm.config.structured_outputs import StructuredOutputsConfig
...@@ -56,20 +42,17 @@ from vllm.config.vllm import ( ...@@ -56,20 +42,17 @@ from vllm.config.vllm import (
set_current_vllm_config, set_current_vllm_config,
) )
# __all__ should only contain classes and functions.
# Types and globals should be imported from their respective modules.
__all__ = [ __all__ = [
# From vllm.config.cache # From vllm.config.cache
"BlockSize",
"CacheConfig", "CacheConfig",
"CacheDType",
"MambaDType",
"PrefixCachingHashAlgo",
# From vllm.config.compilation # From vllm.config.compilation
"CompilationConfig", "CompilationConfig",
"CompilationLevel", "CompilationLevel",
"CUDAGraphMode", "CUDAGraphMode",
"PassConfig", "PassConfig",
# From vllm.config.device # From vllm.config.device
"Device",
"DeviceConfig", "DeviceConfig",
# From vllm.config.kv_events # From vllm.config.kv_events
"KVEventsConfig", "KVEventsConfig",
...@@ -80,34 +63,20 @@ __all__ = [ ...@@ -80,34 +63,20 @@ __all__ = [
# From vllm.config.lora # From vllm.config.lora
"LoRAConfig", "LoRAConfig",
# From vllm.config.model # From vllm.config.model
"ConvertOption",
"HfOverrides",
"LogprobsMode",
"ModelConfig", "ModelConfig",
"ModelDType",
"ModelImpl",
"RunnerOption",
"TaskOption",
"TokenizerMode",
"iter_architecture_defaults", "iter_architecture_defaults",
"try_match_architecture_defaults", "try_match_architecture_defaults",
# From vllm.config.multimodal # From vllm.config.multimodal
"MMCacheType",
"MMEncoderTPMode",
"MultiModalConfig", "MultiModalConfig",
# From vllm.config.observability # From vllm.config.observability
"DetailedTraceModules",
"ObservabilityConfig", "ObservabilityConfig",
# From vllm.config.parallel # From vllm.config.parallel
"DistributedExecutorBackend",
"EPLBConfig", "EPLBConfig",
"ParallelConfig", "ParallelConfig",
# From vllm.config.pooler # From vllm.config.pooler
"PoolerConfig", "PoolerConfig",
# From vllm.config.scheduler # From vllm.config.scheduler
"RunnerType",
"SchedulerConfig", "SchedulerConfig",
"SchedulerPolicy",
# From vllm.config.speculative # From vllm.config.speculative
"SpeculativeConfig", "SpeculativeConfig",
# From vllm.config.speech_to_text # From vllm.config.speech_to_text
......
...@@ -31,43 +31,41 @@ from typing_extensions import TypeIs, deprecated ...@@ -31,43 +31,41 @@ from typing_extensions import TypeIs, deprecated
import vllm.envs as envs import vllm.envs as envs
from vllm.config import ( from vllm.config import (
BlockSize,
CacheConfig, CacheConfig,
CacheDType,
CompilationConfig, CompilationConfig,
ConfigType, ConfigType,
ConvertOption,
DetailedTraceModules,
Device,
DeviceConfig, DeviceConfig,
DistributedExecutorBackend,
EPLBConfig, EPLBConfig,
HfOverrides,
KVEventsConfig, KVEventsConfig,
KVTransferConfig, KVTransferConfig,
LoadConfig, LoadConfig,
LogprobsMode,
LoRAConfig, LoRAConfig,
MambaDType,
MMEncoderTPMode,
ModelConfig, ModelConfig,
ModelDType, MultiModalConfig,
ObservabilityConfig, ObservabilityConfig,
ParallelConfig, ParallelConfig,
PoolerConfig, PoolerConfig,
PrefixCachingHashAlgo,
RunnerOption,
SchedulerConfig, SchedulerConfig,
SchedulerPolicy,
SpeculativeConfig, SpeculativeConfig,
StructuredOutputsConfig, StructuredOutputsConfig,
TaskOption,
TokenizerMode,
VllmConfig, VllmConfig,
get_attr_docs, get_attr_docs,
) )
from vllm.config.multimodal import MMCacheType, MultiModalConfig from vllm.config.cache import BlockSize, CacheDType, MambaDType, PrefixCachingHashAlgo
from vllm.config.parallel import ExpertPlacementStrategy from vllm.config.device import Device
from vllm.config.model import (
ConvertOption,
HfOverrides,
LogprobsMode,
ModelDType,
RunnerOption,
TaskOption,
TokenizerMode,
)
from vllm.config.multimodal import MMCacheType, MMEncoderTPMode
from vllm.config.observability import DetailedTraceModules
from vllm.config.parallel import DistributedExecutorBackend, ExpertPlacementStrategy
from vllm.config.scheduler import SchedulerPolicy
from vllm.config.utils import get_field from vllm.config.utils import get_field
from vllm.logger import init_logger from vllm.logger import init_logger
from vllm.platforms import CpuArchEnum, current_platform from vllm.platforms import CpuArchEnum, current_platform
......
...@@ -19,18 +19,18 @@ from vllm.beam_search import ( ...@@ -19,18 +19,18 @@ from vllm.beam_search import (
) )
from vllm.config import ( from vllm.config import (
CompilationConfig, CompilationConfig,
ModelDType, PoolerConfig,
StructuredOutputsConfig, StructuredOutputsConfig,
TokenizerMode,
is_init_field, is_init_field,
) )
from vllm.engine.arg_utils import ( from vllm.config.model import (
ConvertOption, ConvertOption,
EngineArgs,
HfOverrides, HfOverrides,
PoolerConfig, ModelDType,
RunnerOption, RunnerOption,
TokenizerMode,
) )
from vllm.engine.arg_utils import EngineArgs
from vllm.entrypoints.chat_utils import ( from vllm.entrypoints.chat_utils import (
ChatCompletionMessageParam, ChatCompletionMessageParam,
ChatTemplateContentFormatOption, ChatTemplateContentFormatOption,
......
...@@ -4,7 +4,8 @@ from typing import Union ...@@ -4,7 +4,8 @@ from typing import Union
import torch import torch
from vllm.config import MambaDType, ModelDType from vllm.config.cache import MambaDType
from vllm.config.model import ModelDType
from vllm.distributed import divide from vllm.distributed import divide
from vllm.utils import STR_DTYPE_TO_TORCH_DTYPE, get_kv_cache_torch_dtype from vllm.utils import STR_DTYPE_TO_TORCH_DTYPE, get_kv_cache_torch_dtype
......
...@@ -15,7 +15,8 @@ from .interface import Platform, PlatformEnum ...@@ -15,7 +15,8 @@ from .interface import Platform, PlatformEnum
if TYPE_CHECKING: if TYPE_CHECKING:
from vllm.attention.backends.registry import _Backend from vllm.attention.backends.registry import _Backend
from vllm.config import BlockSize, ModelConfig, VllmConfig from vllm.config import ModelConfig, VllmConfig
from vllm.config.cache import BlockSize
from vllm.pooling_params import PoolingParams from vllm.pooling_params import PoolingParams
else: else:
BlockSize = None BlockSize = None
......
...@@ -8,7 +8,7 @@ import torch.nn as nn ...@@ -8,7 +8,7 @@ import torch.nn as nn
from packaging import version from packaging import version
from vllm import envs from vllm import envs
from vllm.config import LogprobsMode from vllm.config.model import LogprobsMode
from vllm.logger import init_logger from vllm.logger import init_logger
from vllm.platforms import current_platform from vllm.platforms import current_platform
......
...@@ -7,7 +7,7 @@ from typing import Optional ...@@ -7,7 +7,7 @@ from typing import Optional
import torch import torch
import torch.nn as nn import torch.nn as nn
from vllm.config import LogprobsMode from vllm.config.model import LogprobsMode
from vllm.utils import is_pin_memory_available from vllm.utils import is_pin_memory_available
from vllm.v1.outputs import LogprobsTensors, SamplerOutput from vllm.v1.outputs import LogprobsTensors, SamplerOutput
from vllm.v1.sample.metadata import SamplingMetadata from vllm.v1.sample.metadata import SamplingMetadata
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment