"vscode:/vscode.git/clone" did not exist on "f0ca0671c70fae6d1562127e3330eeaedf4abb3f"
Unverified commit 5157338e, authored by Jee Jee Li and committed by GitHub
Browse files

[Misc] Improve LoRA spelling (#13831)

parent e206b543
...@@ -13,11 +13,11 @@ from vllm.model_executor.layers.sampler import SamplerOutput ...@@ -13,11 +13,11 @@ from vllm.model_executor.layers.sampler import SamplerOutput
from vllm.sequence import ExecuteModelRequest from vllm.sequence import ExecuteModelRequest
from vllm.worker.neuron_model_runner import NeuronModelRunner from vllm.worker.neuron_model_runner import NeuronModelRunner
from vllm.worker.worker_base import (LocalOrDistributedWorkerBase, from vllm.worker.worker_base import (LocalOrDistributedWorkerBase,
LoraNotSupportedWorkerBase, WorkerBase, LoRANotSupportedWorkerBase, WorkerBase,
WorkerInput) WorkerInput)
class NeuronWorker(LoraNotSupportedWorkerBase, LocalOrDistributedWorkerBase): class NeuronWorker(LoRANotSupportedWorkerBase, LocalOrDistributedWorkerBase):
"""A worker class that executes the model on a group of neuron cores. """A worker class that executes the model on a group of neuron cores.
""" """
......
...@@ -24,7 +24,7 @@ from vllm.sampling_params import SamplingParams ...@@ -24,7 +24,7 @@ from vllm.sampling_params import SamplingParams
from vllm.sequence import ExecuteModelRequest, SequenceGroupMetadata from vllm.sequence import ExecuteModelRequest, SequenceGroupMetadata
from vllm.utils import bind_kv_cache from vllm.utils import bind_kv_cache
from vllm.worker.openvino_model_runner import OpenVINOModelRunner from vllm.worker.openvino_model_runner import OpenVINOModelRunner
from vllm.worker.worker_base import LoraNotSupportedWorkerBase, WorkerBase from vllm.worker.worker_base import LoRANotSupportedWorkerBase, WorkerBase
logger = init_logger(__name__) logger = init_logger(__name__)
...@@ -203,7 +203,7 @@ class OpenVINOCacheEngine: ...@@ -203,7 +203,7 @@ class OpenVINOCacheEngine:
return dtype_size * total return dtype_size * total
class OpenVINOWorker(LoraNotSupportedWorkerBase): class OpenVINOWorker(LoRANotSupportedWorkerBase):
"""A worker class that executes the model on OpenVINO backend. """A worker class that executes the model on OpenVINO backend.
Each worker is associated with a single OpenVINO device. The worker is Each worker is associated with a single OpenVINO device. The worker is
......
...@@ -17,13 +17,13 @@ from vllm.sequence import ExecuteModelRequest ...@@ -17,13 +17,13 @@ from vllm.sequence import ExecuteModelRequest
from vllm.utils import STR_DTYPE_TO_TORCH_DTYPE, bind_kv_cache, get_dtype_size from vllm.utils import STR_DTYPE_TO_TORCH_DTYPE, bind_kv_cache, get_dtype_size
from vllm.worker.tpu_model_runner import ExecutionMode, TPUModelRunner from vllm.worker.tpu_model_runner import ExecutionMode, TPUModelRunner
from vllm.worker.worker_base import (LocalOrDistributedWorkerBase, from vllm.worker.worker_base import (LocalOrDistributedWorkerBase,
LoraNotSupportedWorkerBase, WorkerBase, LoRANotSupportedWorkerBase, WorkerBase,
WorkerInput) WorkerInput)
logger = init_logger(__name__) logger = init_logger(__name__)
class TPUWorker(LoraNotSupportedWorkerBase, LocalOrDistributedWorkerBase): class TPUWorker(LoRANotSupportedWorkerBase, LocalOrDistributedWorkerBase):
def __init__( def __init__(
self, self,
......
...@@ -189,7 +189,7 @@ class DelegateWorkerBase(WorkerBase): ...@@ -189,7 +189,7 @@ class DelegateWorkerBase(WorkerBase):
return getattr(self.worker, attr) return getattr(self.worker, attr)
class LoraNotSupportedWorkerBase(WorkerBase): class LoRANotSupportedWorkerBase(WorkerBase):
"""Partial implementation of WorkerBase that raises exceptions when LoRA """Partial implementation of WorkerBase that raises exceptions when LoRA
methods are invoked. methods are invoked.
""" """
......
...@@ -18,13 +18,13 @@ from vllm.model_executor import set_random_seed ...@@ -18,13 +18,13 @@ from vllm.model_executor import set_random_seed
from vllm.platforms import current_platform from vllm.platforms import current_platform
from vllm.worker.cache_engine import CacheEngine from vllm.worker.cache_engine import CacheEngine
from vllm.worker.worker import Worker from vllm.worker.worker import Worker
from vllm.worker.worker_base import LoraNotSupportedWorkerBase, WorkerBase from vllm.worker.worker_base import LoRANotSupportedWorkerBase, WorkerBase
from vllm.worker.xpu_model_runner import XPUModelRunner from vllm.worker.xpu_model_runner import XPUModelRunner
logger = init_logger(__name__) logger = init_logger(__name__)
class XPUWorker(LoraNotSupportedWorkerBase, Worker): class XPUWorker(LoRANotSupportedWorkerBase, Worker):
"""A worker class that executes (a partition of) the model on a GPU. """A worker class that executes (a partition of) the model on a GPU.
Each worker is associated with a single XPU device. The worker is Each worker is associated with a single XPU device. The worker is
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment