Commit 987ac3d6 authored by Baber
Browse files

nit

parent 41fd08f2
...@@ -111,7 +111,7 @@ def _vllm_mp_worker( ...@@ -111,7 +111,7 @@ def _vllm_mp_worker(
@register_model("vllm") @register_model("vllm")
class VLLM(TemplateLM): class VLLM(TemplateLM):
_DEFAULT_MAX_LENGTH = 2048 _DEFAULT_MAX_LENGTH = 4096
def __init__( def __init__(
self, self,
...@@ -283,14 +283,19 @@ class VLLM(TemplateLM): ...@@ -283,14 +283,19 @@ class VLLM(TemplateLM):
@property @property
def max_length(self): def max_length(self):
return 8096 if self._max_length_internal > 8096 else self._max_length return (
8096
if self._max_length_internal and self._max_length_internal > 8096
else self._max_length
)
@property @property
def _max_length_internal(self): def _max_length_internal(self):
if self._max_length: # if max length manually set, return it if self._max_length: # if max length manually set, return it
return self._max_length return self._max_length
if self.data_parallel_size <= 1: if self.data_parallel_size <= 1:
return self.model.llm_engine.model_config.max_model_len if max_l := self.model.llm_engine.model_config.max_model_len:
return max_l
else: else:
seqlen_config_attrs = ("n_positions", "max_position_embeddings", "n_ctx") seqlen_config_attrs = ("n_positions", "max_position_embeddings", "n_ctx")
for attr in seqlen_config_attrs: for attr in seqlen_config_attrs:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment