Unverified commit ba558c02, authored by Tova Movshovitz and committed by GitHub
Browse files

[config] Expose `get_total_num_hidden_layers()` in ModelConfig (#28961)


Signed-off-by: tovam <tovam@pliops.com>
Co-authored-by: Wentao Ye <44945378+yewentao256@users.noreply.github.com>
Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk>
parent 97cfa99d
......@@ -1369,11 +1369,7 @@ class ModelConfig:
# Coerce to 0 if explicitly set to None
return num_experts or 0
def get_layers_start_end_indices(
self, parallel_config: ParallelConfig
) -> tuple[int, int]:
from vllm.distributed.utils import get_pp_indices
def get_total_num_hidden_layers(self) -> int:
if (
self.hf_text_config.model_type == "deepseek_mtp"
or self.hf_config.model_type == "mimo_mtp"
......@@ -1393,6 +1389,15 @@ class ModelConfig:
total_num_hidden_layers = getattr(
self.hf_text_config, "num_hidden_layers", 0
)
return total_num_hidden_layers
def get_layers_start_end_indices(
self, parallel_config: ParallelConfig
) -> tuple[int, int]:
from vllm.distributed.utils import get_pp_indices
total_num_hidden_layers = self.get_total_num_hidden_layers()
# the layout order is: DP x PP x TP
pp_rank = (
parallel_config.rank // parallel_config.tensor_parallel_size
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment