[Docs] Fix warnings in vllm/profiler and vllm/transformers_utils (#25220)

Signed-off-by: windsonsea <haifeng.yao@daocloud.io>

[Docs] Fix warnings in vllm/profiler and vllm/transformers_utils (#25220)
Signed-off-by: windsonsea <haifeng.yao@daocloud.io>
367a480b · Michael Yao · GitHub · bef180f0 · 367a480b · 367a480b
Unverified commit 367a480b, authored Sep 21, 2025 by Michael Yao; committed by GitHub Sep 20, 2025.
Showing 3 changed files with 4 additions and 4 deletions

mkdocs.yaml +1 -0

vllm/profiler/layerwise_profile.py +2 -2

vllm/transformers_utils/configs/jais.py +1 -2

No files found.
--- a/mkdocs.yaml
+++ b/mkdocs.yaml
@@ -102,6 +102,7 @@ plugins:
          - https://numpy.org/doc/stable/objects.inv
          - https://pytorch.org/docs/stable/objects.inv
          - https://psutil.readthedocs.io/en/stable/objects.inv
+          - https://huggingface.co/docs/transformers/main/en/objects.inv

 markdown_extensions:
  - attr_list

--- a/vllm/profiler/layerwise_profile.py
+++ b/vllm/profiler/layerwise_profile.py
@@ -353,8 +353,8 @@ class layerwise_profile(profile):

        Args:
            num_running_seqs (Optional[int], optional): When given,
-            num_running_seqs will be passed to LayerProfileResults for metadata
-            update. Defaults to None.
+                num_running_seqs will be passed to LayerProfileResults
+                for metadata update. Defaults to None.
        """
        super().__init__(
            activities=[ProfilerActivity.CPU, ProfilerActivity.CUDA],

--- a/vllm/transformers_utils/configs/jais.py
+++ b/vllm/transformers_utils/configs/jais.py
@@ -74,8 +74,7 @@ class JAISConfig(PretrainedConfig):
        use_cache (`bool`, *optional*, defaults to `True`):
            Whether or not the model should return the last key/values
            attentions (not used by all models).
-        scale_attn_by_inverse_layer_idx
-            (`bool`, *optional*, defaults to `False`): 
+        scale_attn_by_inverse_layer_idx (`bool`, *optional*, default `True`):
            Whether to additionally scale attention weights 
            by `1 / layer_idx + 1`.
        reorder_and_upcast_attn (`bool`, *optional*, defaults to `False`):