[Model] Adding torch compile annotations to chatglm (#15624)

Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>

[Model] Adding torch compile annotations to chatglm (#15624)
Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>
91276c57 · Jee Jee Li · GitHub · 0b416752 · 91276c57
Unverified commit 91276c57, authored Mar 28, 2025 by Jee Jee Li; committed by GitHub on Mar 28, 2025.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 2 additions and 0 deletions

vllm/model_executor/models/chatglm.py +2 -0

No files found.
--- a/vllm/model_executor/models/chatglm.py
+++ b/vllm/model_executor/models/chatglm.py
@@ -10,6 +10,7 @@ from torch import nn
 from torch.nn import LayerNorm
 from vllm.attention import Attention
+from vllm.compilation.decorators import support_torch_compile
 from vllm.config import CacheConfig, VllmConfig
 from vllm.distributed import get_pp_group, get_tensor_model_parallel_world_size
 from vllm.model_executor.layers.activation import SiluAndMul
@@ -293,6 +294,7 @@ class GLMTransformer(nn.Module):
        return hidden_states
+@support_torch_compile
 class ChatGLMModel(nn.Module):
    def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):