[Feature] add CustomOp Decorator for UnquantizedLinearMethod and UnquantizedEmbeddingMethod for vllm_hcu

[Feature] add CustomOp Decorator for UnquantizedLinearMethod and UnquantizedEmbeddingMethod for vllm_hcu

[Feature] add CustomOp Decorator for UnquantizedLinearMethod and...
[Feature] add CustomOp Decorator for UnquantizedLinearMethod and UnquantizedEmbeddingMethod for vllm_hcu
9d774fc5 · zhangzbb · 8680bfdb · 9d774fc5 · 9d774fc5
Commit 9d774fc5 authored Apr 06, 2026 by zhangzbb
Showing 2 changed files with 6 additions and 4 deletions

vllm/model_executor/layers/linear.py +3 -2

vllm/model_executor/layers/vocab_parallel_embedding.py +3 -2

No files found.
--- a/vllm/model_executor/layers/linear.py
+++ b/vllm/model_executor/layers/linear.py
@@ -39,6 +39,7 @@ from vllm.model_executor.parameter import (
 )
 from vllm.model_executor.utils import set_weight_attrs
 from vllm.platforms import current_platform
+from vllm.model_executor.custom_op import CustomOp
 logger = init_logger(__name__)
@@ -178,8 +179,8 @@ class LinearMethodBase(QuantizeMethodBase):
        Expects create_weights to have been called before on the layer."""
        raise NotImplementedError
+@CustomOp.register("unquantized_linear_method")
-class UnquantizedLinearMethod(LinearMethodBase):
+class UnquantizedLinearMethod(LinearMethodBase, CustomOp):
    """Linear method without quantization."""
    def create_weights(

--- a/vllm/model_executor/layers/vocab_parallel_embedding.py
+++ b/vllm/model_executor/layers/vocab_parallel_embedding.py
@@ -24,11 +24,12 @@ from vllm.model_executor.layers.utils import dispatch_unquantized_gemm
 from vllm.model_executor.parameter import BasevLLMParameter
 from vllm.model_executor.utils import set_weight_attrs
 from vllm.platforms import current_platform
+from vllm.model_executor.custom_op import CustomOp
 DEFAULT_VOCAB_PADDING_SIZE = 64
+@CustomOp.register("unquantized_embedding_method")
-class UnquantizedEmbeddingMethod(QuantizeMethodBase):
+class UnquantizedEmbeddingMethod(QuantizeMethodBase, CustomOp):
    """Unquantized method for embeddings."""
    def create_weights(