Unverified commit a55caf6a, authored by yugong333, committed by GitHub
Browse files

[LoRA] Support Quantized Adapters (#30286)


Signed-off-by: Yu Gong <yu3.gong@gmail.com>
Signed-off-by: wz1qqx <ziqi.wang@novita.ai>
Signed-off-by: mgoin <mgoin64@gmail.com>
Co-authored-by: wz1qqx <55830058+wz1qqx@users.noreply.github.com>
Co-authored-by: wz1qqx <ziqi.wang@novita.ai>
Co-authored-by: Michael Goin <mgoin64@gmail.com>
Co-authored-by: Jee Jee Li <pandaleefree@gmail.com>
Co-authored-by: Robert Shaw <114415538+robertgshaw2-redhat@users.noreply.github.com>
Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk>
parent 0e22cd61
......@@ -2,6 +2,11 @@
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from vllm.lora.ops.triton_ops.fused_moe_lora_fp8_op import (
fused_moe_lora_expand_fp8,
fused_moe_lora_fp8,
fused_moe_lora_shrink_fp8,
)
from vllm.lora.ops.triton_ops.fused_moe_lora_op import (
fused_moe_lora,
fused_moe_lora_expand,
......@@ -18,4 +23,7 @@ __all__ = [
"fused_moe_lora",
"fused_moe_lora_shrink",
"fused_moe_lora_expand",
"fused_moe_lora_fp8",
"fused_moe_lora_shrink_fp8",
"fused_moe_lora_expand_fp8",
]
This diff is collapsed.
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment