Fix refactor error - fp8.py (#5106)

Co-authored-by: Lianmin Zheng <lianminzheng@gmail.com>

Fix refactor error - fp8.py (#5106)
Co-authored-by: Lianmin Zheng <lianminzheng@gmail.com>
81992474 · HAI · GitHub · f04c80dc · 81992474
Unverified commit 81992474, authored by HAI on Apr 07, 2025; committed by GitHub on Apr 07, 2025.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 1 deletion

python/sglang/srt/layers/quantization/fp8.py (+1 -1)

No files found.
--- a/python/sglang/srt/layers/quantization/fp8.py
+++ b/python/sglang/srt/layers/quantization/fp8.py
@@ -860,7 +860,7 @@ class Fp8MoEMethod:
            layer.w13_weight_scale1[expert_id] *= max_w13_scales[expert_id]
            layer.w2_weight_scale1[expert_id] *= layer.w2_weight_scale[expert_id]

-    def process_weights_hip_scale_padding(self, layer: Module, padding_size: int):
+    def process_weights_hip_scale_padding(self, layer: Module):
        from sglang.srt.layers.moe.fused_moe_triton.fused_moe import (
            padding_size,  # Avoid circular import
        )