"tools/python/vscode:/vscode.git/clone" did not exist on "6b064d3584358ded2d20282547b236de7045a0dd"
Unverified commit 7eebd440, authored by JieXin Liang and committed by GitHub
Browse files

[fix] fix modelopt fp4 on b200 (#8195)

parent 93d124ef
...@@ -21,6 +21,9 @@ from sglang.srt.layers.quantization.petit_utils import ( ...@@ -21,6 +21,9 @@ from sglang.srt.layers.quantization.petit_utils import (
verify_petit_nvfp4_supported, verify_petit_nvfp4_supported,
) )
from sglang.srt.layers.quantization.utils import is_layer_skipped from sglang.srt.layers.quantization.utils import is_layer_skipped
from sglang.srt.utils import is_hip
_is_hip = is_hip()
# Initialize logger for the module # Initialize logger for the module
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
...@@ -104,7 +107,7 @@ class PetitNvFp4Config(QuantizationConfig): ...@@ -104,7 +107,7 @@ class PetitNvFp4Config(QuantizationConfig):
@classmethod @classmethod
def is_petit_nvfp4_compatible(cls, quant_config: Dict[str, Any]) -> bool: def is_petit_nvfp4_compatible(cls, quant_config: Dict[str, Any]) -> bool:
quant_method = quant_config.get("quant_method", "").lower() quant_method = quant_config.get("quant_method", "").lower()
return quant_method == "modelopt" return _is_hip and quant_method == "modelopt"
def is_layer_excluded(self, prefix: str, exclude_modules: list): def is_layer_excluded(self, prefix: str, exclude_modules: list):
for pattern in exclude_modules: for pattern in exclude_modules:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment