Commit b6553be1 (unverified), authored by Jee Jee Li, committed by GitHub
Browse files

[Misc] Slight improvement of the BNB (#19418)


Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>
Co-authored-by: Isotr0py <2037008807@qq.com>
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
parent 64a9af5a
...@@ -71,9 +71,7 @@ class BitsAndBytesConfig(QuantizationConfig): ...@@ -71,9 +71,7 @@ class BitsAndBytesConfig(QuantizationConfig):
@staticmethod @staticmethod
def get_config_filenames() -> list[str]: def get_config_filenames() -> list[str]:
return [ return []
"adapter_config.json",
]
@classmethod @classmethod
def from_config(cls, config: dict[str, Any]) -> "BitsAndBytesConfig": def from_config(cls, config: dict[str, Any]) -> "BitsAndBytesConfig":
......
...@@ -392,7 +392,8 @@ class BitsAndBytesModelLoader(BaseModelLoader): ...@@ -392,7 +392,8 @@ class BitsAndBytesModelLoader(BaseModelLoader):
def _get_bnb_target_modules(self, model: nn.Module) -> None: def _get_bnb_target_modules(self, model: nn.Module) -> None:
for name, module in model.named_modules(): for name, module in model.named_modules():
if isinstance(module, (LinearBase, )): if (isinstance(module, LinearBase) and
hasattr(module.quant_method, "quant_config")):
if modules_info := self.modules_mapping.get_sub_modules(name): if modules_info := self.modules_mapping.get_sub_modules(name):
# Map vllm's names to transformers's names. # Map vllm's names to transformers's names.
rep_name, sub_modules = modules_info rep_name, sub_modules = modules_info
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment