Unverified commit cb944d58, authored by Daniel Han, committed by GitHub
Browse files

Allow Unsloth Dynamic 4bit BnB quants to work (#12974)

parent d46d490c
@@ -133,8 +133,16 @@ def is_layer_skipped_bnb(prefix: str, llm_int8_skip_modules: List[str]):
components = prefix.split('.') components = prefix.split('.')
# Check if any of the skip modules exactly matches any component # Check if any of the skip modules exactly matches any component
return any(module_name in components substr_check = any(module_name in components
for module_name in llm_int8_skip_modules) for module_name in llm_int8_skip_modules)
# Allow certain layers to not be quantized
set_components = set(".".join(components[:i + 1])
for i in range(len(components)))
set_llm_int8_skip_modules = set(llm_int8_skip_modules)
prefix_check = len(set_llm_int8_skip_modules & set_components) != 0
return substr_check or prefix_check
class BitsAndBytesLinearMethod(LinearMethodBase): class BitsAndBytesLinearMethod(LinearMethodBase):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment