Commit cb944d58 (unverified), authored by Daniel Han, committed by GitHub
Browse files

Allow Unsloth Dynamic 4bit BnB quants to work (#12974)

parent d46d490c
def is_layer_skipped_bnb(prefix: str,
                         llm_int8_skip_modules: List[str]) -> bool:
    """Return True if the layer named by ``prefix`` should not be quantized.

    A layer is skipped when either of the following holds:

    * any single dot-separated component of ``prefix`` is exactly equal to
      an entry of ``llm_int8_skip_modules`` (e.g. ``"mlp"`` matches
      ``"model.layers.0.mlp.gate_proj"``), or
    * any leading dotted prefix of ``prefix`` (``"model"``,
      ``"model.layers"``, ``"model.layers.0"``, ...) is exactly equal to an
      entry, which lets fully qualified module paths be listed.

    Args:
        prefix: Dotted module path of the layer being considered.
        llm_int8_skip_modules: Module names or dotted module paths to skip.

    Returns:
        Whether the layer matches any skip entry.
    """
    components = prefix.split('.')
    skip_modules = set(llm_int8_skip_modules)

    # Check if any of the skip modules exactly matches any component
    if not skip_modules.isdisjoint(components):
        return True

    # Allow certain layers to not be quantized: entries may also be full
    # dotted paths, so compare them against every cumulative prefix of the
    # layer name. Only whole-path equality counts, so "model.layers.1" does
    # not match "model.layers.10".
    dotted_prefixes = (".".join(components[:end])
                       for end in range(1, len(components) + 1))
    return any(path in skip_modules for path in dotted_prefixes)
class BitsAndBytesLinearMethod(LinearMethodBase):
"""Linear method for BitsAndBytes.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment