Skip to content

Commit

Permalink
Allow Unsloth Dynamic 4bit BnB quants to work (vllm-project#12974)
Browse files (browse the repository at this point in the history)
  • Loading branch information
danielhanchen authored and kerthcet committed Feb 21, 2025
1 parent 5743595 commit ab133dc
Showing 1 changed file with 10 additions and 2 deletions.
12 changes: 10 additions & 2 deletions vllm/model_executor/layers/quantization/bitsandbytes.py
Original file line number Diff line number Diff line change
Expand Up @@ -133,8 +133,16 @@ def is_layer_skipped_bnb(prefix: str, llm_int8_skip_modules: List[str]):
components = prefix.split('.')

# Check if any of the skip modules exactly matches any component
return any(module_name in components
for module_name in llm_int8_skip_modules)
substr_check = any(module_name in components
for module_name in llm_int8_skip_modules)

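# Also skip (leave unquantized) a layer when any dotted prefix of its name (e.g. "a", "a.b", "a.b.c") exactly equals an entry in llm_int8_skip_modules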
set_components = set(".".join(components[:i + 1])
for i in range(len(components)))
set_llm_int8_skip_modules = set(llm_int8_skip_modules)
prefix_check = len(set_llm_int8_skip_modules & set_components) != 0

return substr_check or prefix_check


class BitsAndBytesLinearMethod(LinearMethodBase):
Expand Down

0 comments on commit ab133dc

Please sign in to comment.