We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 96e0c9c, commit 37a4947 (Copy full SHA for 37a4947)
vllm/model_executor/layers/quantization/bitsandbytes.py
@@ -119,7 +119,12 @@ def get_scaled_act_names(self) -> List[str]:
119
120
121
def is_layer_skipped_bnb(prefix: str, llm_int8_skip_modules: List[str]):
    """Return True if the layer named by ``prefix`` matches a skip entry.

    ``prefix`` is split on ``.`` into components. A skip entry matches only
    when it lines up with whole components, never with a fragment of one:
    ``"mlp"`` matches ``"model.layers.0.mlp.gate_proj"`` while ``"gate"``
    does not.

    Entries that themselves contain dots (for example ``"model.vision"``)
    are matched as a contiguous run of components. Comparing such an entry
    against single components could never succeed, so dotted entries would
    otherwise be silently ignored.

    Args:
        prefix: Dot-separated name of the layer being checked.
        llm_int8_skip_modules: Module names to skip. ``None`` or an empty
            list means nothing is skipped.

    Returns:
        True if any skip entry matches ``prefix`` on component boundaries,
        otherwise False.
    """
    # Tolerate a missing/empty skip list instead of failing on iteration.
    if not llm_int8_skip_modules:
        return False

    # Split the prefix into its dot-separated components.
    components = prefix.split('.')
    total = len(components)

    for module_name in llm_int8_skip_modules:
        wanted = module_name.split('.')
        width = len(wanted)
        # Slide a window of the entry's width across the prefix. For an
        # undotted entry (width 1) this is exactly `module_name in
        # components`. When the entry is longer than the prefix the range
        # is empty, so nothing matches.
        if any(components[start:start + width] == wanted
               for start in range(total - width + 1)):
            return True

    return False
128
129
130
class BitsAndBytesLinearMethod(LinearMethodBase):
0 commit comments