Skip to content

Commit 74e0d35

Browse files
blueyo0 authored and tlrmchlsmth committed
[Qwen2.5] Support bnb quant for Qwen2.5 (vllm-project#9467)
Signed-off-by: Tyler Michael Smith <tyler@neuralmagic.com>
1 parent 9bf0a83 commit 74e0d35

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

vllm/model_executor/models/qwen2.py

+8
Original file line number | Diff line number | Diff line change
@@ -364,6 +364,14 @@ class Qwen2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
364364
]
365365
embedding_modules = {}
366366
embedding_padding_modules = []
367+
bitsandbytes_stacked_params_mapping = {
368+
# shard_name, weight_name, index
369+
"q_proj": ("qkv_proj", 0),
370+
"k_proj": ("qkv_proj", 1),
371+
"v_proj": ("qkv_proj", 2),
372+
"gate_proj": ("gate_up_proj", 0),
373+
"up_proj": ("gate_up_proj", 1),
374+
}
367375

368376
def __init__(
369377
self,

0 commit comments

Comments
 (0)