Skip to content

Commit 068e672

Browse files
LucasWilkinson and mgoin committed
Update utils.py
Co-authored-by: Michael Goin <mgoin64@gmail.com>
Signed-off-by: Lucas Wilkinson <lwilkinson@neuralmagic.com>
1 parent f2cac91 commit 068e672

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

vllm/attention/backends/mla/utils.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -231,15 +231,15 @@ def process_weights_after_loading(self):
231231
.flatten(start_dim=0, end_dim=1).contiguous()
232232

233233
tp_size = get_tensor_model_parallel_world_size()
234-
self.o_proj_absored = RowParallelLinear(
234+
self.o_proj_absorbed = RowParallelLinear(
235235
self.W_UV_O.shape[0] * tp_size,
236236
self.W_UV_O.shape[1],
237237
bias=False,
238238
# TODO(lucas) figure out how to properly forward quant_method
239239
#quant_config=self.o_proj.quant_method,
240240
)
241241

242-
self.o_proj_absored.weight = torch.nn.Parameter(self.W_UV_O.T)
242+
self.o_proj_absorbed.weight = torch.nn.Parameter(self.W_UV_O.T)
243243
else:
244244
self.W_UV = W_UV
245245
self.W_UK = W_UK

0 commit comments

Comments
 (0)