We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ed6ea06 commit 6aa754e Copy full SHA for 6aa754e
vllm/attention/backends/mla/common.py
@@ -1308,7 +1308,7 @@ def _compute_prefill_context(
1308
)
1309
1310
kv_c_normed = workspace[:toks]\
1311
- [..., :self.kv_lora_rank].unsqueeze(1)
+ [..., :self.kv_lora_rank]
1312
k_pe = workspace[:toks]\
1313
[..., self.kv_lora_rank:].unsqueeze(1)
1314
vllm/v1/attention/backends/mla/common.py
@@ -874,7 +874,7 @@ def _compute_prefill_context(
874
875
876
877
878
879
880
0 commit comments