Merge pull request #1090 from kvcache-ai/Atream-patch-1

Update attention.py
This commit is contained in:
Atream 2025-04-09 10:54:37 +08:00 committed by GitHub
commit 9037bf30d5
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -435,6 +435,7 @@ class KDeepseekV2Attention(BaseInjectedModule, DeepseekV2Attention):
kv_len_arr = torch.tensor([position_ids[0, -1].item()+1], dtype=torch.int32, device=self.device)
self.mla_wrapper.plan(qo_indptr,None,None,
kv_len_arr,
None,
self.num_heads,
self.kv_lora_rank,
self.qk_rope_head_dim,