update install doc and fix local_chat bug

2025-09-10 23:34:35 +00:00 · 2025-04-03 12:42:41 +08:00 · 2025-04-03 12:42:41 +08:00 · 1b7672937b
commit 1b7672937b
parent ab0b0f4ea1
4 changed files with 14 additions and 28 deletions
--- a/ktransformers/operators/attention.py
+++ b/ktransformers/operators/attention.py
@@ -422,6 +422,7 @@ class KDeepseekV2Attention(BaseInjectedModule, DeepseekV2Attention):
                if q_len == 1:
                    self.mla_wrapper.plan(None,None,None,
                                        position_ids.squeeze(1)+1,
+                                        None,
                                        self.num_heads,
                                        self.kv_lora_rank,
                                        self.qk_rope_head_dim,