fix rope; update moegate

2025-09-09 13:55:27 +00:00 · 2025-02-01 18:05:45 +00:00 · 2025-02-01 18:05:45 +00:00 · f748cd29f0
commit f748cd29f0
parent f873558a89
5 changed files with 54 additions and 21 deletions
--- a/ktransformers/operators/models.py
+++ b/ktransformers/operators/models.py
@@ -643,7 +643,7 @@ class KDeepseekV2Model(BaseInjectedModule):
            org_device = input_ids.device
            # TODO move to embed_tokens's device, not hard code to cpu
            input_ids = input_ids.to("cpu")
-            inputs_embeds = self.embed_tokens(input_ids)
+            inputs_embeds = self.embed_tokens(input_ids).to(org_device)
            input_ids = input_ids.to(org_device)

        if per_layer_prefill_flag: