mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-09 13:55:27 +00:00
fix rope; update moegate
This commit is contained in:
parent
f873558a89
commit
f748cd29f0
5 changed files with 54 additions and 21 deletions
|
@ -643,7 +643,7 @@ class KDeepseekV2Model(BaseInjectedModule):
|
|||
org_device = input_ids.device
|
||||
# TODO move to embed_tokens's device, not hard code to cpu
|
||||
input_ids = input_ids.to("cpu")
|
||||
inputs_embeds = self.embed_tokens(input_ids)
|
||||
inputs_embeds = self.embed_tokens(input_ids).to(org_device)
|
||||
input_ids = input_ids.to(org_device)
|
||||
|
||||
if per_layer_prefill_flag:
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue