From 027b11266c9bb59ca4853fa854aeacbb2370e7c0 Mon Sep 17 00:00:00 2001 From: Azure Date: Thu, 6 Feb 2025 14:07:38 +0000 Subject: [PATCH] modify moeinfer param --- ktransformers/local_chat.py | 2 ++ ktransformers/operators/experts.py | 2 +- 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/ktransformers/local_chat.py b/ktransformers/local_chat.py index 513f480..827d88f 100644 --- a/ktransformers/local_chat.py +++ b/ktransformers/local_chat.py @@ -81,8 +81,10 @@ def local_chat(): content = "hi" else: content = open(config.prompt_file, "r").read() + print("User: ", content) elif os.path.isfile(content): content = open(content, "r").read() + print("User: ", content) messages = his_content + [{"role": "user", "content": content}] async def async_inference(messages): diff --git a/ktransformers/operators/experts.py b/ktransformers/operators/experts.py index f3fd515..dcca038 100644 --- a/ktransformers/operators/experts.py +++ b/ktransformers/operators/experts.py @@ -163,7 +163,7 @@ class KExpertsCPU(KExpertsBase): self.config.hidden_size, self.config.moe_intermediate_size, 64, - 10, + 1024, 1024, gate_ptr, up_ptr,