diff --git a/ktransformers/local_chat.py b/ktransformers/local_chat.py index 513f480..827d88f 100644 --- a/ktransformers/local_chat.py +++ b/ktransformers/local_chat.py @@ -81,8 +81,10 @@ def local_chat(): content = "hi" else: content = open(config.prompt_file, "r").read() + print("User: ", content) elif os.path.isfile(content): content = open(content, "r").read() + print("User: ", content) messages = his_content + [{"role": "user", "content": content}] async def async_inference(messages): diff --git a/ktransformers/operators/experts.py b/ktransformers/operators/experts.py index f3fd515..dcca038 100644 --- a/ktransformers/operators/experts.py +++ b/ktransformers/operators/experts.py @@ -163,7 +163,7 @@ class KExpertsCPU(KExpertsBase): self.config.hidden_size, self.config.moe_intermediate_size, 64, - 10, + 1024, 1024, gate_ptr, up_ptr,