modify moeinfer param

This commit is contained in:
Azure 2025-02-06 14:07:38 +00:00
parent ee24a27001
commit 027b11266c
2 changed files with 3 additions and 1 deletion

View file

@@ -81,8 +81,10 @@ def local_chat():
content = "hi"
else:
content = open(config.prompt_file, "r").read()
print("User: ", content)
elif os.path.isfile(content):
content = open(content, "r").read()
print("User: ", content)
messages = his_content + [{"role": "user", "content": content}]
async def async_inference(messages):

View file

@@ -163,7 +163,7 @@ class KExpertsCPU(KExpertsBase):
self.config.hidden_size,
self.config.moe_intermediate_size,
64,
10,
1024,
1024,
gate_ptr,
up_ptr,