Commit 027b1126 authored by Azure's avatar Azure
Browse files

modify moeinfer param

parent ee24a270
...@@ -81,8 +81,10 @@ def local_chat(): ...@@ -81,8 +81,10 @@ def local_chat():
content = "hi" content = "hi"
else: else:
content = open(config.prompt_file, "r").read() content = open(config.prompt_file, "r").read()
print("User: ", content)
elif os.path.isfile(content): elif os.path.isfile(content):
content = open(content, "r").read() content = open(content, "r").read()
print("User: ", content)
messages = his_content + [{"role": "user", "content": content}] messages = his_content + [{"role": "user", "content": content}]
async def async_inference(messages): async def async_inference(messages):
......
...@@ -163,7 +163,7 @@ class KExpertsCPU(KExpertsBase): ...@@ -163,7 +163,7 @@ class KExpertsCPU(KExpertsBase):
self.config.hidden_size, self.config.hidden_size,
self.config.moe_intermediate_size, self.config.moe_intermediate_size,
64, 64,
10, 1024,
1024, 1024,
gate_ptr, gate_ptr,
up_ptr, up_ptr,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment