Commit 0189f17c authored by zhouxiang
Browse files

add qwen72

parent ee33e2e7
...@@ -448,6 +448,7 @@ If a question does not make any sense, or is not factually coherent, explain why ...@@ -448,6 +448,7 @@ If a question does not make any sense, or is not factually coherent, explain why
return ret return ret
@MODELS.register_module(name='qwen-72b')
@MODELS.register_module(name='qwen-14b') @MODELS.register_module(name='qwen-14b')
@MODELS.register_module(name='qwen-7b') @MODELS.register_module(name='qwen-7b')
class Qwen7BChat(BaseModel): class Qwen7BChat(BaseModel):
......
...@@ -864,9 +864,11 @@ def deploy_qwen(model_name: str, model_path: str, tokenizer_path: str, ...@@ -864,9 +864,11 @@ def deploy_qwen(model_name: str, model_path: str, tokenizer_path: str,
def get_tensor(name, trans=True): def get_tensor(name, trans=True):
"""return a transposed tensor according its name.""" """return a transposed tensor according its name."""
if trans: if trans:
return _params[name].cuda().t() # return _params[name].cuda().t()
return _params[name].t()
else: else:
return _params[name].cuda() # return _params[name].cuda()
return _params[name]
for i in range(num_layer): for i in range(num_layer):
print(i) print(i)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment