Unverified commit e0c7f51b, authored by tpoisonooo, committed by GitHub
Browse files

fix(deploy.py): qkv no bias assertion

parent 1b7151c1
...@@ -245,7 +245,7 @@ def deploy_llama(model_name: str, model_path: str, tokenizer_path: str, ...@@ -245,7 +245,7 @@ def deploy_llama(model_name: str, model_path: str, tokenizer_path: str,
print(f'layers.{i}.attention.w_qkv.{t}', qkv.shape) print(f'layers.{i}.attention.w_qkv.{t}', qkv.shape)
model_params[f'layers.{i}.attention.w_qkv.{t}'] = qkv model_params[f'layers.{i}.attention.w_qkv.{t}'] = qkv
assert num_layer == i, f'miss matched layers: {num_layer} vs {i}' assert i == 0 or num_layer == i, f'miss matched layers: {num_layer} vs {i}'
return export(model_name, num_layer, norm_eps, model_params, return export(model_name, num_layer, norm_eps, model_params,
tokenizer_path, triton_models_path, tp) tokenizer_path, triton_models_path, tp)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment