Unverified Commit f46864d6 authored by egortolmachev, committed by GitHub
Browse files

[Bugfix] Added Command-R GPTQ support (#3849)


Co-authored-by: Egor Tolmachev <t333ga@gmail.com>
parent b4543c8f
......@@ -349,11 +349,21 @@ class CohereForCausalLM(nn.Module):
if shard_name not in name:
continue
name = name.replace(shard_name, param_name)
# Skip loading extra bias for GPTQ models.
if name.endswith(".bias") and name not in params_dict:
continue
param = params_dict[name]
weight_loader = param.weight_loader
weight_loader(param, loaded_weight, shard_id)
break
else:
# lm_head is not used in vllm as it is tied with embed_token.
# To prevent errors, skip loading lm_head.weight.
if "lm_head.weight" in name:
continue
# Skip loading extra bias for GPTQ models.
if name.endswith(".bias") and name not in params_dict:
continue
param = params_dict[name]
weight_loader = getattr(param, "weight_loader",
default_weight_loader)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment