Unverified commit f59c7bf5, authored by PanZezhong1725, committed by GitHub
Browse files

Merge pull request #19 from mxCynic/main

fix: assign scale_* as class members instead of local variables
parents 2f35b2b9 1549eced
......@@ -91,15 +91,19 @@ class JiugeMetaFromLlama(JiugeMetaCStruct):
else:
dt_ = DataType.INFINI_DTYPE_F16
scale_input = 1.0
scale_output = 1.0
scale_o = 1.0
scale_down = 1.0
self.scale_input = 1.0
self.scale_output = 1.0
self.scale_o = 1.0
self.scale_down = 1.0
if "fm9g" == config["model_type"]:
scale_input = config["scale_emb"]
scale_output = config["hidden_size"] // config["dim_model_base"]
scale_o = config["scale_depth"] / math.sqrt(config["num_hidden_layers"])
scale_down = config["scale_depth"] / math.sqrt(config["num_hidden_layers"])
self.scale_input = config["scale_emb"]
self.scale_output = config["hidden_size"] // config["dim_model_base"]
self.scale_o = config["scale_depth"] / math.sqrt(
config["num_hidden_layers"]
)
self.scale_down = config["scale_depth"] / math.sqrt(
config["num_hidden_layers"]
)
super().__init__(
dt_logits=dt_,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment