"vscode:/vscode.git/clone" did not exist on "e7aa64838cc604abf7a49e69ca0ffe7af683d8ca"
Unverified Commit e708bb75, authored by Oliver Åstrand, committed by GitHub
Browse files

Correct TF formatting to exclude LayerNorms from weight decay (#4448)

* Exclude LayerNorms from weight decay

* Include both formats of layer norm
parent 49c06132
......@@ -75,7 +75,7 @@ def create_optimizer(init_lr, num_train_steps, num_warmup_steps, end_lr=0.0, opt
beta_1=0.9,
beta_2=0.999,
epsilon=1e-6,
-exclude_from_weight_decay=["layer_norm", "bias"],
+exclude_from_weight_decay=["LayerNorm", "layer_norm", "bias"],
)
return optimizer
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment