"...git@developer.sourcefind.cn:chenpangpang/open-webui.git" did not exist on "22c210e8f67e996e2816835786393d298e69db6e"
Unverified commit eaace0c6, authored by raghavanone, committed by GitHub
Browse files

Optimize by not computing gradients for parameters set to requires_grad=False (#21236)

* Optimize by not computing gradients for parameters set to requires_grad=False

* Make change to retrigger the build

* Fix isort issue

* Fix issue
parent 6e4d3f08
......@@ -1020,11 +1020,15 @@ class Trainer:
 decay_parameters = [name for name in decay_parameters if "bias" not in name]
 optimizer_grouped_parameters = [
 {
-"params": [p for n, p in opt_model.named_parameters() if n in decay_parameters],
+"params": [
+p for n, p in opt_model.named_parameters() if (n in decay_parameters and p.requires_grad)
+],
 "weight_decay": self.args.weight_decay,
 },
 {
-"params": [p for n, p in opt_model.named_parameters() if n not in decay_parameters],
+"params": [
+p for n, p in opt_model.named_parameters() if (n not in decay_parameters and p.requires_grad)
+],
 "weight_decay": 0.0,
 },
 ]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment