adamw-apex-zero.yaml 196 Bytes
Newer Older
Tri Dao's avatar
Tri Dao committed
1
2
3
4
5
6
7
# @package train.optimizer
# Optimizer config: torch's ZeroRedundancyOptimizer configured with apex's
# FusedAdam as its `optimizer_class`.
# NOTE(review): `_target_`, `_recursive_` and `_partial_` look like Hydra
# `instantiate` keys -- confirm against the loader that consumes this file.
# Keep the `@package` directive above as the first line of the file.
_target_: torch.distributed.optim.ZeroRedundancyOptimizer
# Presumably makes the nested `optimizer_class` node get instantiated along
# with this one -- TODO confirm.
_recursive_: true
optimizer_class:
  _target_: apex.optimizers.FusedAdam
  # Presumably yields a partially-applied FusedAdam constructor rather than
  # an optimizer instance (no parameters are listed here) -- TODO confirm.
  _partial_: true
  # Passed through to FusedAdam; presumably selects decoupled (AdamW-style)
  # weight decay -- verify against the installed apex version.
  adam_w_mode: true