Commit 02ecf002, authored by Peizhao Zhang and committed by Facebook GitHub Bot
Browse files

Updated scaling rules for base_lr_end and quantization.

Summary:
Pull Request resolved: https://github.com/facebookresearch/d2go/pull/161

Updated scaling rules for base_lr_end and quantization.

Reviewed By: zhanghang1989, wat3rBro

Differential Revision: D33292860

fbshipit-source-id: c7a8747c8fb1f894d3c5508bbd607b3d1ef3d400
parent fcd51171
...@@ -92,6 +92,7 @@ def default_scale_d2_configs(cfg, new_world_size): ...@@ -92,6 +92,7 @@ def default_scale_d2_configs(cfg, new_world_size):
gpu_scale = new_world_size / cfg.SOLVER.REFERENCE_WORLD_SIZE gpu_scale = new_world_size / cfg.SOLVER.REFERENCE_WORLD_SIZE
base_lr = cfg.SOLVER.BASE_LR base_lr = cfg.SOLVER.BASE_LR
base_lr_end = cfg.SOLVER.BASE_LR_END
max_iter = cfg.SOLVER.MAX_ITER max_iter = cfg.SOLVER.MAX_ITER
steps = cfg.SOLVER.STEPS steps = cfg.SOLVER.STEPS
eval_period = cfg.TEST.EVAL_PERIOD eval_period = cfg.TEST.EVAL_PERIOD
...@@ -110,6 +111,7 @@ def default_scale_d2_configs(cfg, new_world_size): ...@@ -110,6 +111,7 @@ def default_scale_d2_configs(cfg, new_world_size):
# default configs in D2 # default configs in D2
cfg.SOLVER.BASE_LR = base_lr * lr_scale cfg.SOLVER.BASE_LR = base_lr * lr_scale
cfg.SOLVER.BASE_LR_END = base_lr_end * lr_scale
cfg.SOLVER.MAX_ITER = int(round(max_iter / gpu_scale)) cfg.SOLVER.MAX_ITER = int(round(max_iter / gpu_scale))
cfg.SOLVER.STEPS = tuple(int(round(s / gpu_scale)) for s in steps) cfg.SOLVER.STEPS = tuple(int(round(s / gpu_scale)) for s in steps)
cfg.TEST.EVAL_PERIOD = int(round(eval_period / gpu_scale)) cfg.TEST.EVAL_PERIOD = int(round(eval_period / gpu_scale))
...@@ -128,6 +130,9 @@ def default_scale_quantization_configs(cfg, new_world_size): ...@@ -128,6 +130,9 @@ def default_scale_quantization_configs(cfg, new_world_size):
cfg.QUANTIZATION.QAT.ENABLE_OBSERVER_ITER = int( cfg.QUANTIZATION.QAT.ENABLE_OBSERVER_ITER = int(
round(cfg.QUANTIZATION.QAT.ENABLE_OBSERVER_ITER / gpu_scale) round(cfg.QUANTIZATION.QAT.ENABLE_OBSERVER_ITER / gpu_scale)
) )
cfg.QUANTIZATION.QAT.ENABLE_LEARNABLE_OBSERVER_ITER = int(
round(cfg.QUANTIZATION.QAT.ENABLE_LEARNABLE_OBSERVER_ITER / gpu_scale)
)
cfg.QUANTIZATION.QAT.DISABLE_OBSERVER_ITER = int( cfg.QUANTIZATION.QAT.DISABLE_OBSERVER_ITER = int(
round(cfg.QUANTIZATION.QAT.DISABLE_OBSERVER_ITER / gpu_scale) round(cfg.QUANTIZATION.QAT.DISABLE_OBSERVER_ITER / gpu_scale)
) )
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment