Commit 05b33018 authored by Naveen Suda's avatar Naveen Suda Committed by Facebook GitHub Bot

use custom prepare function

Summary:
Pull Request resolved: https://github.com/facebookresearch/d2go/pull/660

To enable w8a16 (8-bit weight, 16-bit activation) quantization of sigmoid in d2go, we need to use a custom prepare function.
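For context, a minimal sketch (hypothetical, not part of this diff) of how an internal build might replace the default `get_prepare_fn` so that eager-mode QAT runs a custom prepare step. The helper `_custom_w8a16_prepare_qat` and the placeholder qconfig are illustrative assumptions; the actual w8a16 qconfig for sigmoid is build-specific and not shown here.

```python
import torch
from torch.ao.quantization import get_default_qat_qconfig
from torch.ao.quantization.quantize import prepare, prepare_qat


def _custom_w8a16_prepare_qat(model, inplace=True):
    # Illustrative only: tag sigmoid modules with a qconfig before the
    # standard eager-mode prepare_qat runs. A real w8a16 setup would attach
    # a 16-bit activation fake-quant here instead of this default placeholder.
    for m in model.modules():
        if isinstance(m, torch.nn.Sigmoid):
            m.qconfig = get_default_qat_qconfig("qnnpack")
    return prepare_qat(model, inplace=inplace)


def get_prepare_fn(cfg, is_qat):
    # Same signature as the OSS default added in this diff; fb_overwritable()
    # is what lets an internal build substitute an implementation like this
    # for the OSS one.
    if cfg.QUANTIZATION.EAGER_MODE:
        return _custom_w8a16_prepare_qat if is_qat else prepare
```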

Reviewed By: ayushidalmia, jiaxuzhu92

Differential Revision: D56275899

fbshipit-source-id: 654900011a1393e81289e8c9412b5886831765e2
parent ba7c235b
@@ -6,6 +6,7 @@ from typing import Tuple
 import torch
 from mobile_cv.common.misc.oss_utils import fb_overwritable
+from torch.ao.quantization.quantize import prepare, prepare_qat

 TORCH_VERSION: Tuple[int, ...] = tuple(int(x) for x in torch.__version__.split(".")[:2])
@@ -28,3 +29,9 @@ def get_convert_fn(cfg, example_inputs=None, qconfig_mapping=None, backend_config
         return convert
     else:
         return convert_fx
+
+
+@fb_overwritable()
+def get_prepare_fn(cfg, is_qat):
+    if cfg.QUANTIZATION.EAGER_MODE:
+        return prepare_qat if is_qat else prepare
@@ -10,7 +10,7 @@ from typing import Any, Dict, Optional, Tuple
 import detectron2.utils.comm as comm
 import torch
 from d2go.quantization import learnable_qat
-from d2go.quantization.fx import get_convert_fn, get_prepare_fx_fn
+from d2go.quantization.fx import get_convert_fn, get_prepare_fn, get_prepare_fx_fn
 from d2go.quantization.qconfig import (
     set_backend_and_create_qconfig,
     smart_decode_backend,
@@ -34,6 +34,7 @@ from torch.ao.quantization.quantizer.xnnpack_quantizer import (
 )
 TORCH_VERSION: Tuple[int, ...] = tuple(int(x) for x in torch.__version__.split(".")[:2])

+# Some tests still import prepare/convert from below, so don't remove these.
 if TORCH_VERSION > (1, 10):
     from torch.ao.quantization.quantize import convert
     from torch.ao.quantization.quantize_fx import convert_fx, prepare_fx, prepare_qat_fx
@@ -388,10 +389,8 @@ def prepare_fake_quant_model(cfg, model, is_qat, example_input=None):
         )
         model = default_prepare_for_quant(cfg, model)
         # NOTE: eager model needs to call prepare after `prepare_for_quant`
-        if is_qat:
-            torch.ao.quantization.prepare_qat(model, inplace=True)
-        else:
-            torch.ao.quantization.prepare(model, inplace=True)
+        prepare_fn = get_prepare_fn(cfg, is_qat)
+        prepare_fn(model, inplace=True)
     else:
         # FX graph mode requires the model to be symbolically traceable, swap common
......
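A quick behavioral check on the call-site change above: with the default OSS `get_prepare_fn`, the new code resolves to exactly the same functions the removed branch called. The `_Cfg` stand-in below is a hypothetical minimal config, assuming `QUANTIZATION.EAGER_MODE` is the only field consulted.

```python
from torch.ao.quantization.quantize import prepare, prepare_qat

from d2go.quantization.fx import get_prepare_fn


class _Cfg:
    class QUANTIZATION:
        EAGER_MODE = True


# The default implementation preserves the old eager-mode behavior:
assert get_prepare_fn(_Cfg, is_qat=True) is prepare_qat
assert get_prepare_fn(_Cfg, is_qat=False) is prepare
```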