Commit cb985322 authored by Francisc Bungiu's avatar Francisc Bungiu Committed by Facebook GitHub Bot
Browse files

Implement Boltnn conversion

Summary:
Implementing `prepare_for_export` using the boltnn conversion from https://fburl.com/diffusion/ql1i3358.
Implementing `prepare_for_quant` using the quantization from https://fburl.com/diffusion/8nre9o03.

Differential Revision: D29817424

fbshipit-source-id: 800571ecf7f07d01c0a3a12100525354b48fe568
parent cbb6843e
......@@ -114,7 +114,8 @@ def convert_and_export_predictor(
)
pytorch_model = post_training_quantize(cfg, pytorch_model, data_loader)
# only check bn exists in ptq as qat still has bn inside fused ops
assert not fuse_utils.check_bn_exist(pytorch_model)
if fuse_utils.check_bn_exist(pytorch_model):
logger.warn(f"Post training quantized model has bn inside fused ops")
logger.info(f"Converting quantized model {cfg.QUANTIZATION.BACKEND}...")
if cfg.QUANTIZATION.EAGER_MODE:
......
......@@ -288,6 +288,9 @@ def post_training_quantize(cfg, model, data_loader):
calibration_iters = cfg.QUANTIZATION.PTQ.CALIBRATION_NUM_IMAGES
for idx, inputs in enumerate(data_loader):
# Setting CALIBRATION_NUM_IMAGES to 0 allows skipping calibration
if idx == calibration_iters:
break
logger.info("Running calibration iter: {}/{}".format(idx, calibration_iters))
if calibration_force_on_gpu:
......@@ -299,8 +302,6 @@ def post_training_quantize(cfg, model, data_loader):
with torch.no_grad():
model(inputs)
if idx + 1 == calibration_iters:
break
else:
logger.warning("Can't run enough calibration iterations")
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment