Commit 24da990f authored by Miquel Jubert Hermoso, committed by Facebook GitHub Bot

Separate into API and Exporter

Summary:
Pull Request resolved: https://github.com/facebookresearch/d2go/pull/238

*This diff is part of a stack whose goal is "buckifying" the D2Go core (https://github.com/facebookresearch/d2go/commit/87374efb134e539090e0b5c476809dc35bf6aedb) and enabling autodeps and other tooling. The last diff in the stack introduces the TARGETS; the earlier diffs in the stack resolve circular dependencies and other issues that prevent the buckification.*

Following the comments in an abandoned diff, split the export code into two files, each with its corresponding dependencies: api and exporter. api.py contains the components that have few dependencies, so it can be imported basically anywhere without introducing circular dependencies.

exporter.py contains the utilities that are used for export operations, for example in the exporter binary.
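
As a rough illustration of the split (see the test updates below), callers that previously imported everything from d2go.export.api now pull the export-time utilities from d2go.export.exporter:

# Before this diff: everything lived in d2go.export.api
from d2go.export.api import convert_and_export_predictor, FuncInfo, PredictorExportConfig

# After this diff: lightweight definitions stay in api, export utilities move to exporter
from d2go.export.api import FuncInfo, PredictorExportConfig
from d2go.export.exporter import convert_and_export_predictor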

Reviewed By: mcimpoi

Differential Revision: D36166603

fbshipit-source-id: 25ded0b3925464c05be4048472a4c2ddcdb17ecf
parent 33ca49ac
#!/usr/bin/env python3
# Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved
"""
API for exporting a pytorch model to a predictor, the predictor contains model(s) in
deployable format and predefined functions as glue code. The exported predictor should
generate same output as the original pytorch model. (See predictor/api.py for details of
predictor)
This API defines customizable methods for the pytorch model:
prepare_for_export (required by the default export_predictor): returns
PredictorExportConfig which tells information about how export the predictor.
NOTE:
1: There's a difference between predictor type and model type. model type
refers to predefined deployable format such as caffe2, torchscript(_int8),
while the predictor type can be anything that "export_predictor" can
recognize.
2: The standard model exporting methods are provided by the library code, they're
meant to be modularized and can be used by customized export_predictor as well.
"""
import json
import logging
import os
import sys
from abc import ABC, abstractmethod
from typing import Callable, Dict, NamedTuple, Optional, Tuple, Union

if sys.version_info >= (3, 8):
    from typing import final
else:
    # If the `final` decorator is not available (older python versions), replace it
    # with a dummy implementation that does nothing.
    def final(func):
        return func


import torch
import torch.nn as nn
from detectron2.utils.file_io import PathManager
from mobile_cv.arch.utils import fuse_utils
from mobile_cv.common.misc.file_utils import make_temp_directory
from mobile_cv.common.misc.registry import Registry
from mobile_cv.predictor.api import FuncInfo, ModelInfo, PredictorInfo
from mobile_cv.predictor.builtin_functions import (
    IdentityPostprocess,
    IdentityPreprocess,
    NaiveRunFunc,
)

TORCH_VERSION: Tuple[int, ...] = tuple(int(x) for x in torch.__version__.split(".")[:2])
if TORCH_VERSION > (1, 10):
    from torch.ao.quantization import convert
    from torch.ao.quantization.quantize_fx import convert_fx
else:
    from torch.quantization import convert
    from torch.quantization.quantize_fx import convert_fx

logger = logging.getLogger(__name__)
class PredictorExportConfig(NamedTuple):
@@ -93,191 +56,6 @@ class PredictorExportConfig(NamedTuple):
run_func_info: FuncInfo = FuncInfo.gen_func_info(NaiveRunFunc, params={})
def convert_predictor(
cfg,
pytorch_model,
predictor_type,
data_loader,
):
if "int8" in predictor_type:
if not cfg.QUANTIZATION.QAT.ENABLED:
logger.info(
"The model is not quantized during training, running post"
" training quantization ..."
)
# delayed import to avoid circular import since d2go.modeling depends on d2go.export
from d2go.quantization.modeling import post_training_quantize
pytorch_model = post_training_quantize(cfg, pytorch_model, data_loader)
# only check bn exists in ptq as qat still has bn inside fused ops
if fuse_utils.check_bn_exist(pytorch_model):
logger.warn("Post training quantized model has bn inside fused ops")
logger.info(f"Converting quantized model {cfg.QUANTIZATION.BACKEND}...")
if hasattr(pytorch_model, "prepare_for_quant_convert"):
pytorch_model = pytorch_model.prepare_for_quant_convert(cfg)
else:
# TODO(T93870381): move this to a default function
if cfg.QUANTIZATION.EAGER_MODE:
pytorch_model = convert(pytorch_model, inplace=False)
else: # FX graph mode quantization
pytorch_model = convert_fx(pytorch_model)
logger.info("Quantized Model:\n{}".format(pytorch_model))
else:
pytorch_model = fuse_utils.fuse_model(pytorch_model)
logger.info("Fused Model:\n{}".format(pytorch_model))
if fuse_utils.count_bn_exist(pytorch_model) > 0:
logger.warning("BN existed in pytorch model after fusing.")
return pytorch_model
def convert_and_export_predictor(
cfg,
pytorch_model,
predictor_type,
output_dir,
data_loader,
):
"""
Entry point for converting and exporting a model. This involves two steps:
- convert: converting the given `pytorch_model` to another format, currently
mainly for quantizing the model.
- export: exporting the converted `pytorch_model` to a predictor. This step
should not alter the behaviour of the model.
"""
pytorch_model = convert_predictor(cfg, pytorch_model, predictor_type, data_loader)
return export_predictor(cfg, pytorch_model, predictor_type, output_dir, data_loader)
def export_predictor(cfg, pytorch_model, predictor_type, output_dir, data_loader):
"""
Interface for exporting a pytorch model to a predictor of the given type. This function
can be overridden to achieve a customized exporting procedure, e.g. using non-default
optimization passes, composing traced models, etc.
Args:
cfg (CfgNode): the config
pytorch_model (nn.Module): a pytorch model, mostly also a meta-arch
predictor_type (str): a string which specifies the type of predictor, note that
the definition of type is interpreted by "export_predictor", the default
implementation uses the deployable model format (eg. caffe2_fp32,
torchscript_int8) as predictor type.
output_dir (str): the parent directory where the predictor will be saved
data_loader: data loader for the pytorch model
Returns:
predictor_path (str): the directory of exported predictor, a sub-directory of
"output_dir"
"""
return default_export_predictor(
cfg, pytorch_model, predictor_type, output_dir, data_loader
)
def _export_single_model(
predictor_path,
model,
input_args,
save_path,
model_export_method,
model_export_kwargs,
):
assert isinstance(model, nn.Module), model
# model_export_method either inherits ModelExportMethod or is a key in the registry
model_export_method_str = None
if isinstance(model_export_method, str):
model_export_method_str = model_export_method
model_export_method = ModelExportMethodRegistry.get(model_export_method)
assert issubclass(model_export_method, ModelExportMethod), model_export_method
logger.info("Using model export method: {}".format(model_export_method))
load_kwargs = model_export_method.export(
model=model,
input_args=input_args,
save_path=save_path,
export_method=model_export_method_str,
**model_export_kwargs,
)
assert isinstance(load_kwargs, dict)
model_rel_path = os.path.relpath(save_path, predictor_path)
return ModelInfo(
path=model_rel_path,
export_method="{}.{}".format(
model_export_method.__module__, model_export_method.__qualname__
),
load_kwargs=load_kwargs,
)
def default_export_predictor(
cfg, pytorch_model, predictor_type, output_dir, data_loader
):
# The default implementation acts based on the PredictorExportConfig returned by
# calling "prepare_for_export". It exports all sub-models in a standard way
# according to the "predictor_type".
assert hasattr(pytorch_model, "prepare_for_export"), pytorch_model
inputs = next(iter(data_loader))
export_config = pytorch_model.prepare_for_export(cfg, inputs, predictor_type)
model_inputs = (
export_config.data_generator(inputs)
if export_config.data_generator is not None
else (inputs,)
)
predictor_path = os.path.join(output_dir, predictor_type)
PathManager.mkdirs(predictor_path)
predictor_init_kwargs = {
"preprocess_info": export_config.preprocess_info,
"postprocess_info": export_config.postprocess_info,
"run_func_info": export_config.run_func_info,
}
if isinstance(export_config.model, dict):
models_info = {}
for name, model in export_config.model.items():
save_path = os.path.join(predictor_path, name)
model_info = _export_single_model(
predictor_path=predictor_path,
model=model,
input_args=model_inputs[name] if model_inputs is not None else None,
save_path=save_path,
model_export_method=(
predictor_type
if export_config.model_export_method is None
else export_config.model_export_method[name]
),
model_export_kwargs=(
{}
if export_config.model_export_kwargs is None
else export_config.model_export_kwargs[name]
),
)
models_info[name] = model_info
predictor_init_kwargs["models"] = models_info
else:
save_path = predictor_path  # for a single model, exported files are put under `predictor_path` together with predictor_info.json
model_info = _export_single_model(
predictor_path=predictor_path,
model=export_config.model,
input_args=model_inputs,
save_path=save_path,
model_export_method=export_config.model_export_method or predictor_type,
model_export_kwargs=export_config.model_export_kwargs or {},
)
predictor_init_kwargs["model"] = model_info
# assemble predictor
predictor_info = PredictorInfo(**predictor_init_kwargs)
with PathManager.open(
os.path.join(predictor_path, "predictor_info.json"), "w"
) as f:
json.dump(predictor_info.to_dict(), f, indent=4)
return predictor_path
class ModelExportMethod(ABC):
"""
Base class for "model export method". Each model export method can export a pytorch
......
#!/usr/bin/env python3
# Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved
"""
API for exporting a pytorch model to a predictor, the predictor contains model(s) in
deployable format and predefined functions as glue code. The exported predictor should
generate same output as the original pytorch model. (See predictor/api.py for details of
predictor)
This API defines customizable methods for the pytorch model:
prepare_for_export (required by the default export_predictor): returns
PredictorExportConfig which tells information about how export the predictor.
NOTE:
1: There's a difference between predictor type and model type. model type
refers to predefined deployable format such as caffe2, torchscript(_int8),
while the predictor type can be anything that "export_predictor" can
recognize.
2: The standard model exporting methods are provided by the library code, they're
meant to be modularized and can be used by customized export_predictor as well.
"""
import json
import logging
import os
import sys
from typing import Callable, Dict, NamedTuple, Optional, Tuple, Union
import torch
import torch.nn as nn
from d2go.export.api import ModelExportMethod, ModelExportMethodRegistry
from d2go.quantization.modeling import post_training_quantize
from detectron2.utils.file_io import PathManager
from mobile_cv.arch.utils import fuse_utils
from mobile_cv.predictor.api import FuncInfo, ModelInfo, PredictorInfo
from mobile_cv.predictor.builtin_functions import (
IdentityPostprocess,
IdentityPreprocess,
NaiveRunFunc,
)
TORCH_VERSION: Tuple[int, ...] = tuple(int(x) for x in torch.__version__.split(".")[:2])
if TORCH_VERSION > (1, 10):
from torch.ao.quantization import convert
from torch.ao.quantization.quantize_fx import convert_fx
else:
from torch.quantization import convert
from torch.quantization.quantize_fx import convert_fx
logger = logging.getLogger(__name__)
def convert_predictor(
cfg,
pytorch_model,
predictor_type,
data_loader,
):
if "int8" in predictor_type:
if not cfg.QUANTIZATION.QAT.ENABLED:
logger.info(
"The model is not quantized during training, running post"
" training quantization ..."
)
pytorch_model = post_training_quantize(cfg, pytorch_model, data_loader)
# only check bn exists in ptq as qat still has bn inside fused ops
if fuse_utils.check_bn_exist(pytorch_model):
logger.warn("Post training quantized model has bn inside fused ops")
logger.info(f"Converting quantized model {cfg.QUANTIZATION.BACKEND}...")
if hasattr(pytorch_model, "prepare_for_quant_convert"):
pytorch_model = pytorch_model.prepare_for_quant_convert(cfg)
else:
# TODO(T93870381): move this to a default function
if cfg.QUANTIZATION.EAGER_MODE:
pytorch_model = convert(pytorch_model, inplace=False)
else: # FX graph mode quantization
pytorch_model = convert_fx(pytorch_model)
logger.info("Quantized Model:\n{}".format(pytorch_model))
else:
pytorch_model = fuse_utils.fuse_model(pytorch_model)
logger.info("Fused Model:\n{}".format(pytorch_model))
if fuse_utils.count_bn_exist(pytorch_model) > 0:
logger.warning("BN existed in pytorch model after fusing.")
return pytorch_model
def convert_and_export_predictor(
cfg,
pytorch_model,
predictor_type,
output_dir,
data_loader,
):
"""
Entry point for converting and exporting a model. This involves two steps:
- convert: converting the given `pytorch_model` to another format, currently
mainly for quantizing the model.
- export: exporting the converted `pytorch_model` to a predictor. This step
should not alter the behaviour of the model.
"""
pytorch_model = convert_predictor(cfg, pytorch_model, predictor_type, data_loader)
return export_predictor(cfg, pytorch_model, predictor_type, output_dir, data_loader)
def export_predictor(cfg, pytorch_model, predictor_type, output_dir, data_loader):
"""
Interface for exporting a pytorch model to a predictor of the given type. This function
can be overridden to achieve a customized exporting procedure, e.g. using non-default
optimization passes, composing traced models, etc.
Args:
cfg (CfgNode): the config
pytorch_model (nn.Module): a pytorch model, mostly also a meta-arch
predictor_type (str): a string which specifies the type of predictor, note that
the definition of type is interpreted by "export_predictor", the default
implementation uses the deployable model format (eg. caffe2_fp32,
torchscript_int8) as predictor type.
output_dir (str): the parent directory where the predictor will be saved
data_loader: data loader for the pytorch model
Returns:
predictor_path (str): the directory of exported predictor, a sub-directory of
"output_dir"
"""
return default_export_predictor(
cfg, pytorch_model, predictor_type, output_dir, data_loader
)
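# Illustrative usage sketch (hypothetical, not part of the original file): exporting a
# model and loading the resulting predictor back. `cfg`, `model`, `data_loader` and the
# output directory are placeholders supplied by the caller.
#
#     from mobile_cv.predictor.api import create_predictor
#
#     predictor_path = convert_and_export_predictor(
#         cfg, model, "torchscript_int8", "./output", data_loader
#     )
#     predictor = create_predictor(predictor_path)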
def _export_single_model(
predictor_path,
model,
input_args,
save_path,
model_export_method,
model_export_kwargs,
):
assert isinstance(model, nn.Module), model
# model_export_method either inherits ModelExportMethod or is a key in the registry
model_export_method_str = None
if isinstance(model_export_method, str):
model_export_method_str = model_export_method
model_export_method = ModelExportMethodRegistry.get(model_export_method)
assert issubclass(model_export_method, ModelExportMethod), model_export_method
logger.info("Using model export method: {}".format(model_export_method))
load_kwargs = model_export_method.export(
model=model,
input_args=input_args,
save_path=save_path,
export_method=model_export_method_str,
**model_export_kwargs,
)
assert isinstance(load_kwargs, dict)
model_rel_path = os.path.relpath(save_path, predictor_path)
return ModelInfo(
path=model_rel_path,
export_method="{}.{}".format(
model_export_method.__module__, model_export_method.__qualname__
),
load_kwargs=load_kwargs,
)
def default_export_predictor(
cfg, pytorch_model, predictor_type, output_dir, data_loader
):
# The default implementation acts based on the PredictorExportConfig returned by
# calling "prepare_for_export". It exports all sub-models in a standard way
# according to the "predictor_type".
assert hasattr(pytorch_model, "prepare_for_export"), pytorch_model
inputs = next(iter(data_loader))
export_config = pytorch_model.prepare_for_export(cfg, inputs, predictor_type)
model_inputs = (
export_config.data_generator(inputs)
if export_config.data_generator is not None
else (inputs,)
)
predictor_path = os.path.join(output_dir, predictor_type)
PathManager.mkdirs(predictor_path)
predictor_init_kwargs = {
"preprocess_info": export_config.preprocess_info,
"postprocess_info": export_config.postprocess_info,
"run_func_info": export_config.run_func_info,
}
if isinstance(export_config.model, dict):
models_info = {}
for name, model in export_config.model.items():
save_path = os.path.join(predictor_path, name)
model_info = _export_single_model(
predictor_path=predictor_path,
model=model,
input_args=model_inputs[name] if model_inputs is not None else None,
save_path=save_path,
model_export_method=(
predictor_type
if export_config.model_export_method is None
else export_config.model_export_method[name]
),
model_export_kwargs=(
{}
if export_config.model_export_kwargs is None
else export_config.model_export_kwargs[name]
),
)
models_info[name] = model_info
predictor_init_kwargs["models"] = models_info
else:
save_path = predictor_path  # for a single model, exported files are put under `predictor_path` together with predictor_info.json
model_info = _export_single_model(
predictor_path=predictor_path,
model=export_config.model,
input_args=model_inputs,
save_path=save_path,
model_export_method=export_config.model_export_method or predictor_type,
model_export_kwargs=export_config.model_export_kwargs or {},
)
predictor_init_kwargs["model"] = model_info
# assemble predictor
predictor_info = PredictorInfo(**predictor_init_kwargs)
with PathManager.open(
os.path.join(predictor_path, "predictor_info.json"), "w"
) as f:
json.dump(predictor_info.to_dict(), f, indent=4)
return predictor_path
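# Rough sketch of the on-disk layout produced above (assuming a single-model export with
# a hypothetical output_dir of "./output" and predictor_type "torchscript"):
#
#     ./output/torchscript/
#         predictor_info.json    <- serialized PredictorInfo (model info + pre/post-process and run funcs)
#         ...                    <- model file(s) written by the ModelExportMethod
#
# When `export_config.model` is a dict, each sub-model is saved under a path named after
# its dict key, and predictor_info.json records them under "models".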
@@ -3,10 +3,14 @@
import inspect
import json
import logging
from typing import Any, Optional, Tuple
import torch
import torch.nn as nn
from d2go.config import CfgNode
from d2go.config.utils import flatten_config_dict
from d2go.export.api import PredictorExportConfig
from d2go.quantization.qconfig import set_backend_and_create_qconfig
from detectron2.modeling import GeneralizedRCNN
@@ -515,3 +519,25 @@ def _cast_detection_model(model, device):
pixel_std = pixel_std.to(device)
model.normalizer = lambda x: (x - pixel_mean) / pixel_std
return model
def _update_export_config_with_extra_files(export_config, extra_files):
export_config_dict = export_config._asdict()
if export_config_dict["model_export_kwargs"] is None:
export_config_dict["model_export_kwargs"] = {}
export_config_dict["model_export_kwargs"]["_extra_files"] = extra_files
return PredictorExportConfig(**export_config_dict)
@RCNN_PREPARE_FOR_EXPORT_REGISTRY.register()
def prepare_for_export_with_inference_config(
self, cfg: CfgNode, inputs: Optional[Tuple[Any]], predictor_type: str
) -> PredictorExportConfig:
"""
For certain tasks, the exported model needs to encode config as part of the extra
files.
"""
export_config = default_rcnn_prepare_for_export(self, cfg, inputs, predictor_type)
# Add "inference_config.json" for the _extra_files as part of model_export_kwargs
extra_files = {"inference_config.json": json.dumps(flatten_config_dict(cfg))}
return _update_export_config_with_extra_files(export_config, extra_files)
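# Illustrative sketch (hypothetical, not part of this diff): when the exported model is a
# TorchScript archive, the embedded config can be read back at load time through
# torch.jit's `_extra_files` mechanism, e.g.:
#
#     extra_files = {"inference_config.json": ""}
#     ts_model = torch.jit.load("model.jit", _extra_files=extra_files)  # path is a placeholder
#     inference_cfg_dict = json.loads(extra_files["inference_config.json"])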
@@ -9,8 +9,8 @@ from typing import Optional
import d2go.data.transforms.box_utils as bu
import torch
from d2go.export.api import convert_and_export_predictor
from d2go.export.d2_meta_arch import patch_d2_meta_arch
from d2go.export.exporter import convert_and_export_predictor
from d2go.runner import GeneralizedRCNNRunner
from d2go.utils.testing.data_loader_helper import (
create_detection_data_loader_on_toy_dataset,
......
@@ -8,11 +8,8 @@ from typing import List
import torch
import torch.nn as nn
from d2go.export.api import (
convert_and_export_predictor,
FuncInfo,
PredictorExportConfig,
)
from d2go.export.api import FuncInfo, PredictorExportConfig
from d2go.export.exporter import convert_and_export_predictor
from d2go.export.torchscript import (
DefaultTorchscriptExport,
TracingAdaptedTorchscriptExport,
......
@@ -7,8 +7,8 @@ import os
import unittest
import torch
from d2go.export.api import convert_and_export_predictor
from d2go.export.d2_meta_arch import patch_d2_meta_arch
from d2go.export.exporter import convert_and_export_predictor
from d2go.runner import GeneralizedRCNNRunner
from d2go.utils.testing.data_loader_helper import (
create_detection_data_loader_on_toy_dataset,
......
@@ -8,8 +8,8 @@ import tempfile
import unittest
import torch
from d2go.export.api import convert_and_export_predictor
from d2go.export.d2_meta_arch import patch_d2_meta_arch
from d2go.export.exporter import convert_and_export_predictor
from d2go.runner import Detectron2GoRunner
from mobile_cv.predictor.api import create_predictor
......
@@ -13,7 +13,7 @@ import typing
import mobile_cv.lut.lib.pt.flops_utils as flops_utils
from d2go.config import temp_defrost
from d2go.export.api import convert_and_export_predictor
from d2go.export.exporter import convert_and_export_predictor
from d2go.setup import basic_argument_parser, prepare_for_launch, setup_after_launch
from mobile_cv.common.misc.py import post_mortem_if_fail
......