[Refactor][API2.0] Api refactor2.0 (open-mmlab#529)
* [Refactor][API2.0] Add onnx export and jit trace (open-mmlab#419)

* first commit

* add async call

* add new api onnx export and jit trace

* add decorator

* fix ci

* fix torchscript ci

* fix loader

* better pipemanager

* remove comment, better import

* add kwargs

* remove comment

* better pipeline manager

* remove print

* [Refactor][API2.0] Api partition calibration (open-mmlab#433)

* first commit

* add async call

* add new api onnx export and jit trace

* add decorator

* fix ci

* fix torchscript ci

* fix loader

* better pipemanager

* remove comment, better import

* add partition

* move calibration

* Better create_calib_table

* better deploy

* add kwargs

* remove comment

* better pipeline manager

* rename api, remove redundant variable, and misc

* [Refactor][API2.0] Api ncnn openvino (open-mmlab#435)

* first commit

* add async call

* add new api onnx export and jit trace

* add decorator

* fix ci

* fix torchscript ci

* fix loader

* better pipemanager

* remove comment, better import

* add ncnn api

* finish ncnn api

* add openvino support

* add kwargs

* remove comment

* better pipeline manager

* merge fix

* merge util and onnx2ncnn

* fix docstring

* [Refactor][API2.0] API for TensorRT (open-mmlab#519)

* first commit

* add async call

* add new api onnx export and jit trace

* add decorator

* fix ci

* fix torchscript ci

* fix loader

* better pipemanager

* remove comment, better import

* add partition

* move calibration

* Better create_calib_table

* better deploy

* add kwargs

* remove comment

* Add tensorrt API

* better pipeline manager

* add tensorrt new api

* remove print

* rename api, remove redundant variable, and misc

* add docstring

* [Refactor][API2.0] Api ppl other (open-mmlab#528)

* first commit

* add async call

* add new api onnx export and jit trace

* add decorator

* fix ci

* fix torchscript ci

* fix loader

* better pipemanager

* remove comment, better import

* add kwargs

* Add new APIs for pplnn SDK and misc

* remove comment

* better pipeline manager

* merge fix

* update tools/onnx2pplnn.py

* rename function

grimoire committed May 31, 2022
1 parent aabab46 · commit b32fc41

Showing 55 changed files with 1,595 additions and 728 deletions.
3 changes: 3 additions & 0 deletions .gitignore
```diff
@@ -143,3 +143,6 @@ bin/
 #
 !docs/zh_cn/build
 !docs/en/build
+
+# ncnn
+mmdeploy/backend/ncnn/onnx2ncnn
```
4 changes: 2 additions & 2 deletions docs/en/tutorials/how_to_support_new_backends.md
````diff
@@ -38,11 +38,11 @@ The backends in MMDeploy must support the ONNX. The backend loads the ".onnx" file
 
 
 if is_available():
-    from .utils import create_trt_engine, load_trt_engine, save_trt_engine
+    from .utils import from_onnx, load, save
     from .wrapper import TRTWrapper
 
     __all__ = [
-        'create_trt_engine', 'save_trt_engine', 'load_trt_engine', 'TRTWrapper'
+        'from_onnx', 'save', 'load', 'TRTWrapper'
     ]
 ```
````
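To make the rename concrete, here is a hedged usage sketch of the new TensorRT backend API. Only the names `from_onnx`, `load`, `save`, and `TRTWrapper` come from this diff; every argument below (the output prefix, the `input_shapes` layout, the `.engine` suffix, `output_names`) is an assumption to be checked against `mmdeploy/backend/tensorrt/utils.py`.

```python
import torch

# Hedged sketch: only the four imported names are confirmed by this diff;
# the arguments are assumptions, not verified signatures.
from mmdeploy.backend.tensorrt import TRTWrapper, from_onnx, load, save

# Build an engine from an ONNX file. `input_shapes` is assumed to map each
# input name to min/opt/max shapes for a dynamic-shape profile.
engine = from_onnx(
    'end2end.onnx',
    'end2end',  # assumed output file prefix
    input_shapes=dict(
        input=dict(
            min_shape=[1, 3, 320, 320],
            opt_shape=[1, 3, 800, 1344],
            max_shape=[1, 3, 1344, 1344])))

save(engine, 'end2end.engine')   # persist the serialized engine
engine = load('end2end.engine')  # deserialize it again

# TRTWrapper is assumed to execute the engine on torch tensors.
wrapper = TRTWrapper('end2end.engine', output_names=['dets', 'labels'])
outputs = wrapper(dict(input=torch.rand(1, 3, 800, 1344).cuda()))
```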
4 changes: 2 additions & 2 deletions docs/zh_cn/04-developer-guide/support_new_backend.md
````diff
@@ -38,11 +38,11 @@ Backends in MMDeploy must support ONNX, so a backend can directly load the ".onnx" file
 
 
 if is_available():
-    from .utils import create_trt_engine, load_trt_engine, save_trt_engine
+    from .utils import from_onnx, load, save
     from .wrapper import TRTWrapper
 
     __all__ = [
-        'create_trt_engine', 'save_trt_engine', 'load_trt_engine', 'TRTWrapper'
+        'from_onnx', 'save', 'load', 'TRTWrapper'
     ]
 ```
````
29 changes: 17 additions & 12 deletions mmdeploy/apis/__init__.py
```diff
@@ -1,14 +1,19 @@
 # Copyright (c) OpenMMLab. All rights reserved.
-from .calibration import create_calib_table
-from .extract_model import extract_model
-from .inference import inference_model
-from .pytorch2onnx import torch2onnx, torch2onnx_impl
-from .pytorch2torchscript import torch2torchscript, torch2torchscript_impl
-from .utils import build_task_processor, get_predefined_partition_cfg
-from .visualize import visualize_model
+# mmcv dependency
+try:
+    from .calibration import create_calib_input_data
+    from .extract_model import extract_model
+    from .inference import inference_model
+    from .pytorch2onnx import torch2onnx
+    from .pytorch2torchscript import torch2torchscript
+    from .utils import build_task_processor, get_predefined_partition_cfg
+    from .visualize import visualize_model
 
-__all__ = [
-    'create_calib_table', 'extract_model', 'inference_model', 'torch2onnx',
-    'torch2onnx_impl', 'torch2torchscript', 'torch2torchscript_impl',
-    'build_task_processor', 'get_predefined_partition_cfg', 'visualize_model'
-]
+    __all__ = [
+        'create_calib_input_data', 'extract_model', 'inference_model',
+        'torch2onnx', 'torch2torchscript', 'build_task_processor',
+        'get_predefined_partition_cfg', 'visualize_model'
+    ]
+except Exception:
+    pass
```
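The `try/except` guard lets `import mmdeploy` succeed without mmcv installed; the pipeline APIs simply disappear in that case. As a hedged sketch of the flattened entry point (the `_impl`-suffixed twins are gone), a `torch2onnx` call might look like this; the argument names and the deploy config path are assumptions, and the model/checkpoint paths are reused from the docstring example removed from `calibration.py` in this same commit:

```python
# Hedged sketch of the refactored export API; argument names are
# assumptions, not taken from pytorch2onnx.py itself.
from mmdeploy.apis import torch2onnx

torch2onnx(
    'demo.jpg',                # an example image used to trace the model
    work_dir='work_dir',       # directory that receives the .onnx file
    save_file='end2end.onnx',
    deploy_cfg='configs/mmdet/detection/detection_onnxruntime_dynamic.py',
    model_cfg='mmdetection/configs/fcos/'
    'fcos_r50_caffe_fpn_gn-head_1x_coco.py',
    model_checkpoint='checkpoints/'
    'fcos_r50_caffe_fpn_gn-head_1x_coco-821213aa.pth',
    device='cpu')
```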
137 changes: 54 additions & 83 deletions mmdeploy/apis/calibration.py
```diff
@@ -1,107 +1,78 @@
 # Copyright (c) OpenMMLab. All rights reserved.
 from typing import Optional, Union
 
-import h5py
 import mmcv
 import torch
-from mmcv.parallel import MMDataParallel
 
-from mmdeploy.core import (RewriterContext, patch_model,
-                           reset_mark_function_count)
+from mmdeploy.core import patch_model
 from mmdeploy.utils import cfg_apply_marks, load_config
+from .core import PIPELINE_MANAGER, no_mp
+from .utils import create_calib_input_data as create_calib_input_data_impl
 
 
-def create_calib_table(calib_file: str,
-                       deploy_cfg: Union[str, mmcv.Config],
-                       model_cfg: Union[str, mmcv.Config],
-                       model_checkpoint: Optional[str] = None,
-                       dataset_cfg: Optional[Union[str, mmcv.Config]] = None,
-                       dataset_type: str = 'val',
-                       device: str = 'cuda:0',
-                       **kwargs) -> None:
-    """Create calibration table.
-    Examples:
-        >>> from mmdeploy.apis import create_calib_table
-        >>> from mmdeploy.utils import get_calib_filename, load_config
-        >>> deploy_cfg = 'configs/mmdet/detection/' \
-            'detection_tensorrt-int8_dynamic-320x320-1344x1344.py'
-        >>> deploy_cfg = load_config(deploy_cfg)[0]
-        >>> calib_file = get_calib_filename(deploy_cfg)
-        >>> model_cfg = 'mmdetection/configs/fcos/' \
-            'fcos_r50_caffe_fpn_gn-head_1x_coco.py'
-        >>> model_checkpoint = 'checkpoints/' \
-            'fcos_r50_caffe_fpn_gn-head_1x_coco-821213aa.pth'
-        >>> create_calib_table(calib_file, deploy_cfg, \
-            model_cfg, model_checkpoint, device='cuda:0')
+@PIPELINE_MANAGER.register_pipeline()
+def create_calib_input_data(calib_file: str,
+                            deploy_cfg: Union[str, mmcv.Config],
+                            model_cfg: Union[str, mmcv.Config],
+                            model_checkpoint: Optional[str] = None,
+                            dataset_cfg: Optional[Union[str,
+                                                        mmcv.Config]] = None,
+                            dataset_type: str = 'val',
+                            device: str = 'cpu') -> None:
+    """Create dataset for post-training quantization.
     Args:
-        calib_file (str): Input calibration file.
-        deploy_cfg (str | mmcv.Config): Deployment config.
-        model_cfg (str | mmcv.Config): The model config.
-        model_checkpoint (str): PyTorch model checkpoint, defaults to `None`.
-        dataset_cfg (str | mmcv.Config): Dataset config, defaults to `None`
-        dataset_type (str): A string specifying dataset type, e.g.: 'test',
-            'val', defaults to 'val'.
-        device (str): Specifying the device to run on, defaults to 'cuda:0'.
+        calib_file (str): The output calibration data file.
+        deploy_cfg (str | mmcv.Config): Deployment config file or
+            Config object.
+        model_cfg (str | mmcv.Config): Model config file or Config object.
+        model_checkpoint (str): A checkpoint path of PyTorch model,
+            defaults to `None`.
+        dataset_cfg (Optional[Union[str, mmcv.Config]], optional): Model
+            config to provide calibration dataset. If none, use `model_cfg`
+            as the dataset config. Defaults to None.
+        dataset_type (str, optional): The dataset type. Defaults to 'val'.
+        device (str, optional): Device to create dataset. Defaults to 'cpu'.
     """
-    if dataset_cfg is None:
-        dataset_cfg = model_cfg
+    with no_mp():
+        if dataset_cfg is None:
+            dataset_cfg = model_cfg
 
-    device_id = torch.device(device).index
-    if device_id is None:
-        device_id = 0
-
-    # load cfg if necessary
-    deploy_cfg, model_cfg = load_config(deploy_cfg, model_cfg)
+        # load cfg if necessary
+        deploy_cfg, model_cfg = load_config(deploy_cfg, model_cfg)
+        device_id = torch.device(device).index
+        if device_id is None:
+            device_id = 0
+        if dataset_cfg is None:
+            dataset_cfg = model_cfg
 
-    if dataset_cfg is None:
-        dataset_cfg = model_cfg
-    # load dataset_cfg if necessary
-    dataset_cfg = load_config(dataset_cfg)[0]
+        # load dataset_cfg if necessary
+        dataset_cfg = load_config(dataset_cfg)[0]
 
-    from mmdeploy.apis.utils import build_task_processor
-    task_processor = build_task_processor(model_cfg, deploy_cfg, device)
+        from mmdeploy.apis.utils import build_task_processor
+        task_processor = build_task_processor(model_cfg, deploy_cfg, device)
 
-    apply_marks = cfg_apply_marks(deploy_cfg)
-    backend = 'default'
-    model = task_processor.init_pytorch_model(model_checkpoint)
-    dataset = task_processor.build_dataset(dataset_cfg, dataset_type)
+        apply_marks = cfg_apply_marks(deploy_cfg)
 
-    # patch model
-    patched_model = patch_model(model, cfg=deploy_cfg, backend=backend)
+        model = task_processor.init_pytorch_model(model_checkpoint)
+        dataset = task_processor.build_dataset(dataset_cfg, dataset_type)
 
-    with h5py.File(calib_file, mode='w') as file:
-        calib_data_group = file.create_group('calib_data')
+        # patch model
+        patched_model = patch_model(model, cfg=deploy_cfg)
 
-        if not apply_marks:
-            # create end2end group
-            input_data_group = calib_data_group.create_group('end2end')
-            input_group = input_data_group.create_group('input')
         dataloader = task_processor.build_dataloader(
             dataset, 1, 1, dist=False, shuffle=False)
-        patched_model = MMDataParallel(patched_model, device_ids=[device_id])
-        prog_bar = mmcv.ProgressBar(len(dataset))
-        for data_id, input_data in enumerate(dataloader):
-
-            if not apply_marks:
-                # save end2end data
-                input_tensor = task_processor.get_tensor_from_input(input_data)
-                input_ndarray = input_tensor.detach().cpu().numpy()
-                input_group.create_dataset(
-                    str(data_id),
-                    shape=input_ndarray.shape,
-                    compression='gzip',
-                    compression_opts=4,
-                    data=input_ndarray)
-
-            with torch.no_grad(), RewriterContext(
-                    cfg=deploy_cfg,
-                    backend=backend,
-                    create_calib=True,
-                    calib_file=file,
-                    data_id=data_id):
-                reset_mark_function_count()
-                _ = task_processor.run_inference(patched_model, input_data)
-            file.flush()
-
-            prog_bar.update()
+        create_calib_input_data_impl(
+            calib_file,
+            patched_model,
+            dataloader,
+            get_tensor_func=task_processor.get_tensor_from_input,
+            inference_func=task_processor.run_inference,
+            model_partition=apply_marks,
+            context_info=dict(cfg=deploy_cfg),
+            device=device)
```
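The old docstring's `Examples` block did not survive the rewrite, so a usage sketch of the renamed entry point may help. It is reassembled from the example deleted above; the config and checkpoint paths are the ones the old docstring used, and only the function name is new:

```python
from mmdeploy.apis import create_calib_input_data
from mmdeploy.utils import get_calib_filename, load_config

# Paths reused from the Examples block removed in this diff;
# get_calib_filename still resolves the output name from the deploy config.
deploy_cfg = ('configs/mmdet/detection/'
              'detection_tensorrt-int8_dynamic-320x320-1344x1344.py')
deploy_cfg = load_config(deploy_cfg)[0]
calib_file = get_calib_filename(deploy_cfg)

create_calib_input_data(
    calib_file,
    deploy_cfg,
    model_cfg='mmdetection/configs/fcos/'
    'fcos_r50_caffe_fpn_gn-head_1x_coco.py',
    model_checkpoint='checkpoints/'
    'fcos_r50_caffe_fpn_gn-head_1x_coco-821213aa.pth',
    device='cuda:0')
```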
4 changes: 4 additions & 0 deletions mmdeploy/apis/core/__init__.py
```diff
@@ -0,0 +1,4 @@
+# Copyright (c) OpenMMLab. All rights reserved.
+from .pipeline_manager import PIPELINE_MANAGER, no_mp
+
+__all__ = ['PIPELINE_MANAGER', 'no_mp']
```
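This new module is what `calibration.py` above imports. Going by its use there, registering a function turns it into a managed pipeline step and `no_mp()` suppresses multiprocessing around a region; anything beyond that pattern is an assumption:

```python
from mmdeploy.apis.core import PIPELINE_MANAGER, no_mp


# Register a function as a managed pipeline stage, mirroring the decorator
# applied to create_calib_input_data in calibration.py above.
@PIPELINE_MANAGER.register_pipeline()
def add_one(x: int) -> int:
    """A toy stage; the manager's extra behavior (logging, dispatching the
    call to a worker process, ...) is assumed, not shown in this diff."""
    return x + 1


# no_mp() is assumed to temporarily disable multiprocessing for managed
# pipelines, as create_calib_input_data does around its whole body.
with no_mp():
    result = add_one(1)
```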