Export Detic to ONNX or Torchscript

Hi,

I was wondering if anyone has been able to export Detic to onnx or torchscript or serve the model in any other way? 
There are three other issues on this topic here, but none of them reached a conclusive answer (issues: #61, #63, #68).

I'm using detectron2's [export_model](https://github.com/facebookresearch/detectron2/blob/bbdee4cf6bc100fedad7cfad3225bb1da12fa175/tools/deploy/export_model.py) script as mentioned in previous issues. 
Here's a snippet of the main part of the code:
``` 
import argparse
import os
import torch
import sys
from pathlib import Path
from torch import Tensor, nn

import detectron2.data.transforms as T
from detectron2.checkpoint import DetectionCheckpointer
from detectron2.config import get_cfg
from detectron2.data import build_detection_test_loader, detection_utils
from detectron2.export import TracingAdapter, dump_torchscript_IR
from detectron2.modeling import GeneralizedRCNN, RetinaNet, build_model
from detectron2.modeling.postprocessing import detector_postprocess
from detectron2.projects.point_rend import add_pointrend_config
from detectron2.structures import Boxes
from detectron2.utils.env import TORCH_VERSION
from detectron2.utils.file_io import PathManager
from detectron2.utils.logger import setup_logger

# Import-time path bootstrap. The statements below run in order and have
# process-wide side effects (sys.path and the working directory are changed).

# Absolute, symlink-resolved path of this script.
FILE = Path(__file__).resolve()
ROOT = FILE.parents[0] / 'Detic' # the `Detic` directory located beside this script
# Config directory inside the Detic checkout.
CONFIGS = ROOT / 'configs'

if str(ROOT) not in sys.path:
    sys.path.append(str(ROOT))  # make ROOT importable (appended, so it has lowest priority)

# Unconditionally put the bundled CenterNet2 directory at the FRONT of sys.path.
# NOTE(review): presumably this is what lets the `centernet` / `detic` imports
# that follow resolve -- confirm against the Detic repository layout.
sys.path.insert(0, str(ROOT / 'third_party/CenterNet2/'))

# Switch the working directory to ROOT as soon as this module is loaded.
# Consequence: relative paths passed on the command line are interpreted
# relative to the Detic directory, not the directory the script was launched from.
os.chdir(ROOT)

from centernet.config import add_centernet_config
from detic.config import add_detic_config

def setup_cfg(args):
    """Assemble the frozen config used for the export run.

    Starts from ``get_cfg()``, applies the PointRend, CenterNet and Detic
    config extensions (in that order), then merges the file named by
    ``args.config_file`` followed by the overrides in ``args.opts``.

    Args:
        args: parsed command-line namespace; ``config_file`` and ``opts``
            are the only attributes read here.

    Returns:
        The merged config object, after ``freeze()`` has been called on it.
    """
    config = get_cfg()
    # cuda context is initialized before creating dataloader, so we don't fork anymore
    config.DATALOADER.NUM_WORKERS = 0

    # Apply every config extension before any values are merged in.
    for extend_config in (add_pointrend_config, add_centernet_config, add_detic_config):
        extend_config(config)

    config.merge_from_file(args.config_file)

    overrides = args.opts
    print(overrides)
    config.merge_from_list(overrides)

    config.freeze()
    return config

# experimental. API not yet final
def export_tracing(torch_model, inputs):
    """Trace ``torch_model`` on one sample image and write the result to disk.

    Depending on ``args.format`` the traced model is saved under
    ``args.output`` as ``model.ts`` (TorchScript, plus an IR dump) or as
    ``model.onnx`` (ONNX, opset 16). The input/output schemas recorded by the
    tracing adapter are logged afterwards.

    NOTE: this function reads the module-level names ``args`` and ``logger``;
    they must exist before it is called.

    Args:
        torch_model: the model to export.
        inputs: list of per-image dicts; only ``inputs[0]["image"]`` is used.

    Returns:
        None.
    """
    assert TORCH_VERSION >= (1, 8)
    image = inputs[0]["image"]
    trace_inputs = [{"image": image}]  # remove other unused keys

    def _rcnn_inference(model, batch):
        # use do_postprocess=False so it returns ROI mask
        instances = model.inference(batch, do_postprocess=False)[0]
        return [{"instances": instances}]

    # For anything that is not a GeneralizedRCNN, pass None:
    # assume that we just call the model directly
    inference = _rcnn_inference if isinstance(torch_model, GeneralizedRCNN) else None

    traceable_model = TracingAdapter(torch_model, trace_inputs, inference)
    traceable_model.eval()

    export_format = args.format
    if export_format == "torchscript":
        ts_model = torch.jit.trace(traceable_model, (image,))
        ts_path = os.path.join(args.output, "model.ts")
        with PathManager.open(ts_path, "wb") as sink:
            torch.jit.save(ts_model, sink)
        dump_torchscript_IR(ts_model, args.output)
    elif export_format == "onnx":
        onnx_path = os.path.join(args.output, "model.onnx")
        with PathManager.open(onnx_path, "wb") as sink:
            torch.onnx.export(traceable_model, (image,), sink, opset_version=16)

    logger.info(f"Inputs schema: {traceable_model.inputs_schema!s}")
    logger.info(f"Outputs schema: {traceable_model.outputs_schema!s}")

def get_sample_inputs(args):
    """Return one batch of model inputs to trace with.

    If ``args.sample_image`` is set, that image is read, resized with
    ``ResizeShortestEdge`` using the test-time sizes from the config, and
    converted to a float32 tensor with its axes reordered by
    ``transpose(2, 0, 1)``. Otherwise the first batch of the test loader for
    ``cfg.DATASETS.TEST[0]`` is returned.

    NOTE: this function reads the module-level ``cfg``; it must exist before
    the call.

    Args:
        args: parsed command-line namespace; only ``sample_image`` is read.

    Returns:
        A list of input dicts. For the sample-image path it holds a single
        dict with keys ``"image"``, ``"height"`` and ``"width"``, where the
        height and width are those of the image *before* resizing.
    """
    sample_path = args.sample_image

    if sample_path is not None:
        # get a sample data
        raw_image = detection_utils.read_image(sample_path, format=cfg.INPUT.FORMAT)

        # Do same preprocessing as DefaultPredictor
        min_edge = cfg.INPUT.MIN_SIZE_TEST
        resize = T.ResizeShortestEdge([min_edge, min_edge], cfg.INPUT.MAX_SIZE_TEST)

        height, width = raw_image.shape[:2]
        resized = resize.get_transform(raw_image).apply_image(raw_image)
        tensor = torch.as_tensor(resized.astype("float32").transpose(2, 0, 1))

        # Sample ready
        return [{"image": tensor, "height": height, "width": width}]

    # get a first batch from dataset
    loader = build_detection_test_loader(cfg, cfg.DATASETS.TEST[0])
    return next(iter(loader))


if __name__ == "__main__":
    # Script entry point: parse the command line, build the config, load the
    # model weights, fetch one sample input and export the model.
    #
    # NOTE: `args`, `logger` and `cfg` must stay module-level names with exactly
    # these spellings -- export_tracing() and get_sample_inputs() read them as
    # globals.
    parser = argparse.ArgumentParser(description="Export a model for deployment.")
    parser.add_argument(
        "--format",
        choices=["onnx", "torchscript"],
        help="output format",
        default="onnx",
    )
    parser.add_argument(
        "--export-method",
        choices=["tracing"],
        help="Method to export models",
        default="tracing",
    )
    parser.add_argument("--config-file", default="", metavar="FILE", help="path to config file")
    parser.add_argument("--sample-image", default=None, type=str, help="sample image for input")
    # The output directory is created below and every exported file is written
    # into it, so a missing value is rejected up front with a usage error
    # instead of failing later on a `None` path.
    parser.add_argument(
        "--output",
        required=True,
        help="output directory for the converted model",
    )
    parser.add_argument(
        "opts",
        help="Modify config options using the command-line",
        default=None,
        nargs=argparse.REMAINDER,
    )
    args = parser.parse_args()
    logger = setup_logger()
    logger.info("Command line arguments: " + str(args))
    PathManager.mkdirs(args.output)

    cfg = setup_cfg(args)
    print(cfg)

    # create a torch model
    torch_model = build_model(cfg)
    DetectionCheckpointer(torch_model).resume_or_load(cfg.MODEL.WEIGHTS)

    # get sample data
    sample_inputs = get_sample_inputs(args)

    # convert and save model
    # (export_tracing performs the torch version check and strips the unused
    # keys from the sample inputs itself, so neither is repeated here.)
    if args.export_method == "tracing":
        exported_model = export_tracing(torch_model, sample_inputs)
```
This is how I'm running the code (`--format` is set to either `torchscript` or `onnx`, one per run):
```
python export_model.py --config-file $detic_config_dir/Detic_LCOCOI21k_CLIP_SwinB_896b32_4x_ft4x_max-size.yaml  --output ./output  --export-method tracing --format torchscript/onnx --sample-image ./00001.jpg MODEL.WEIGHTS $detic_ckpt_dir/Detic_LCOCOI21k_CLIP_SwinB_896b32_4x_ft4x_max-size.pth MODEL.DEVICE cuda
```

I removed the following line from `custom_rcnn.py` and then exported the model to both ONNX and TorchScript formats:
```
box_features = _ScaleGradient.apply(box_features, 1.0 / self.num_cascade_stages)
```
There are a great many tracer warnings (log in the first comment), but Triton can serve both models (Status: READY). The problem is that I still cannot get any inference results from either model. Here are the errors I'm getting:

ONNX:
```
root@lambda-quad:/workspace# python client.py 
Traceback (most recent call last):
  File "client.py", line 48, in <module>
    results = client.infer(model_name="detic_onnx", inputs=[request], outputs=outputs)
  File "/usr/local/lib/python3.8/dist-packages/tritonclient/http/__init__.py", line 1490, in infer
    _raise_if_error(response)
  File "/usr/local/lib/python3.8/dist-packages/tritonclient/http/__init__.py", line 65, in _raise_if_error
    raise error
tritonclient.utils.InferenceServerException: onnx runtime error 1: Non-zero status code returned while running Split node. Name:'/roi_heads/Split_3' Status Message: Cannot split using values in 'split' attribute. Axis=0 Input shape={0,22048} NumOutputs=1 Num entries in 'split' (must equal number of outputs) was 1 Sum of sizes in 'split' (must equal size of selected axis) was 256
```
Torchscript:
```
root@lambda-quad:/workspace# python client.py 
Traceback (most recent call last):
  File "client.py", line 48, in <module>
    results = client.infer(model_name="detic_torchscript", inputs=[request], outputs=outputs)
  File "/usr/local/lib/python3.8/dist-packages/tritonclient/http/__init__.py", line 1490, in infer
    _raise_if_error(response)
  File "/usr/local/lib/python3.8/dist-packages/tritonclient/http/__init__.py", line 65, in _raise_if_error
    raise error
tritonclient.utils.InferenceServerException: PyTorch execute failure: The following operation failed in the TorchScript interpreter.
Traceback of TorchScript, serialized code (most recent call last):
  File "code/__torch__/detectron2/export/flatten.py", line 26, in forward
    image_size = torch.stack([_1, _2])
    max_size, _3 = torch.max(torch.stack([image_size]), 0)
    _4 = torch.div(torch.add(max_size, CONSTANTS.c0), CONSTANTS.c1, rounding_mode="floor")
         ~~~~~~~~~ <--- HERE
    max_size0 = torch.mul(_4, CONSTANTS.c1)
    _5 = torch.sub(torch.select(max_size0, 0, -1), torch.select(image_size, 0, 1))

Traceback of TorchScript, original code (most recent call last):
/data2/ghazal/miniconda3/lib/python3.9/site-packages/detectron2/structures/image_list.py(101): from_tensors
/data2/ghazal/miniconda3/lib/python3.9/site-packages/detectron2/modeling/meta_arch/rcnn.py(229): preprocess_image
/data2/ghazal/projects/Real2Sim/object_tracking/matt3r_tracking/Detic/detic/modeling/meta_arch/custom_rcnn.py(96): inference
/data2/ghazal/projects/Real2Sim/object_tracking/matt3r_tracking/export_model.py(60): inference
/data2/ghazal/miniconda3/lib/python3.9/site-packages/detectron2/export/flatten.py(294): forward
/data2/ghazal/miniconda3/lib/python3.9/site-packages/torch/nn/modules/module.py(1182): _slow_forward
/data2/ghazal/miniconda3/lib/python3.9/site-packages/torch/nn/modules/module.py(1194): _call_impl
/data2/ghazal/miniconda3/lib/python3.9/site-packages/torch/jit/_trace.py(976): trace_module
/data2/ghazal/miniconda3/lib/python3.9/site-packages/torch/jit/_trace.py(759): trace
/data2/ghazal/projects/Real2Sim/object_tracking/matt3r_tracking/export_model.py(70): export_tracing
/data2/ghazal/projects/Real2Sim/object_tracking/matt3r_tracking/export_model.py(172): <module>
RuntimeError: Expected all tensors to be on the same device, but found at least two devices, cuda:0 and cpu!
```
Are these because of the tracer warnings? Can anyone help me solve this please?

@anshudaur Were you able to successfully get inference from the model you exported? If yes, would it be possible to share your code and your model?

Thank you!

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Export Detic to ONNX or Torchscript #107

Metadata

Assignees

Labels

Type

Fields

Projects

Milestone

Relationships

Development

Export Detic to ONNX or Torchscript #107

Description

Metadata

Metadata

Assignees

Labels

Type

Fields

Projects

Milestone

Relationships

Development

Issue actions