Add openlane v2 (#121)

cce49ba9 · Chengyu Wang · GitHub · dbf29e61 · cce49ba9 · cce49ba9
Unverified Commit cce49ba9 authored Apr 21, 2023 by Chengyu Wang Committed by GitHub Apr 21, 2023
20 changed files
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/core/bbox/__init__.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/core/bbox/__init__.py
+from .assigners import *
+from .match_costs import *
\ No newline at end of file
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/core/bbox/assigners.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/core/bbox/assigners.py
+# ==============================================================================
+# Binaries and/or source for the following packages or projects 
+# are presented under one or more of the following open source licenses:
+# assigners.py    The OpenLane-V2 Dataset Authors    Apache License, Version 2.0
+#
+# Contact wanghuijie@pjlab.org.cn if you have any issue.
+#
+# Copyright (c) 2023 The OpenLane-v2 Dataset Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+import torch
+from scipy.optimize import linear_sum_assignment
+
+from mmdet.core.bbox.builder import BBOX_ASSIGNERS
+from mmdet.core.bbox.assigners import HungarianAssigner, AssignResult
+
+
+@BBOX_ASSIGNERS.register_module()
+class LaneHungarianAssigner(HungarianAssigner):
+    """One-to-one Hungarian matching between lane predictions and GT lanes.
+
+    The matching cost is ``self.cls_cost + self.reg_cost``; neither attribute
+    is defined in this class, so both are presumably provided by the
+    ``HungarianAssigner`` base class -- confirm against the config.
+    """
+
+    def assign(self,
+               lane_pred,
+               cls_pred,
+               gt_lanes,
+               gt_labels,
+               img_meta,
+               gt_lanes_ignore=None,
+               eps=1e-7):
+        """Assign every predicted lane to a ground-truth lane or background.
+
+        Args:
+            lane_pred: Predicted lanes; the first dimension indexes lanes.
+            cls_pred: Classification predictions passed to ``self.cls_cost``.
+            gt_lanes: Ground-truth lanes; the first dimension indexes lanes.
+            gt_labels: Ground-truth labels, indexed by matched GT index.
+            img_meta: Unused by this method.
+            gt_lanes_ignore: Must be ``None``.
+            eps: Unused by this method.
+
+        Returns:
+            AssignResult: ``gt_inds`` is 0 for background and ``k + 1`` for a
+            prediction matched to GT ``k``; ``labels`` is -1 for unmatched
+            predictions.
+        """
+        assert gt_lanes_ignore is None, \
+            'Only case when gt_lanes_ignore is None is supported.'
+        num_gts = gt_lanes.size(0)
+        num_lanes = lane_pred.size(0)
+
+        # Start from "unassigned" (-1) everywhere.
+        assigned_gt_inds = lane_pred.new_full(
+            (num_lanes, ), -1, dtype=torch.long)
+        assigned_labels = lane_pred.new_full(
+            (num_lanes, ), -1, dtype=torch.long)
+
+        if num_gts == 0:
+            # Nothing to match against: every prediction is background.
+            assigned_gt_inds.fill_(0)
+            return AssignResult(
+                num_gts, assigned_gt_inds, None, labels=assigned_labels)
+        if num_lanes == 0:
+            # No predictions: return the (empty) default assignment.
+            return AssignResult(
+                num_gts, assigned_gt_inds, None, labels=assigned_labels)
+
+        # Matching cost: classification cost plus lane regression cost.
+        cost = self.cls_cost(cls_pred, gt_labels) \
+            + self.reg_cost(lane_pred, gt_lanes)
+
+        # The Hungarian solver runs on CPU; move the indices back afterwards.
+        pred_idx, gt_idx = linear_sum_assignment(cost.detach().cpu())
+        device = lane_pred.device
+        pred_idx = torch.from_numpy(pred_idx).to(device)
+        gt_idx = torch.from_numpy(gt_idx).to(device)
+
+        # Background everywhere first, then overwrite the matched predictions
+        # with 1-based GT indices and the corresponding labels.
+        assigned_gt_inds.fill_(0)
+        assigned_gt_inds[pred_idx] = gt_idx + 1
+        assigned_labels[pred_idx] = gt_labels[gt_idx]
+        return AssignResult(
+            num_gts, assigned_gt_inds, None, labels=assigned_labels)
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/core/bbox/match_costs.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/core/bbox/match_costs.py
+# ==============================================================================
+# Binaries and/or source for the following packages or projects 
+# are presented under one or more of the following open source licenses:
+# match_costs.py    The OpenLane-V2 Dataset Authors    Apache License, Version 2.0
+#
+# Contact wanghuijie@pjlab.org.cn if you have any issue.
+#
+# Copyright (c) 2023 The OpenLane-v2 Dataset Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+import torch
+
+from mmdet.core.bbox.match_costs.builder import MATCH_COST
+
+
+@MATCH_COST.register_module()
+class LaneL1Cost:
+    r"""Weighted pairwise L1 (p=1) distance between predicted and GT lanes.
+
+    Notes
+    -----
+    Adapted from https://github.com/open-mmlab/mmdetection/blob/master/mmdet/core/bbox/match_costs/match_cost.py#L11.
+
+    Args:
+        weight (float): Factor the cost matrix is multiplied by.
+    """
+
+    def __init__(self, weight=1.):
+        self.weight = weight
+
+    def __call__(self, lane_pred, gt_lanes):
+        """Return ``torch.cdist(lane_pred, gt_lanes, p=1)`` scaled by ``weight``."""
+        return torch.cdist(lane_pred, gt_lanes, p=1) * self.weight
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/__init__.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/__init__.py
+from .pipelines import *
+from .openlane_v2_dataset import *
\ No newline at end of file
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/openlane_v2_dataset.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/openlane_v2_dataset.py
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/__init__.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/__init__.py
+from .formating import *
+from .loading import *
+from .transforms import *
\ No newline at end of file
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/formating.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/formating.py
+# ==============================================================================
+# Binaries and/or source for the following packages or projects 
+# are presented under one or more of the following open source licenses:
+# formating.py    The OpenLane-V2 Dataset Authors    Apache License, Version 2.0
+#
+# Contact wanghuijie@pjlab.org.cn if you have any issue.
+#
+# Copyright (c) 2023 The OpenLane-v2 Dataset Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+import numpy as np
+
+from mmcv.parallel import DataContainer as DC
+from mmdet.datasets import PIPELINES
+from mmdet.datasets.pipelines import to_tensor
+
+
+@PIPELINES.register_module()
+class CustomDefaultFormatBundle:
+    """Convert the images and ground-truth entries of ``results`` to tensors
+    wrapped in ``DataContainer``."""
+
+    def __init__(self):
+        pass
+
+    def __call__(self, results):
+        """Format ``results`` in place and return it.
+
+        ``results['img']`` (a sequence of equally shaped arrays) is stacked
+        along a new leading axis and permuted with ``(0, 3, 1, 2)``; each
+        optional ground-truth key is converted only when it is present.
+        """
+        stacked = to_tensor(np.stack(results['img'], axis=0))
+        results['img'] = DC(stacked.permute(0, 3, 1, 2), stack=True)
+
+        optional_keys = (
+            'gt_lc',
+            'gt_lc_labels',
+            'gt_te',
+            'gt_te_labels',
+            'gt_topology_lclc',
+            'gt_topology_lcte',
+        )
+        for key in optional_keys:
+            if key in results:
+                results[key] = DC(to_tensor(results[key]))
+
+        return results
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/loading.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/loading.py
+# ==============================================================================
+# Binaries and/or source for the following packages or projects 
+# are presented under one or more of the following open source licenses:
+# loading.py    The OpenLane-V2 Dataset Authors    Apache License, Version 2.0
+#
+# Contact wanghuijie@pjlab.org.cn if you have any issue.
+#
+# Copyright (c) 2023 The OpenLane-v2 Dataset Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+import numpy as np
+
+import mmcv
+from mmdet.datasets import PIPELINES
+from mmdet3d.datasets.pipelines import LoadMultiViewImageFromFiles
+
+
+@PIPELINES.register_module()
+class CustomLoadMultiViewImageFromFiles(LoadMultiViewImageFromFiles):
+    """Load every image listed in ``results['img_paths']``."""
+
+    def __call__(self, results):
+        """Read the images and store them with their shapes in ``results``.
+
+        Writes ``results['img']`` (list of arrays, cast to float32 when
+        ``self.to_float32`` is set) and ``results['img_shape']``.
+        """
+        images = []
+        for path in results['img_paths']:
+            image = mmcv.imread(path, self.color_type)
+            if self.to_float32:
+                image = image.astype(np.float32)
+            images.append(image)
+        results['img'] = images
+        results['img_shape'] = [image.shape for image in images]
+        return results
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/transforms.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/datasets/pipelines/transforms.py
+# ==============================================================================
+# Binaries and/or source for the following packages or projects 
+# are presented under one or more of the following open source licenses:
+# transforms.py    The OpenLane-V2 Dataset Authors    Apache License, Version 2.0
+#
+# Contact wanghuijie@pjlab.org.cn if you have any issue.
+#
+# Copyright (c) 2023 The OpenLane-v2 Dataset Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+import numpy as np
+from numpy import random
+from math import factorial
+
+import mmcv
+from mmdet.datasets import PIPELINES
+
+
+@PIPELINES.register_module()
+class ResizeFrontView:
+    """Resize the first (front-view) image and rescale the entries of
+    ``results`` that depend on its resolution."""
+
+    def __init__(self):
+        pass
+
+    def __call__(self, results):
+        """Resize view 0 and update ``gt_te``, intrinsics and ``lidar2img``.
+
+        Args:
+            results (dict): Pipeline dict; reads ``img_paths``, ``img``,
+                ``img_shape``, ``rots``, ``trans``, ``cam2imgs`` and, when
+                present, ``gt_te``.
+
+        Returns:
+            dict: The same dict, with index 0 of ``img``, ``img_shape``,
+            ``cam_intrinsic``, ``lidar2img`` and ``cam2imgs`` replaced and
+            ``scale_factor`` added.
+        """
+        assert 'ring_front_center' in results['img_paths'][0], \
+            'the first image should be the front view'
+
+        # image
+        original = results['img'][0]
+        height, width, _ = original.shape
+        # NOTE(review): mmcv.imresize documents ``size`` as (w, h); passing
+        # (height, width) therefore swaps the two image dimensions --
+        # presumably intentional, to bring the front view to the layout of
+        # the other cameras. Confirm.
+        resized, w_scale, h_scale = mmcv.imresize(
+            original,
+            (height, width),
+            return_scale=True,
+        )
+        results['img'][0] = resized
+        results['img_shape'][0] = resized.shape
+
+        # gt
+        scale_factor = np.array(
+            [w_scale, h_scale, w_scale, h_scale],
+            dtype=np.float32,
+        )
+        results['scale_factor'] = scale_factor
+        if 'gt_te' in results:
+            results['gt_te'] = results['gt_te'] * scale_factor
+
+        # extrinsic: 4x4 matrix assembled from rotation and translation
+        rotation = results['rots'][0]
+        translation = (-results['trans'][0]) @ rotation.T
+        lidar2cam_rt = np.eye(4)
+        lidar2cam_rt[:3, :3] = rotation.T
+        lidar2cam_rt[3, :3] = -translation
+
+        # intrinsic: embed into a 4x4 matrix, then scale the x and y rows
+        intrinsic = results['cam2imgs'][0]
+        n_rows, n_cols = intrinsic.shape[0], intrinsic.shape[1]
+        viewpad = np.eye(4)
+        viewpad[:n_rows, :n_cols] = intrinsic
+
+        cam_s = np.eye(4)
+        cam_s[0, 0] = w_scale
+        cam_s[1, 1] = h_scale
+        viewpad = cam_s @ viewpad
+
+        results['cam_intrinsic'][0] = viewpad
+        results['lidar2img'][0] = viewpad @ lidar2cam_rt.T
+        # Same sub-block shape as the original intrinsic matrix.
+        results['cam2imgs'][0] = viewpad[:n_rows, :n_cols]
+
+        return results
+
+
+@PIPELINES.register_module()
+class NormalizeMultiviewImage:
+    r"""Normalize every image in ``results['img']``.
+
+    Notes
+    -----
+    Adapted from https://github.com/fundamentalvision/BEVFormer/blob/master/projects/mmdet3d_plugin/datasets/pipelines/transform_3d.py#L62.
+
+    Added key is "img_norm_cfg".
+    Args:
+        mean (sequence): Mean values of 3 channels.
+        std (sequence): Std values of 3 channels.
+        to_rgb (bool): Whether to convert the image from BGR to RGB,
+            default is true.
+    """
+
+    def __init__(self, mean, std, to_rgb=True):
+        self.mean = np.array(mean, dtype=np.float32)
+        self.std = np.array(std, dtype=np.float32)
+        self.to_rgb = to_rgb
+
+    def __call__(self, results):
+        """Normalize all views and record the normalization config.
+
+        Args:
+            results (dict): Result dict from loading pipeline.
+        Returns:
+            dict: Normalized results, 'img_norm_cfg' key is added into
+                result dict.
+        """
+        normalized = []
+        for view in results['img']:
+            normalized.append(
+                mmcv.imnormalize(view, self.mean, self.std, self.to_rgb))
+        results['img'] = normalized
+        results['img_norm_cfg'] = {
+            'mean': self.mean,
+            'std': self.std,
+            'to_rgb': self.to_rgb,
+        }
+        return results
+
+    def __repr__(self):
+        return (f'{self.__class__.__name__}'
+                f'(mean={self.mean}, std={self.std}, to_rgb={self.to_rgb})')
+
+
+@PIPELINES.register_module()
+class PhotoMetricDistortionMultiViewImage:
+    r"""
+    Notes
+    -----
+    Adapted from https://github.com/fundamentalvision/BEVFormer/blob/master/projects/mmdet3d_plugin/datasets/pipelines/transform_3d.py#L99.
+
+    Apply photometric distortion to every image in ``results['img']``
+    sequentially; each transformation is applied with a probability of 0.5.
+    Random contrast is applied either second or second to last, depending on
+    a randomly drawn ``mode``.
+    1. random brightness
+    2. random contrast (mode 1)
+    3. convert color from BGR to HSV
+    4. random saturation
+    5. random hue
+    6. convert color from HSV to BGR
+    7. random contrast (mode 0)
+    8. randomly swap channels
+    Args:
+        brightness_delta (int): delta of brightness.
+        contrast_range (tuple): range of contrast.
+        saturation_range (tuple): range of saturation.
+        hue_delta (int): delta of hue.
+    """
+
+    def __init__(self,
+                 brightness_delta=32,
+                 contrast_range=(0.5, 1.5),
+                 saturation_range=(0.5, 1.5),
+                 hue_delta=18):
+        self.brightness_delta = brightness_delta
+        self.contrast_lower, self.contrast_upper = contrast_range
+        self.saturation_lower, self.saturation_upper = saturation_range
+        self.hue_delta = hue_delta
+
+    def __call__(self, results):
+        """Call function to perform photometric distortion on images.
+
+        Each image gets its own independent sequence of random draws.
+
+        Args:
+            results (dict): Result dict from loading pipeline.
+        Returns:
+            dict: Result dict with images distorted.
+        """
+        imgs = results['img']
+        new_imgs = []
+        for img in imgs:
+            assert img.dtype == np.float32, \
+                'PhotoMetricDistortion needs the input image of dtype np.float32,'\
+                ' please set "to_float32=True" in "LoadImageFromFile" pipeline'
+            # random brightness
+            # NOTE: ``+=`` / ``*=`` below operate in place, so the array that
+            # was passed in ``results['img']`` is modified as well.
+            if random.randint(2):
+                delta = random.uniform(-self.brightness_delta,
+                                    self.brightness_delta)
+                img += delta
+
+            # mode == 1 --> do random contrast first
+            # mode == 0 --> do random contrast last
+            mode = random.randint(2)
+            if mode == 1:
+                if random.randint(2):
+                    alpha = random.uniform(self.contrast_lower,
+                                        self.contrast_upper)
+                    img *= alpha
+
+            # convert color from BGR to HSV
+            img = mmcv.bgr2hsv(img)
+
+            # random saturation (scales channel 1)
+            if random.randint(2):
+                img[..., 1] *= random.uniform(self.saturation_lower,
+                                            self.saturation_upper)
+
+            # random hue (shifts channel 0, then wraps it back into [0, 360])
+            if random.randint(2):
+                img[..., 0] += random.uniform(-self.hue_delta, self.hue_delta)
+                img[..., 0][img[..., 0] > 360] -= 360
+                img[..., 0][img[..., 0] < 0] += 360
+
+            # convert color from HSV to BGR
+            img = mmcv.hsv2bgr(img)
+
+            # random contrast (only when it was not already tried above)
+            if mode == 0:
+                if random.randint(2):
+                    alpha = random.uniform(self.contrast_lower,
+                                        self.contrast_upper)
+                    img *= alpha
+
+            # randomly swap channels
+            if random.randint(2):
+                img = img[..., random.permutation(3)]
+            new_imgs.append(img)
+        results['img'] = new_imgs
+        return results
+
+    def __repr__(self):
+        # Multi-line representation listing every configured range.
+        repr_str = self.__class__.__name__
+        repr_str += f'(\nbrightness_delta={self.brightness_delta},\n'
+        repr_str += 'contrast_range='
+        repr_str += f'{(self.contrast_lower, self.contrast_upper)},\n'
+        repr_str += 'saturation_range='
+        repr_str += f'{(self.saturation_lower, self.saturation_upper)},\n'
+        repr_str += f'hue_delta={self.hue_delta})'
+        return repr_str
+
+@PIPELINES.register_module()
+class CustomPadMultiViewImage:
+    """Pad all views to a common shape and, optionally, to a size multiple.
+
+    Args:
+        size_divisor (int, optional): When not ``None``, every image is
+            additionally padded with ``mmcv.impad_to_multiple`` using this
+            divisor.
+        pad_val: Padding value forwarded to ``mmcv.impad`` and
+            ``mmcv.impad_to_multiple``.
+    """
+
+    def __init__(self, size_divisor=None, pad_val=0):
+        self.size_divisor = size_divisor
+        self.pad_val = pad_val
+
+    def __call__(self, results):
+        """Pad ``results['img']`` and record the padding metadata.
+
+        Writes ``img``, ``pad_shape``, ``pad_fixed_size`` (always ``None``)
+        and ``pad_size_divisor`` into ``results`` and returns it.
+        """
+        # Views may differ in size; pad each one to the largest height/width.
+        max_h = max(img.shape[0] for img in results['img'])
+        max_w = max(img.shape[1] for img in results['img'])
+        padded_img = [mmcv.impad(img, shape=(max_h, max_w), pad_val=self.pad_val) for img in results['img']]
+        if self.size_divisor is not None:
+            padded_img = [mmcv.impad_to_multiple(
+                img, self.size_divisor, pad_val=self.pad_val) for img in padded_img]
+
+        results['img'] = padded_img
+        results['pad_shape'] = [img.shape for img in padded_img]
+        results['pad_fixed_size'] = None
+        results['pad_size_divisor'] = self.size_divisor
+
+        return results
+
+    def __repr__(self):
+        # The opening parenthesis was missing, which produced
+        # "CustomPadMultiViewImagesize_divisor=..., pad_val=...)".
+        repr_str = self.__class__.__name__
+        repr_str += f'(size_divisor={self.size_divisor}, '
+        repr_str += f'pad_val={self.pad_val})'
+        return repr_str
+
+
+@PIPELINES.register_module()
+class CustomParameterizeLane:
+    """Replace ``results['gt_lc']`` by a fixed-size parameterization.
+
+    Args:
+        method (str): Name of the parameterization method; one of
+            ``'bezier'``, ``'polygon'``, ``'bezier_Direction_attribute'``
+            or ``'bezier_Endpointfixed'``.
+        method_para (dict): Keyword arguments forwarded to that method.
+
+    Raises:
+        NotImplementedError: If ``method`` is not one of the names above.
+    """
+
+    def __init__(self, method, method_para):
+        method_list = ['bezier', 'polygon', 'bezier_Direction_attribute', 'bezier_Endpointfixed']
+        if method not in method_list:
+            raise NotImplementedError("Not implemented!")
+        self.method = method
+        self.method_para = method_para
+
+    def __call__(self, results):
+        """Parameterize ``results['gt_lc']`` with the configured method."""
+        centerlines = results['gt_lc']
+        para_centerlines = getattr(self, self.method)(centerlines, **self.method_para)
+        results['gt_lc'] = para_centerlines
+        return results
+
+    def comb(self, n, k):
+        """Return the binomial coefficient ``n`` choose ``k``."""
+        return factorial(n) // (factorial(k) * factorial(n - k))
+
+    def _bernstein_matrix(self, n_points, n_control):
+        """Return the ``(n_points, n_control)`` Bernstein basis matrix.
+
+        Row ``i`` is evaluated at ``t_i = i / (n_points - 1)``, i.e. the
+        samples are treated as uniformly spaced in the curve parameter.
+        """
+        degree = n_control - 1
+        binomials = [self.comb(degree, j) for j in range(n_control)]
+        A = np.zeros((n_points, n_control))
+        t = np.arange(n_points) / (n_points - 1)
+        for i in range(n_points):
+            for j in range(n_control):
+                A[i, j] = binomials[j] * np.power(1 - t[i], degree - j) * np.power(t[i], j)
+        return A
+
+    @staticmethod
+    def _swap_xy(centerline):
+        """Return the first two columns of ``centerline`` in swapped order."""
+        return np.asarray(centerline)[:, [1, 0]]
+
+    @staticmethod
+    def _is_reversed(control_points, points):
+        """Tell whether the fitted end points match ``points`` better when
+        the control points are read in reverse order."""
+        start_res = control_points[0]
+        end_res = control_points[-1]
+        first_diff = np.sum(np.square(start_res - points[0])) + np.sum(np.square(end_res - points[-1]))
+        second_diff = np.sum(np.square(start_res - points[-1])) + np.sum(np.square(end_res - points[0]))
+        return not (first_diff <= second_diff)
+
+    def fit_bezier(self, points, n_control):
+        """Least-squares fit of ``n_control`` Bezier control points.
+
+        Returns:
+            tuple: The full ``np.linalg.lstsq`` result; element 0 holds the
+            control points.
+        """
+        A = self._bernstein_matrix(len(points), n_control)
+        conts = np.linalg.lstsq(A, points, rcond=None)
+        return conts
+
+    def fit_bezier_Endpointfixed(self, points, n_control):
+        """Fit a Bezier curve whose first/last control points equal the
+        first/last input points; only interior control points are solved.
+
+        Returns:
+            np.ndarray: Control points of shape ``(n_control, points.shape[1])``.
+        """
+        A = self._bernstein_matrix(len(points), n_control)
+
+        control_points = np.zeros((n_control, points.shape[1]))
+        control_points[0] = points[0]
+        control_points[-1] = points[-1]
+
+        # With two (or fewer) control points there is no interior point to
+        # solve for, so the least-squares problem would have zero unknowns.
+        if n_control > 2:
+            # Move the contribution of the fixed end points to the
+            # right-hand side before solving for the interior points.
+            rhs = points[1:-1] \
+                - A[1:-1, 0].reshape(-1, 1) @ points[0].reshape(1, -1) \
+                - A[1:-1, -1].reshape(-1, 1) @ points[-1].reshape(1, -1)
+            control_points[1:-1] = np.linalg.lstsq(A[1:-1, 1:-1], rhs, rcond=None)[0]
+
+        return control_points
+
+    def bezier(self, input_data, n_control=2):
+        """Fit each centerline, orient the control points from its first to
+        its last point, clip them to ``[0, 1]`` and flatten them.
+
+        Returns:
+            np.ndarray: One float32 row of flattened control points per
+            centerline.
+        """
+        coeffs_list = []
+        for centerline in input_data:
+            points = self._swap_xy(centerline)
+            res = self.fit_bezier(points, n_control)[0]
+            if self._is_reversed(res, points):
+                res = res[::-1]
+            fin_res = np.clip(res, 0, 1)
+            coeffs_list.append(np.reshape(np.float32(fin_res), (-1)))
+
+        return np.array(coeffs_list)
+
+    def bezier_Direction_attribute(self, input_data, n_control=3):
+        """Fit each centerline and append a direction flag.
+
+        The flag is 0 when the fitted end points follow the order of the
+        input points and 1 otherwise; the control points themselves are
+        clipped to ``[0, 1]`` but not reordered.
+
+        Returns:
+            np.ndarray: One float32 row per centerline: flattened control
+            points followed by the flag.
+        """
+        coeffs_list = []
+        for centerline in input_data:
+            points = self._swap_xy(centerline)
+            res = self.fit_bezier(points, n_control)[0]
+            da = 1 if self._is_reversed(res, points) else 0
+            fin_res = np.append(np.clip(res, 0, 1), da)
+            coeffs_list.append(np.reshape(np.float32(fin_res), (-1)))
+        return np.array(coeffs_list)
+
+    def bezier_Endpointfixed(self, input_data, n_control=2):
+        """Fit each centerline with fixed end points and flatten the result.
+
+        Unlike the other methods, the centerline columns are used as given
+        (no column swap, no clipping).
+        """
+        coeffs_list = [
+            self.fit_bezier_Endpointfixed(centerline, n_control).flatten()
+            for centerline in input_data
+        ]
+        return np.array(coeffs_list, dtype=np.float32)
+
+    def polygon(self, input_data, key_rep='Bounding Box'):
+        """Describe each centerline by a few key points.
+
+        Args:
+            input_data: Iterable of centerline arrays.
+            key_rep (str): ``'Bounding Box'`` (min/max corners), ``'SME'``
+                (start, end, middle point) or ``'Extreme Points'`` (left-,
+                right-, top- and bottom-most point; first occurrence on
+                ties).
+
+        Raises:
+            ValueError: If ``key_rep`` is not one of the values above. This
+                is checked up front, so it also triggers for empty input.
+        """
+        if key_rep not in ['Bounding Box', 'SME', 'Extreme Points']:
+            raise ValueError(f"{key_rep} not existed!")
+
+        keypoints = []
+        for centerline in input_data:
+            points = self._swap_xy(centerline)
+            xs, ys = points[:, 0], points[:, 1]
+            if key_rep == 'Bounding Box':
+                res = np.array([xs.min(), ys.min(), xs.max(), ys.max()]).reshape((2, 2))
+            elif key_rep == 'SME':
+                res = np.array([points[0], points[-1], points[len(points) // 2]])
+            else:
+                res = np.array([
+                    points[np.argmin(xs)],
+                    points[np.argmax(xs)],
+                    points[np.argmax(ys)],
+                    points[np.argmin(ys)],
+                ])
+            keypoints.append(np.reshape(np.float32(res), (-1)))
+        return np.array(keypoints)
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/__init__.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/__init__.py
+from .detectors import *
+from .heads import *
+from .necks import *
+from .modules import *
+from .backbones import *
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/__init__.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/__init__.py
+from .intern_image import InternImage
+
+__all__ = ['InternImage']
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/intern_image.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/intern_image.py
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/functions/__init__.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/functions/__init__.py
+# --------------------------------------------------------
+# InternImage
+# Copyright (c) 2022 OpenGVLab
+# Licensed under The MIT License [see LICENSE for details]
+# --------------------------------------------------------
+
+from .dcnv3_func import DCNv3Function, dcnv3_core_pytorch
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/functions/dcnv3_func.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/functions/dcnv3_func.py
+# --------------------------------------------------------
+# InternImage
+# Copyright (c) 2022 OpenGVLab
+# Licensed under The MIT License [see LICENSE for details]
+# --------------------------------------------------------
+
+from __future__ import absolute_import
+from __future__ import print_function
+from __future__ import division
+
+import torch
+import torch.nn.functional as F
+from torch.autograd import Function
+from torch.autograd.function import once_differentiable
+from torch.cuda.amp import custom_bwd, custom_fwd
+import DCNv3
+
+
+class DCNv3Function(Function):
+    """Autograd ``Function`` that forwards to the imported ``DCNv3`` module.
+
+    ``forward`` calls ``DCNv3.dcnv3_forward`` and ``backward`` calls
+    ``DCNv3.dcnv3_backward``; ``symbolic`` defines the ONNX export node.
+    """
+
+    @staticmethod
+    @custom_fwd
+    def forward(
+            ctx, input, offset, mask,
+            kernel_h, kernel_w, stride_h, stride_w,
+            pad_h, pad_w, dilation_h, dilation_w,
+            group, group_channels, offset_scale, im2col_step):
+        """Run ``DCNv3.dcnv3_forward`` and stash what ``backward`` needs.
+
+        The twelve non-tensor arguments are stored as attributes on ``ctx``;
+        ``input``, ``offset`` and ``mask`` are saved via
+        ``ctx.save_for_backward``.
+        """
+        ctx.kernel_h = kernel_h
+        ctx.kernel_w = kernel_w
+        ctx.stride_h = stride_h
+        ctx.stride_w = stride_w
+        ctx.pad_h = pad_h
+        ctx.pad_w = pad_w
+        ctx.dilation_h = dilation_h
+        ctx.dilation_w = dilation_w
+        ctx.group = group
+        ctx.group_channels = group_channels
+        ctx.offset_scale = offset_scale
+        ctx.im2col_step = im2col_step
+        output = DCNv3.dcnv3_forward(
+            input, offset, mask, kernel_h,
+            kernel_w, stride_h, stride_w, pad_h,
+            pad_w, dilation_h, dilation_w, group,
+            group_channels, offset_scale, ctx.im2col_step)
+        ctx.save_for_backward(input, offset, mask)
+
+        return output
+
+    @staticmethod
+    @once_differentiable
+    @custom_bwd
+    def backward(ctx, grad_output):
+        """Return gradients for ``input``, ``offset`` and ``mask``.
+
+        The trailing ``None`` values correspond, one each, to the twelve
+        non-tensor arguments of ``forward``.
+        """
+        input, offset, mask = ctx.saved_tensors
+        # ``grad_output`` is made contiguous before it is handed over.
+        grad_input, grad_offset, grad_mask = \
+            DCNv3.dcnv3_backward(
+                input, offset, mask, ctx.kernel_h,
+                ctx.kernel_w, ctx.stride_h, ctx.stride_w, ctx.pad_h,
+                ctx.pad_w, ctx.dilation_h, ctx.dilation_w, ctx.group,
+                ctx.group_channels, ctx.offset_scale, grad_output.contiguous(), ctx.im2col_step)
+
+        return grad_input, grad_offset, grad_mask, \
+            None, None, None, None, None, None, None, None, None, None, None, None
+
+    @staticmethod
+    def symbolic(g, input, offset, mask, kernel_h, kernel_w, stride_h,
+                 stride_w, pad_h, pad_w, dilation_h, dilation_w, group,
+                 group_channels, offset_scale, im2col_step):
+        """Symbolic function for mmdeploy::TRTDCNv3.
+
+        The scalar arguments are cast to ``int`` (``offset_scale`` to
+        ``float``) and attached as node attributes.
+
+        Returns:
+            TRTDCNv3 op for onnx.
+        """
+        return g.op(
+            'mmdeploy::TRTDCNv3',
+            input,
+            offset,
+            mask,
+            kernel_h_i=int(kernel_h),
+            kernel_w_i=int(kernel_w),
+            stride_h_i=int(stride_h),
+            stride_w_i=int(stride_w),
+            pad_h_i=int(pad_h),
+            pad_w_i=int(pad_w),
+            dilation_h_i=int(dilation_h),
+            dilation_w_i=int(dilation_w),
+            group_i=int(group),
+            group_channels_i=int(group_channels),
+            offset_scale_f=float(offset_scale),
+            im2col_step_i=int(im2col_step),
+        )
+
+def _get_reference_points(spatial_shapes, device, kernel_h, kernel_w, dilation_h, dilation_w, pad_h=0, pad_w=0, stride_h=1, stride_w=1):
+    """Return normalized kernel-centre coordinates for every output position.
+
+    Args:
+        spatial_shapes: 4-tuple whose second and third entries are the
+            (already padded) input height and width.
+        device: Device on which the tensors are created.
+        kernel_h, kernel_w, dilation_h, dilation_w, stride_h, stride_w:
+            Convolution geometry.
+        pad_h, pad_w: Unused by this function.
+
+    Returns:
+        torch.Tensor: Shape ``(1, H_out, W_out, 1, 2)``; the last axis holds
+        ``(x / W_, y / H_)``.
+    """
+    _, H_, W_, _ = spatial_shapes
+    extent_h = dilation_h * (kernel_h - 1)
+    extent_w = dilation_w * (kernel_w - 1)
+    H_out = (H_ - (extent_h + 1)) // stride_h + 1
+    W_out = (W_ - (extent_w + 1)) // stride_w + 1
+
+    # Centre of the first kernel window along each axis (pixel centres sit
+    # at +0.5); subsequent windows are one stride apart.
+    first_y = extent_h // 2 + 0.5
+    first_x = extent_w // 2 + 0.5
+    rows = torch.linspace(
+        first_y,
+        first_y + (H_out - 1) * stride_h,
+        H_out,
+        dtype=torch.float32,
+        device=device)
+    cols = torch.linspace(
+        first_x,
+        first_x + (W_out - 1) * stride_w,
+        W_out,
+        dtype=torch.float32,
+        device=device)
+    ref_y, ref_x = torch.meshgrid(rows, cols)
+
+    # Normalize by the input size and pair up as (x, y).
+    ref = torch.stack((ref_x / W_, ref_y / H_), -1)
+    return ref.reshape(1, H_out, W_out, 1, 2)
+
+
+def _generate_dilation_grids(spatial_shapes, kernel_h, kernel_w, dilation_h, dilation_w, group, device):
+    """Build the normalised offsets of the kernel taps, repeated per group.
+
+    Args:
+        spatial_shapes: 4-element shape; only entries 1 and 2 are read and
+            are treated as height and width.
+        kernel_h, kernel_w: Kernel extent along each axis.
+        dilation_h, dilation_w: Spacing between neighbouring taps.
+        group: Number of times the tap set is repeated.
+        device: Device on which the tensors are created.
+
+    Returns:
+        float32 tensor of shape ``(1, 1, 1, group * kernel_h * kernel_w, 2)``
+        whose last axis holds ``(dx / width, dy / height)``.
+    """
+    _, height, width, _ = spatial_shapes
+
+    # Taps run from minus the (floored) half-extent in steps of the dilation.
+    left = -((dilation_w * (kernel_w - 1)) // 2)
+    top = -((dilation_h * (kernel_h - 1)) // 2)
+    taps_x = torch.linspace(
+        left, left + (kernel_w - 1) * dilation_w, kernel_w,
+        dtype=torch.float32, device=device)
+    taps_y = torch.linspace(
+        top, top + (kernel_h - 1) * dilation_h, kernel_h,
+        dtype=torch.float32, device=device)
+    mesh_x, mesh_y = torch.meshgrid(taps_x, taps_y)
+
+    # (taps, 1, 2) -> (taps, group, 2) -> (group, taps, 2): one copy of the
+    # full tap list per group, laid out group after group.
+    taps = torch.stack([mesh_x / width, mesh_y / height], -1).reshape(-1, 1, 2)
+    per_group = taps.repeat(1, group, 1).permute(1, 0, 2)
+
+    return per_group.reshape(1, 1, 1, group * kernel_h * kernel_w, 2)
+
+
+
+
+def dcnv3_core_pytorch(
+        input, offset, mask, kernel_h,
+        kernel_w, stride_h, stride_w, pad_h,
+        pad_w, dilation_h, dilation_w, group,
+        group_channels, offset_scale):
+    """Pure-PyTorch DCNv3 sampling core built on ``F.grid_sample``.
+
+    For debug and test only; use the CUDA version instead.
+
+    Args:
+        input: Channels-last tensor ``(N, H, W, group * group_channels)``.
+        offset: ``(N, H_out, W_out, group * kernel_h * kernel_w * 2)``;
+            the last axis is read as interleaved ``(x, y)`` pairs, scaled by
+            ``offset_scale`` and divided by the padded width / height.
+        mask: ``(N, H_out, W_out, group * kernel_h * kernel_w)`` weights
+            multiplied onto the sampled values before summing over the taps.
+        kernel_h, kernel_w: Kernel extent along each axis.
+        stride_h, stride_w: Output stride along each axis.
+        pad_h, pad_w: Zero padding added on both sides of the height /
+            width axis of ``input``.
+        dilation_h, dilation_w: Spacing between kernel taps.
+        group: Number of groups the channels are split into.
+        group_channels: Channels per group.
+        offset_scale: Multiplier applied to both the fixed kernel grid and
+            the supplied offsets.
+
+    Returns:
+        Contiguous tensor ``(N, H_out, W_out, group * group_channels)``.
+    """
+    # F.pad consumes (before, after) pairs starting from the LAST dimension.
+    # For an (N, H, W, C) tensor that is C, then W, then H, so the width
+    # padding has to come before the height padding.
+    input = F.pad(
+        input,
+        [0, 0, pad_w, pad_w, pad_h, pad_h])
+    N_, H_in, W_in, _ = input.shape
+    _, H_out, W_out, _ = offset.shape
+
+    ref = _get_reference_points(
+        input.shape, input.device, kernel_h, kernel_w, dilation_h, dilation_w, pad_h, pad_w, stride_h, stride_w)
+    grid = _generate_dilation_grids(
+        input.shape, kernel_h, kernel_w, dilation_h, dilation_w, group, input.device)
+    # [W, H] repeated once per (group, tap) so it lines up with the flattened
+    # (x, y) pairs in ``offset``.
+    spatial_norm = torch.tensor([W_in, H_in]).reshape(1, 1, 1, 2).\
+        repeat(1, 1, 1, group*kernel_h*kernel_w).to(input.device)
+
+    # Normalised sampling position = reference point + scaled kernel tap
+    # + scaled, size-normalised offset.
+    sampling_locations = (ref + grid * offset_scale).repeat(N_, 1, 1, 1, 1).flatten(3, 4) + \
+        offset * offset_scale / spatial_norm
+
+    P_ = kernel_h * kernel_w
+    # grid_sample expects coordinates in [-1, 1] rather than [0, 1].
+    sampling_grids = 2 * sampling_locations - 1
+    # N_, H_in, W_in, group*group_channels -> N_, H_in*W_in, group*group_channels -> N_, group*group_channels, H_in*W_in -> N_*group, group_channels, H_in, W_in
+    # reshape (not view) so a non-contiguous caller tensor does not raise.
+    input_ = input.reshape(N_, H_in*W_in, group*group_channels).transpose(1, 2).\
+        reshape(N_*group, group_channels, H_in, W_in)
+    # N_, H_out, W_out, group*P_*2 -> N_, H_out*W_out, group, P_, 2 -> N_, group, H_out*W_out, P_, 2 -> N_*group, H_out*W_out, P_, 2
+    sampling_grid_ = sampling_grids.view(N_, H_out*W_out, group, P_, 2).transpose(1, 2).\
+        flatten(0, 1)
+    # N_*group, group_channels, H_out*W_out, P_
+    sampling_input_ = F.grid_sample(
+        input_, sampling_grid_, mode='bilinear', padding_mode='zeros', align_corners=False)
+
+    # (N_, H_out, W_out, group*P_) -> N_, H_out*W_out, group, P_ -> (N_, group, H_out*W_out, P_) -> (N_*group, 1, H_out*W_out, P_)
+    mask = mask.reshape(N_, H_out*W_out, group, P_).transpose(1, 2).\
+        reshape(N_*group, 1, H_out*W_out, P_)
+    # Weight every sampled tap and sum over the taps.
+    output = (sampling_input_ * mask).sum(-1).view(N_,
+                                                   group*group_channels, H_out*W_out)
+
+    return output.transpose(1, 2).reshape(N_, H_out, W_out, -1).contiguous()
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/make.sh
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/make.sh
+#!/usr/bin/env bash
+# --------------------------------------------------------
+# InternImage
+# Copyright (c) 2022 OpenGVLab
+# Licensed under The MIT License [see LICENSE for details]
+# --------------------------------------------------------
+
+# Build and install the package described by the setup.py found in the
+# current working directory.
+python setup.py build install
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/modules/__init__.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/modules/__init__.py
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/modules/dcnv3.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/modules/dcnv3.py
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/setup.py
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/setup.py
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/src/cpu/dcnv3_cpu.cpp
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/src/cpu/dcnv3_cpu.cpp
--- a/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/src/cpu/dcnv3_cpu.h
+++ b/autonomous_driving/openlane-v2/plugin/mmdet3d/baseline/models/backbones/ops_dcnv3/src/cpu/dcnv3_cpu.h