Source code for cosense3d.agents.utils.transform



import torch
import numpy as np
from scipy.spatial.transform import Rotation as R
from torch_scatter import scatter_mean

from cosense3d.utils import pclib, box_utils
from cosense3d.modules.utils.common import limit_period


def add_rotate(tf, rot):
    """Apply an additional rotation to the 4x4 transformation matrix ``tf``."""
    if isinstance(rot, list) and len(rot) == 3:
        # param: [roll, pitch, yaw] in radian
        rot = pclib.rotation_matrix(rot, degrees=False)
        rot = torch.from_numpy(rot).to(tf.device)
        tf[:3, :3] = rot @ tf[:3, :3]
    elif isinstance(rot, torch.Tensor):
        assert rot.shape[0] == 4
        tf = rot.to(tf.device) @ tf
    else:
        raise NotImplementedError
    return tf

def add_flip(tf, flip_idx, flip_axis='xy'):
    # flip_idx == 1: flip x
    # flip_idx == 2: flip y
    # flip_idx == 3: flip x & y
    rot = torch.eye(4).to(tf.device)
    # flip x
    if 'x' in flip_axis and (flip_idx == 1 or flip_idx == 3):
        rot[0, 0] *= -1
    # flip y
    if 'y' in flip_axis and (flip_idx == 2 or flip_idx == 3):
        rot[1, 1] *= -1
    tf = rot @ tf
    return tf

def add_scale(tf, scale_ratio):
    scale = torch.eye(4).to(tf.device)
    scale[[0, 1, 2], [0, 1, 2]] = scale_ratio
    tf = scale @ tf
    return tf

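# Usage sketch (illustrative, not part of the original module): the three
# helpers above compose into a single augmentation matrix. Here
# pclib.rotation_matrix is assumed to accept [roll, pitch, yaw] in radians,
# as the comment in add_rotate suggests.
#
#     tf = torch.eye(4)
#     tf = add_rotate(tf, [0.0, 0.0, np.pi / 4])  # rotate 45 degrees around z
#     tf = add_flip(tf, flip_idx=2)               # mirror along the y-axis
#     tf = add_scale(tf, 1.05)                    # scale all axes by 5%
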
def apply_transform(data, transform, key):
    """Apply ``transform`` in place to the entry of ``data`` selected by ``key``."""
    if (transform.cpu() == torch.eye(4)).all():
        return
    if key == 'points':
        C = data['points'].shape[-1]
        points = data['points'][:, :3]
        points = torch.cat([points, torch.ones_like(points[:, :1])], dim=-1).T
        points = (transform @ points).T
        if C > 3:
            data['points'] = torch.cat([points[:, :3], data['points'][:, 3:]], dim=-1)
        else:
            data['points'] = points
    elif 'annos_global' == key or 'annos_local' == key:
        box_key = f"{key.split('_')[1]}_bboxes_3d"
        if box_key not in data or data[box_key] is None:
            return
        boxes = data[box_key]
        data[box_key][:, :7] = box_utils.transform_boxes_3d(boxes[:, :7], transform, mode=7)
    elif key == 'annos_global_pred':
        preds = data['bboxes_3d_pred']
        boxes = data['global_bboxes_3d'][..., :7].detach().clone()
        boxes = boxes.unsqueeze(0).repeat(2, 1, 1)
        boxes[..., [0, 1, 2, 6]] = data['bboxes_3d_pred']
        boxes = box_utils.transform_boxes_3d(boxes.view(-1, 7), transform, mode=7)
        data['bboxes_3d_pred'] = boxes[..., [0, 1, 2, 6]].reshape(*preds.shape)
    elif key == 'img':
        for i in range(len(data['img'])):
            data['extrinsics'][i] = data['extrinsics'][i] @ transform.inverse()
            data['lidar2img'][i] = data['intrinsics'][i] @ data['extrinsics'][i]
    elif key == 'bev_tgt_pts' and key in data:
        if data[key] is None:
            return
        points = data['bev_tgt_pts'].clone()
        points[:, 2] = 0
        points = torch.cat([points, torch.ones_like(points[:, :1])], dim=-1).T
        points = (transform @ points).T
        data['bev_tgt_pts'][:, :2] = points[:, :2]
    elif 'roadline' in key and key in data:
        if data[key] is None:
            return
        points = data[key][:, :2].clone()
        points = torch.cat([points, torch.ones_like(points)], dim=-1).T
        points[2] = 0
        points = (transform @ points).T
        data[key][:, :2] = points[:, :2]

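# Usage sketch (hypothetical data, illustration only): apply_transform mutates
# data in place; points are lifted to homogeneous Nx4 coordinates, multiplied
# by the 4x4 transform, and feature channels beyond xyz are carried over.
#
#     data = {'points': torch.randn(100, 4)}           # x, y, z, intensity
#     tf = add_rotate(torch.eye(4), [0.0, 0.0, 0.1])   # small yaw
#     apply_transform(data, tf, key='points')          # data['points'] updated
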
def filter_range(data, lidar_range, key):
    if 'points' in key:
        mask = filter_range_mask(data[key], lidar_range)
        points = data[key][mask]
        if len(points) == 0:
            # pad empty point cloud with random points to ensure batch norm validity
            points = data[key].new_zeros((8, points.shape[-1]))
            points[:, :2] = torch.rand_like(points[:, :2]) * 2 - 1
            points[:, 3] = -1
            points[:, -1] = data[key][:, -1].min()
        data[key] = points
    elif 'annos_global' == key or 'annos_local' == key:
        coor = key.split('_')[1]
        if f'{coor}_bboxes_3d' not in data or data[f'{coor}_bboxes_3d'] is None:
            return
        mask = filter_range_mask(data[f'{coor}_bboxes_3d'][:, :3], lidar_range)
        data[f'{coor}_bboxes_3d'] = data[f'{coor}_bboxes_3d'][mask]
        data[f'{coor}_labels_3d'] = data[f'{coor}_labels_3d'][mask]
        data[f'{coor}_bboxes_id'] = data[f'{coor}_bboxes_id'][mask]
        data[f'{coor}_names'] = [data[f'{coor}_names'][i] for i, m in enumerate(mask) if m]
        if coor == 'global' and 'bboxes_3d_pred' in data:
            data['bboxes_3d_pred'] = data['bboxes_3d_pred'][:, mask]

def filter_range_mask(points, lidar_range, eps=1e-4):
    """Return a boolean mask of points strictly inside ``lidar_range``."""
    lr = lidar_range.to(points.device)
    mask = (points[:, :3] > lr[:3].view(1, 3) + eps) & (points[:, :3] < lr[3:].view(1, 3) - eps)
    return mask.all(dim=-1)

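# Usage sketch (hypothetical values): lidar_range is a 6-element tensor
# [x_min, y_min, z_min, x_max, y_max, z_max]; the mask keeps points strictly
# inside this box, shrunk by eps on every side.
#
#     lidar_range = torch.tensor([-50., -50., -3., 50., 50., 1.])
#     points = torch.randn(1000, 4) * 30
#     inside = filter_range_mask(points, lidar_range)  # bool tensor, shape (1000,)
#     points = points[inside]
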
def generate_bev_tgt_pts(points, data, transform=None, sam_res=0.4, map_res=0.2,
                         range=50, max_num_pts=5000, discrete=False):
    if 'bevmap' not in data or data['bevmap'] is None:
        return None
    bevmap = data['bevmap']
    bevmap_coor = data['bevmap_coor']
    sx, sy = bevmap.shape[:2]

    points2d = points[:, :2]
    points2d = points2d[(points2d.abs() <= range).all(1)]
    device = points2d.device
    # sample random points around the lidar points
    offsets = torch.randn((len(points2d), 10, 2), device=device) * 3
    points2d = (points2d.reshape(-1, 1, 2) + offsets).reshape(-1, 2)
    points2d = torch.unique(torch.floor(points2d / sam_res).int(), dim=0) * sam_res
    if not discrete:
        points2d = points2d + torch.randn_like(points2d)

    # transform points to global coordinates and look up the bev map
    if transform is not None:
        points = torch.cat([points2d,
                            torch.zeros_like(points2d[:, :1]),
                            torch.ones_like(points2d[:, :1])], dim=-1)
        points = transform @ points.T
    else:
        points = points2d.T
    xs = torch.floor((points[0] - bevmap_coor[0]) / map_res).int()
    ys = torch.floor((points[1] - bevmap_coor[1]) / map_res).int()
    xs = torch.clamp(xs, 0, sx - 1).long()
    ys = torch.clamp(ys, 0, sy - 1).long()
    road_mask = bevmap[xs, ys]

    bev_pts = torch.cat([points2d, road_mask.unsqueeze(1)], dim=1)
    return bev_pts[torch.randperm(len(bev_pts))[:max_num_pts]]

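# Usage sketch (assumed data layout): data['bevmap'] is a 2D road-occupancy
# grid indexed as [x, y] and data['bevmap_coor'] holds the metric coordinates
# of its lower corner. The returned tensor has columns [x, y, road_label].
#
#     data = {'bevmap': torch.zeros(500, 500), 'bevmap_coor': [-50., -50.]}
#     pts = torch.randn(2000, 4) * 20
#     bev_pts = generate_bev_tgt_pts(pts, data, sam_res=0.4, map_res=0.2)
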
class DataOnlineProcessor:
    @staticmethod
    def update_transform_with_aug(transform, aug_params):
        if 'rot' in aug_params:
            transform = add_rotate(transform, aug_params['rot'])
        if 'flip' in aug_params:
            transform = add_flip(transform, **aug_params['flip'])
        if 'scale' in aug_params:
            transform = add_scale(transform, aug_params['scale'])
        return transform

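    # Usage sketch (hypothetical aug_params): keys mirror the module-level
    # helpers; 'flip' is unpacked as keyword arguments for add_flip.
    #
    #     aug_params = {'rot': [0.0, 0.0, 0.3],   # roll, pitch, yaw in radians
    #                   'flip': {'flip_idx': 3},  # flip both x and y
    #                   'scale': 0.95}
    #     tf = DataOnlineProcessor.update_transform_with_aug(torch.eye(4), aug_params)
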
    @staticmethod
    def apply_transform(data, transform, apply_to=['points']):
        for k in apply_to:
            apply_transform(data, transform, k)

    @staticmethod
    def cav_aug_transform(data, transform, aug_params,
                          apply_to=['points', 'imgs', 'annos_global']):
        # augmentation
        if aug_params is not None:
            transform = DataOnlineProcessor.update_transform_with_aug(transform, aug_params)
        DataOnlineProcessor.apply_transform(data, transform, apply_to)

    @staticmethod
    def filter_range(data, lidar_range, apply_to: list):
        for k in apply_to:
            filter_range(data, lidar_range, k)

    @staticmethod
    @torch.no_grad()
    def free_space_augmentation(data, d: float = 10.0, h: float = -1.5,
                                step: float = 1.5, res: float = 0.25):
        lidar = data['points']
        # keep only points lower than height h (default -1.5 m)
        m = lidar[:, 2] < h
        points = lidar[m][:, :3]
        # generate free space points along the rays towards these points
        dists = torch.norm(points[:, :2], dim=1).reshape(-1, 1)
        delta_d = torch.arange(1, d, step, device=lidar.device).reshape(1, -1)
        tmp = (dists - delta_d) / dists  # N x steps
        xyz_new = points[:, None, :] * tmp[:, :, None]  # N x steps x 3
        # 1. remove free space points with negative distances to the lidar center
        # 2. remove free space points higher than h
        # 3. deduplicate by averaging points that fall into the same voxel
        xyz_new = xyz_new[tmp > 0]
        xyz_new = xyz_new[(xyz_new[..., 2] < h)]
        xyz_new = xyz_new[torch.randperm(len(xyz_new))]
        selected = torch.unique(torch.floor(xyz_new * res).long(),
                                return_inverse=True, dim=0)[1]
        xyz_new = scatter_mean(src=xyz_new, index=selected, dim=0)
        # pad free space point intensity as -1
        xyz_new = torch.cat([xyz_new, -torch.ones_like(xyz_new[:, :1])], dim=-1)
        data['points'] = torch.cat([lidar, xyz_new], dim=0)

    @staticmethod
    @torch.no_grad()
    def adaptive_free_space_augmentation(data: dict, min_h: float = -1.5, steps: int = 20,
                                         alpha: float = 0.05, res: float = 0.5,
                                         time_idx: int = None):
        r"""
        Add free space points according to the distance of points to the origin.

        .. raw:: html

            <pre>
            lidar origin -> *
                            | *
                            |   *
                          h |     *  ele
                            |       *
                            +---------*--------
                                 d
            </pre>

        Assume :math:`\theta = \frac{\pi}{2} - \text{ele}` (:math:`\text{ele}` is the
        elevation angle), :math:`\alpha` is the average angle between two lidar rings,
        :math:`d_k` is the ground distance of the :math:`k`-th lidar ring to the lidar
        origin, :math:`k = 1, \dots, n`, and :math:`\delta_d` is the distance between
        two neighboring lidar rings. Then

        .. math::
            d &= h \tan(\theta) \\
            \delta_d &= d_n - d_{n-1} = d_n - h \tan\left(\arctan\left(\frac{h}{d_n}\right) - \alpha\right)

        Free space points are sampled over the ground distance :math:`\delta_d` relative
        to each ring, at ``steps`` evenly spaced offsets.

        :param data: input data dict containing 'points'.
        :param min_h: minimum sample height relative to lidar origin. Default is -1.5.
        :param steps: number of points to be sampled for each lidar ray. Default is 20.
        :param alpha: average angle offset between two neighboring lidar casting rays. Default is 0.05.
        :param res: resolution for down-sampling the free space points. Default is 0.5.
        :param time_idx: if provided, timestamps are copied from the original points to the free space points.
        :return: updated data.
        """
        lidar = data['points']
        # keep only points lower than height min_h (default -1.5 m)
        m = lidar[:, 2] < min_h
        points = lidar[m]
        # generate free space points along the rays towards these points
        dn = torch.norm(points[:, :2], dim=1).view(-1, 1)
        dn1 = -points[:, 2:3] * torch.tan(torch.atan2(dn, -points[:, 2:3]) - alpha)
        delta_d = dn - dn1
        frac = torch.linspace(0, 1, steps + 1)[:-1].view(1, steps).to(delta_d.device)
        tmp = (dn - frac * delta_d) / dn  # N x steps
        xyz_new = points[:, None, :3] * tmp[:, :, None]  # N x steps x 3
        if time_idx is not None:
            times = points[:, time_idx].view(-1, 1, 1).repeat(1, steps, 1)
            xyz_new = torch.cat([xyz_new, times], dim=-1)
        # 1. remove free space points with negative distances to the lidar center
        # 2. (disabled) remove free space points higher than min_h
        # 3. deduplicate by averaging points that fall into the same voxel
        xyz_new = xyz_new[tmp > 0]
        # xyz_new = xyz_new[(xyz_new[..., 2] < min_h)]
        xyz_new = xyz_new[torch.randperm(len(xyz_new))]
        uniq, selected = torch.unique(torch.floor(xyz_new[..., :3] * res).long(),
                                      return_inverse=True, dim=0)
        # shift times to be non-negative before averaging, then shift back
        tmin = xyz_new[:, -1].min()
        xyz_new[:, -1] -= tmin
        xyz_new = scatter_mean(src=xyz_new, index=selected, dim=0)
        xyz_new[:, -1] += tmin
        # pad free space point intensity as -1
        xyz_new = torch.cat([xyz_new[:, :3], -torch.ones_like(xyz_new[:, :1]), xyz_new[:, 3:]], dim=-1)
        pad_dim = lidar.shape[-1] - xyz_new.shape[-1]
        if pad_dim > 0:
            xyz_new = torch.cat([xyz_new, torch.zeros_like(xyz_new[:, :1]).repeat(1, pad_dim)], dim=-1)
        data['points'] = torch.cat([lidar, xyz_new], dim=0)

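    # Usage sketch (hypothetical point layout): augment a raw cloud in place,
    # assuming column 4 carries per-point timestamps.
    #
    #     data = {'points': torch.randn(5000, 5)}  # x, y, z, intensity, time
    #     DataOnlineProcessor.adaptive_free_space_augmentation(data, time_idx=4)
    #     # data['points'] now also holds free-space samples with intensity -1
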
    @staticmethod
    @torch.no_grad()
    def generate_sparse_target_bev_points(data: dict, transform=None, sam_res=0.4,
                                          map_res=0.2, range=50, max_num_pts=3000,
                                          discrete=False):
        data['bev_tgt_pts'] = generate_bev_tgt_pts(
            data['points'], data, transform, sam_res, map_res, range, max_num_pts, discrete
        )
        # from cosense3d.utils.vislib import draw_points_boxes_plt, plt
        # lidar = data['points'].cpu().numpy()
        # pts = data['bev_tgt_pts'].cpu().numpy()
        # pos = pts[:, 2] == 1
        # neg = pts[:, 2] == 0
        #
        # ax = draw_points_boxes_plt(
        #     pc_range=50,
        #     points=pts[pos, :],
        #     points_c='r',
        #     return_ax=True
        # )
        # ax.plot(pts[neg, 0], pts[neg, 1], '.', c='b', markersize=1)
        # ax.plot(lidar[:, 0], lidar[:, 1], '.', c='gray', markersize=1)
        # plt.savefig("/home/yuan/Downloads/tmp.png")
        # plt.close()

    @staticmethod
    @torch.no_grad()
    def generate_sparse_target_roadline_points(data: dict, transform=None, map_res=0.2,
                                               range=50, kernel=3, max_num_pts=3000):
        if 'bevmap' not in data or data['bevmap'] is None:
            return
        bevmap = data['bevmap'].clone().float()
        bevmap[bevmap == 0] = -1
        bevmap_coor = data['bevmap_coor']
        sx, sy = bevmap.shape[:2]

        filters = torch.ones(1, 1, kernel, kernel, device=bevmap.device) / (kernel ** 2 * 2)
        road = torch.conv2d(bevmap[None, None], filters).squeeze()
        mask = (road < 0.5) & (road > -0.5)
        inds = torch.where(mask)
        scores = 1 - road[mask].abs()
        coords = torch.stack(inds).T * map_res + 2.5 * map_res - range
        data['roadline_tgts'] = torch.cat([coords, scores.unsqueeze(1)], dim=1)
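
    # Usage sketch (assumed bevmap semantics): occupancy 1 on the road and 0
    # elsewhere; after remapping zeros to -1, the box filter yields values near
    # 0 exactly at road boundaries, which the mask above selects as roadline
    # targets with confidence scores.
    #
    #     data = {'bevmap': (torch.rand(500, 500) > 0.5), 'bevmap_coor': [-50., -50.]}
    #     DataOnlineProcessor.generate_sparse_target_roadline_points(data)
    #     # data['roadline_tgts'] has columns [x, y, score]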