2022-06-03 12:21:18 +08:00
|
|
|
from typing import Tuple
|
|
|
|
|
|
|
|
|
|
import torch
|
|
|
|
|
from mmcv.runner import force_fp32
|
|
|
|
|
from torch import nn
|
|
|
|
|
|
|
|
|
|
from mmdet3d.ops import bev_pool
|
|
|
|
|
|
|
|
|
|
# Public API of this module.
__all__ = ["BaseTransform", "BaseDepthTransform"]
|
|
|
|
|
|
2023-07-08 10:53:36 +08:00
|
|
|
def boolmask2idx(mask):
    """Return the positions of True entries in ``mask`` as a plain Python list.

    Utility workaround: ONNX export does not support the 'nonzero' op, so
    callers use this helper to materialize the indices eagerly.
    """
    hits = torch.nonzero(mask)
    return hits.squeeze(1).tolist()
|
2022-06-03 12:21:18 +08:00
|
|
|
|
|
|
|
|
def gen_dx_bx(xbound, ybound, zbound):
    """Derive voxel-grid parameters from per-axis ``(lower, upper, step)`` bounds.

    Returns a tuple ``(dx, bx, nx)`` where
    - ``dx`` is the float step size per axis,
    - ``bx`` is the center of the first voxel per axis (``lower + step / 2``),
    - ``nx`` is the voxel count per axis as a LongTensor (float division
      truncated toward zero by the long cast).
    """
    bounds = (xbound, ybound, zbound)
    dx = torch.Tensor([step for _, _, step in bounds])
    bx = torch.Tensor([lower + step / 2.0 for lower, _, step in bounds])
    nx = torch.LongTensor([(upper - lower) / step for lower, upper, step in bounds])
    return dx, bx, nx
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class BaseTransform(nn.Module):
    """Base camera-to-BEV view transform (Lift-Splat-Shoot style).

    Builds a frustum of 3-D points from discrete depth hypotheses over the
    image feature map, transforms those points into the lidar frame via
    :meth:`get_geometry`, and splats per-point camera features onto a BEV
    grid with :meth:`bev_pool`. Subclasses must implement
    :meth:`get_cam_feats` to produce the per-pixel, per-depth feature volume.
    """

    def __init__(
        self,
        in_channels: int,
        out_channels: int,
        image_size: Tuple[int, int],
        feature_size: Tuple[int, int],
        xbound: Tuple[float, float, float],
        ybound: Tuple[float, float, float],
        zbound: Tuple[float, float, float],
        dbound: Tuple[float, float, float],
        use_points='lidar',
        depth_input='scalar',
        height_expand=True,
        add_depth_features=False,
    ) -> None:
        """Configure the view transform.

        Args:
            in_channels: number of channels of the incoming image features.
            out_channels: number of channels of the lifted BEV features.
            image_size: input image size as ``(H, W)``.
            feature_size: image feature-map size as ``(fH, fW)``.
            xbound / ybound / zbound: BEV grid bounds per axis as
                ``(lower, upper, step)``; see :func:`gen_dx_bx`.
            dbound: depth discretization ``(lower, upper, step)`` used to
                build the frustum via ``torch.arange``.
            use_points: which point cloud subclasses rasterize depth from,
                'lidar' or 'radar'.
            depth_input: 'scalar' (one metric-depth channel) or 'one-hot'
                (D depth-bin channels) for the depth map layout.
            height_expand: if True, subclasses expand (height-less) points
                into several vertical copies before projection.
            add_depth_features: if True, subclasses append the raw point
                features as extra depth-map channels.
        """
        super().__init__()
        self.in_channels = in_channels
        self.image_size = image_size
        self.feature_size = feature_size
        self.xbound = xbound
        self.ybound = ybound
        self.zbound = zbound
        self.dbound = dbound
        self.use_points = use_points
        assert use_points in ['radar', 'lidar']
        self.depth_input = depth_input
        assert depth_input in ['scalar', 'one-hot']
        self.height_expand = height_expand
        self.add_depth_features = add_depth_features

        # Voxel-grid geometry registered as frozen parameters so they move
        # with the module across devices but are never trained.
        dx, bx, nx = gen_dx_bx(self.xbound, self.ybound, self.zbound)
        self.dx = nn.Parameter(dx, requires_grad=False)
        self.bx = nn.Parameter(bx, requires_grad=False)
        self.nx = nn.Parameter(nx, requires_grad=False)

        self.C = out_channels
        self.frustum = self.create_frustum()
        # Number of discrete depth hypotheses (first frustum dimension).
        self.D = self.frustum.shape[0]
        self.fp16_enabled = False

    @force_fp32()
    def create_frustum(self):
        """Build the (D, fH, fW, 3) frustum of (x_px, y_px, depth) samples.

        Pixel coordinates are laid out at feature-map resolution but expressed
        in input-image pixel units; depth spans ``dbound`` in fixed steps.
        Returned as a frozen ``nn.Parameter``.
        """
        iH, iW = self.image_size
        fH, fW = self.feature_size

        # Depth hypotheses, broadcast over the feature map: (D, fH, fW).
        ds = (
            torch.arange(*self.dbound, dtype=torch.float)
            .view(-1, 1, 1)
            .expand(-1, fH, fW)
        )
        D, _, _ = ds.shape

        # Per-feature-cell pixel coordinates in the input image, broadcast
        # over depth: (D, fH, fW) each.
        xs = (
            torch.linspace(0, iW - 1, fW, dtype=torch.float)
            .view(1, 1, fW)
            .expand(D, fH, fW)
        )
        ys = (
            torch.linspace(0, iH - 1, fH, dtype=torch.float)
            .view(1, fH, 1)
            .expand(D, fH, fW)
        )

        frustum = torch.stack((xs, ys, ds), -1)
        return nn.Parameter(frustum, requires_grad=False)

    @force_fp32()
    def get_geometry(
        self,
        camera2lidar_rots,
        camera2lidar_trans,
        intrins,
        post_rots,
        post_trans,
        **kwargs,
    ):
        """Map the frustum into lidar coordinates for every camera.

        Args:
            camera2lidar_rots / camera2lidar_trans: per-camera rotation
                ``(B, N, 3, 3)`` and translation ``(B, N, 3)`` into lidar.
            intrins: camera intrinsics ``(B, N, 3, 3)``.
            post_rots / post_trans: image augmentation rotation/translation
                applied after projection; undone here first.
            kwargs: optional ``extra_rots`` / ``extra_trans`` for lidar-space
                (BEV) augmentation applied at the end.

        Returns:
            Frustum point locations in lidar space, ``(B, N, D, H, W, 3)``.
        """
        B, N, _ = camera2lidar_trans.shape

        # undo post-transformation (image augmentation)
        # B x N x D x H x W x 3
        points = self.frustum - post_trans.view(B, N, 1, 1, 1, 3)
        points = (
            torch.inverse(post_rots)
            .view(B, N, 1, 1, 1, 3, 3)
            .matmul(points.unsqueeze(-1))
        )
        # cam_to_lidar: first convert (u, v, d) to homogeneous camera-plane
        # coordinates (u*d, v*d, d) so a single 3x3 matrix can unproject.
        points = torch.cat(
            (
                points[:, :, :, :, :, :2] * points[:, :, :, :, :, 2:3],
                points[:, :, :, :, :, 2:3],
            ),
            5,
        )
        # Compose intrinsics inverse (pixels -> camera rays) with the
        # camera->lidar rotation in one matrix.
        combine = camera2lidar_rots.matmul(torch.inverse(intrins))
        points = combine.view(B, N, 1, 1, 1, 3, 3).matmul(points).squeeze(-1)
        points += camera2lidar_trans.view(B, N, 1, 1, 1, 3)

        # Optional lidar-space (BEV) augmentation.
        if "extra_rots" in kwargs:
            extra_rots = kwargs["extra_rots"]
            points = (
                extra_rots.view(B, 1, 1, 1, 1, 3, 3)
                .repeat(1, N, 1, 1, 1, 1, 1)
                .matmul(points.unsqueeze(-1))
                .squeeze(-1)
            )
        if "extra_trans" in kwargs:
            extra_trans = kwargs["extra_trans"]
            points += extra_trans.view(B, 1, 1, 1, 1, 3).repeat(1, N, 1, 1, 1, 1)

        return points

    def get_cam_feats(self, x):
        """Produce per-pixel, per-depth camera features; subclass hook."""
        raise NotImplementedError

    @force_fp32()
    def bev_pool(self, geom_feats, x):
        """Splat frustum features onto the BEV grid.

        Args:
            geom_feats: lidar-space frustum locations ``(B, N, D, H, W, 3)``.
            x: frustum features ``(B, N, D, H, W, C)``.

        Returns:
            BEV feature map with the Z dimension folded into channels.
        """
        B, N, D, H, W, C = x.shape
        Nprime = B * N * D * H * W

        # flatten x
        x = x.reshape(Nprime, C)

        # flatten indices: convert metric coordinates to integer voxel indices.
        geom_feats = ((geom_feats - (self.bx - self.dx / 2.0)) / self.dx).long()
        geom_feats = geom_feats.view(Nprime, 3)
        # Append the batch index as a fourth coordinate for bev_pool.
        batch_ix = torch.cat(
            [
                torch.full([Nprime // B, 1], ix, device=x.device, dtype=torch.long)
                for ix in range(B)
            ]
        )
        geom_feats = torch.cat((geom_feats, batch_ix), 1)

        # filter out points that are outside box
        kept = (
            (geom_feats[:, 0] >= 0)
            & (geom_feats[:, 0] < self.nx[0])
            & (geom_feats[:, 1] >= 0)
            & (geom_feats[:, 1] < self.nx[1])
            & (geom_feats[:, 2] >= 0)
            & (geom_feats[:, 2] < self.nx[2])
        )
        x = x[kept]
        geom_feats = geom_feats[kept]

        # Scatter-sum features into the (B, C, Z, X, Y) voxel grid.
        x = bev_pool(x, geom_feats, B, self.nx[2], self.nx[0], self.nx[1])

        # collapse Z: stack the Z slices along the channel dimension.
        final = torch.cat(x.unbind(dim=2), 1)

        return final

    @force_fp32()
    def forward(
        self,
        img,
        points,
        radar,
        camera2ego,
        lidar2ego,
        lidar2camera,
        lidar2image,
        camera_intrinsics,
        camera2lidar,
        img_aug_matrix,
        lidar_aug_matrix,
        **kwargs,
    ):
        """Lift multi-camera image features to a BEV feature map.

        Returns the BEV features, or ``(bev, depth)`` when the subclass'
        ``get_cam_feats`` also returns a predicted depth distribution.
        """
        # Slice rotation/translation parts out of the 4x4 transforms.
        # NOTE(review): rots/trans/lidar2ego_* are computed but unused here —
        # presumably kept for interface parity with subclasses; confirm.
        rots = camera2ego[..., :3, :3]
        trans = camera2ego[..., :3, 3]
        intrins = camera_intrinsics[..., :3, :3]
        post_rots = img_aug_matrix[..., :3, :3]
        post_trans = img_aug_matrix[..., :3, 3]
        lidar2ego_rots = lidar2ego[..., :3, :3]
        lidar2ego_trans = lidar2ego[..., :3, 3]
        camera2lidar_rots = camera2lidar[..., :3, :3]
        camera2lidar_trans = camera2lidar[..., :3, 3]

        extra_rots = lidar_aug_matrix[..., :3, :3]
        extra_trans = lidar_aug_matrix[..., :3, 3]

        geom = self.get_geometry(
            camera2lidar_rots,
            camera2lidar_trans,
            intrins,
            post_rots,
            post_trans,
            extra_rots=extra_rots,
            extra_trans=extra_trans,
        )

        mats_dict = {
            'intrin_mats': camera_intrinsics,
            'ida_mats': img_aug_matrix,
            'bda_mat': lidar_aug_matrix,
            'sensor2ego_mats': camera2ego,
        }
        x = self.get_cam_feats(img, mats_dict)

        # Some subclasses return (features, depth_distribution).
        use_depth = False
        if type(x) == tuple:
            x, depth = x
            use_depth = True

        x = self.bev_pool(geom, x)

        if use_depth:
            return x, depth
        else:
            return x
|
|
|
|
|
|
2022-06-03 12:21:18 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
class BaseDepthTransform(BaseTransform):
    """View transform that additionally rasterizes a sparse depth map.

    Projects lidar or radar points into every camera image to build a
    per-camera depth map (scalar or one-hot over depth bins, optionally with
    raw point features appended as extra channels), then feeds it to the
    subclass' ``get_cam_feats`` alongside the images.
    """

    @force_fp32()
    def forward(
        self,
        img,
        points,
        radar,
        sensor2ego,
        lidar2ego,
        lidar2camera,
        lidar2image,
        cam_intrinsic,
        camera2lidar,
        img_aug_matrix,
        lidar_aug_matrix,
        **kwargs,
    ):
        """Lift image features to BEV, conditioning on projected point depth.

        Returns the BEV features, or ``(bev, depth)`` when the subclass'
        ``get_cam_feats`` also returns a predicted depth distribution.
        """
        # Slice rotation/translation parts out of the 4x4 transforms.
        # NOTE(review): rots/trans/lidar2ego_* are computed but unused here —
        # presumably kept for interface parity; confirm.
        rots = sensor2ego[..., :3, :3]
        trans = sensor2ego[..., :3, 3]
        intrins = cam_intrinsic[..., :3, :3]
        post_rots = img_aug_matrix[..., :3, :3]
        post_trans = img_aug_matrix[..., :3, 3]
        lidar2ego_rots = lidar2ego[..., :3, :3]
        lidar2ego_trans = lidar2ego[..., :3, 3]
        camera2lidar_rots = camera2lidar[..., :3, :3]
        camera2lidar_trans = camera2lidar[..., :3, 3]

        # Choose which point cloud supplies depth.
        if self.use_points == 'radar':
            points = radar

        # Expand each (height-less) point into 8 vertical copies at
        # z = 0.25, 0.5, ..., 2.0 m. NOTE(review): this mutates the incoming
        # ``points`` list in place — callers reusing it see the expansion.
        if self.height_expand:
            for b in range(len(points)):
                points_repeated = points[b].repeat_interleave(8, dim=0)
                points_repeated[:, 2] = torch.arange(0.25, 2.25, 0.25).repeat(points[b].shape[0])
                points[b] = points_repeated

        batch_size = len(points)
        # Depth-map channel layout: 1 scalar channel or D one-hot bins,
        # plus (optionally) all raw point features.
        depth_in_channels = 1 if self.depth_input == 'scalar' else self.D
        if self.add_depth_features:
            depth_in_channels += points[0].shape[1]

        # (B, num_cams, depth_in_channels, iH, iW) — img.shape[1] is
        # presumably the camera count; verify against caller.
        depth = torch.zeros(batch_size, img.shape[1], depth_in_channels, *self.image_size, device=points[0].device)

        for b in range(batch_size):
            cur_coords = points[b][:, :3]
            cur_img_aug_matrix = img_aug_matrix[b]
            cur_lidar_aug_matrix = lidar_aug_matrix[b]
            cur_lidar2image = lidar2image[b]

            # inverse aug: undo the lidar-space (BEV) augmentation so points
            # line up with the un-augmented lidar2image transform.
            cur_coords -= cur_lidar_aug_matrix[:3, 3]
            cur_coords = torch.inverse(cur_lidar_aug_matrix[:3, :3]).matmul(
                cur_coords.transpose(1, 0)
            )
            # lidar2image
            cur_coords = cur_lidar2image[:, :3, :3].matmul(cur_coords)
            cur_coords += cur_lidar2image[:, :3, 3].reshape(-1, 3, 1)
            # get 2d coords: keep metric depth, then perspective-divide.
            dist = cur_coords[:, 2, :]
            cur_coords[:, 2, :] = torch.clamp(cur_coords[:, 2, :], 1e-5, 1e5)
            cur_coords[:, :2, :] /= cur_coords[:, 2:3, :]

            # imgaug: apply the image augmentation to the pixel coordinates.
            cur_coords = cur_img_aug_matrix[:, :3, :3].matmul(cur_coords)
            cur_coords += cur_img_aug_matrix[:, :3, 3].reshape(-1, 3, 1)
            cur_coords = cur_coords[:, :2, :].transpose(1, 2)

            # normalize coords for grid sample: swap to (row, col) order.
            cur_coords = cur_coords[..., [1, 0]]

            # Mask of points that land inside the image bounds.
            on_img = (
                (cur_coords[..., 0] < self.image_size[0])
                & (cur_coords[..., 0] >= 0)
                & (cur_coords[..., 1] < self.image_size[1])
                & (cur_coords[..., 1] >= 0)
            )
            for c in range(on_img.shape[0]):
                masked_coords = cur_coords[c, on_img[c]].long()
                masked_dist = dist[c, on_img[c]]

                if self.depth_input == 'scalar':
                    # Write metric depth into the single depth channel.
                    depth[b, c, 0, masked_coords[:, 0], masked_coords[:, 1]] = masked_dist
                elif self.depth_input == 'one-hot':
                    # Clamp depths that are too big to D
                    # These can arise when the point range filter is different from the dbound.
                    # NOTE(review): metric depth is used directly as a bin
                    # index here (no dbound rescaling) — confirm the depth
                    # step is 1.0 m, otherwise bins are mislabeled.
                    masked_dist = torch.clamp(masked_dist, max=self.D-1)
                    depth[b, c, masked_dist.long(), masked_coords[:, 0], masked_coords[:, 1]] = 1.0

                if self.add_depth_features:
                    # Append the full raw point feature vector for the
                    # on-image points into the trailing channels.
                    depth[b, c, -points[b].shape[-1]:, masked_coords[:, 0], masked_coords[:, 1]] = points[b][boolmask2idx(on_img[c])].transpose(0,1)

        extra_rots = lidar_aug_matrix[..., :3, :3]
        extra_trans = lidar_aug_matrix[..., :3, 3]
        geom = self.get_geometry(
            camera2lidar_rots,
            camera2lidar_trans,
            intrins,
            post_rots,
            post_trans,
            extra_rots=extra_rots,
            extra_trans=extra_trans,
        )

        mats_dict = {
            'intrin_mats': intrins,
            'ida_mats': img_aug_matrix,
            'bda_mat': lidar_aug_matrix,
            'sensor2ego_mats': sensor2ego,
        }
        x = self.get_cam_feats(img, depth, mats_dict)

        # Some subclasses return (features, depth_distribution).
        use_depth = False
        if type(x) == tuple:
            x, depth = x
            use_depth = True

        x = self.bev_pool(geom, x)

        if use_depth:
            return x, depth
        else:
            return x
|
|
|
|
|
|