Merge branch 'main' of https://github.com/pypose/pypose

HongLouyemeng · Sep 24, 2023 · a1a419e · a1a419e
2 parents af6d5e8 + c1aa35c
commit a1a419e
Show file tree

Hide file tree

Showing 10 changed files with 357 additions and 6 deletions.
diff --git a/.gitignore b/.gitignore
@@ -151,6 +151,7 @@ examples/module/pcr/data/*
 examples/module/pcr/save/*
 examples/module/spline/save/*
 examples/module/mpc/save/*
+examples/module/reprojpgo/save/*
 *epnp-test-data.pt*
 *icp-test-data.pt*
 *__MACOSX
diff --git a/docs/source/convert.rst b/docs/source/convert.rst
@@ -23,3 +23,4 @@ Convert
     cart2homo
     homo2cart
     point2pixel
+    pixel2point
diff --git a/examples/module/reprojpgo/dataset.py b/examples/module/reprojpgo/dataset.py
@@ -0,0 +1,133 @@
+import cv2
+import torch
+import numpy as np
+import pypose as pp
+import matplotlib as mpl
+from pathlib import Path
+import matplotlib.pyplot as plt
+from torch.utils.data import Dataset
+from matplotlib.cm import ScalarMappable
+from mpl_toolkits.axes_grid1 import make_axes_locatable
+from torchvision.datasets.utils import download_and_extract_archive
+
+
+class MiniTartanAir(Dataset):
+    link = 'https://github.com/pypose/pypose/releases/download/v0.5.0/MiniTartanAir.pt.zip'
+    def __init__(self, dataroot: Path, download = True):
+        super().__init__()
+        if download:
+            download_and_extract_archive(self.link, str(dataroot))
+        self.NED2CV = pp.from_matrix(torch.tensor(
+            [[0., 1., 0., 0.],
+             [0., 0., 1., 0.],
+             [1., 0., 0., 0.],
+             [0., 0., 0., 1.]], dtype=torch.float32),
+            pp.SE3_type)
+        self.CV2NED = self.NED2CV.Inv()
+
+        data_source = torch.load(Path(dataroot, "MiniTartanAir.pt"))
+        self.images = data_source["images"]
+        self.flows: torch.Tensor = data_source["flows"]
+        self.depths = data_source["depths"]
+        self.gt_motions = data_source["gt_traj"]
+        self.length = self.flows.size(0)
+
+    def __len__(self):
+        return self.length
+
+    def __getitem__(self, index):
+        image1 = self.images[index] / 255.            # image size [3, 480, 640]
+        image2 = self.images[index + 1] / 255.        # image size [3, 480, 640]
+        flow = self.flows[index].to(torch.float32)    # flow size  [2, 480, 640]
+        depth = self.depths[index].to(torch.float32)  # depth size [1, 480, 640]
+        gt_motion = self.NED2CV @ self.gt_motions[index] @ self.CV2NED
+
+        pts1 = self.select_points(image1)
+        pts2 = self.match_points(pts1, flow)
+        pts1_z = depth[0, pts1[..., 1], pts1[..., 0]]
+
+        H, W = image1.size(-2), image1.size(-1) # mask out points outside images
+        mask = torch.logical_and(pts2[..., 1] < H, pts2[..., 0] < W)
+        pts1, pts2, pts1_z = pts1[mask], pts2[mask], pts1_z[mask]
+
+        return image1, image2, pts1_z, pts1, pts2, gt_motion
+
+    @staticmethod
+    def select_points(image: torch.Tensor, num_point: int = 100):
+        image_grad = torch.nn.functional.conv2d(
+            image.unsqueeze(dim=0),
+            torch.tensor(
+                [[0, 1, 0], [1, -4, 1], [0, 1, 0]]
+            ).float().expand((1, 3, 3, 3)),
+            padding=1
+        )[0].abs()
+        image_grad_avg = image_grad.mean(dim=(1, 2), keepdim=True)
+        image_grad_std = image_grad.std(dim=(1, 2), keepdim=True)
+        # Positions with sufficient gradient (feature) > +3std
+        points = image_grad > image_grad_avg + 3. * image_grad_std
+        border_mask = torch.zeros_like(points)
+        border_mask[..., 5:-5, 5:-5] = 1.
+
+        points = points * border_mask
+        selected_points = torch.nonzero(points, as_tuple=False)
+
+        # Randomly select points
+        perm = torch.randperm(selected_points.shape[0])[:num_point]
+        # vu -> uv coordinate
+        pts_uv = selected_points[perm][..., 1:].roll(shifts=1, dims=[1])
+        return pts_uv
+
+    @staticmethod
+    def match_points(pts1: torch.Tensor, flow: torch.Tensor):
+        return pts1 + flow[..., pts1[..., 1], pts1[..., 0]].T
+
+
+def visualize_image(img: torch.Tensor):
+    display_img = img.permute((1, 2, 0)).cpu().numpy() * 255
+    display_img = display_img.astype(np.uint8)
+    display_img = cv2.cvtColor(display_img, cv2.COLOR_BGR2GRAY)
+    display_img = np.stack([display_img] * 3, axis=2)
+    return display_img
+
+
+def visualize(img1, img2, pts1, pts2, target, loss, step):
+    plt.ion()
+
+    img1 = visualize_image(img1)    # Convert to black&white OpenCV displayable
+    img2 = visualize_image(img2)    # format
+
+    color_map = mpl.colormaps['coolwarm']
+    color_normalizer = mpl.colors.Normalize(vmin=0, vmax=1)
+    display_img = np.concatenate([img1, img2], axis=1)
+
+    pts3d = pp.function.geometry.pixel2point(target.pts1, target.depth, target.K)
+    reproj_uv = pp.function.point2pixel(pts3d, target.K, target.T.Inv())
+    reproj_uv = reproj_uv.detach().cpu()
+
+    reproj_err = torch.norm(pts2 - reproj_uv, dim=1).detach().cpu().numpy()
+
+    plt.clf()
+    plt.axis('off')
+    plt.imshow(display_img, interpolation='nearest')
+    for idx in range(target.pts1.size(0)):
+        err = reproj_err[idx].item()
+        u1, v1 = pts1[idx, 0].item(), pts1[idx, 1].item()
+        reproj_u, reproj_v = reproj_uv[idx, 0].item(), reproj_uv[idx, 1].item()
+        plt.plot(
+            [u1, reproj_u + img1.shape[1]],
+            [v1, reproj_v]
+            , color=color_map(err)
+        )
+    plt.title(f"Step: {step}, ReprojErr: {round(reproj_err.mean().item(), 3)},"
+              f"Residual: {round(loss.item(), 3)}")
+    divider = make_axes_locatable(plt.gca())
+    cax = divider.append_axes("right", size="5%", pad=0.05)
+    plt.colorbar(ScalarMappable(norm=color_normalizer, cmap=color_map), cax=cax)
+    plt.pause(0.1)
+
+
+def report_pose_error(curr_pose: pp.SE3, gt_pose: pp.SE3):
+    _err = (curr_pose.Inv() * gt_pose)
+    _err_rot = _err.rotation().Log().norm(dim=-1).item() * (180 / np.pi)
+    _err_trans = _err.translation().norm(dim=-1).item()
+    print(f"Err Rot (deg): {round(_err_rot, 4)} | Err Trans (m): {round(_err_trans, 4)}")
diff --git a/examples/module/reprojpgo/readme.md b/examples/module/reprojpgo/readme.md
@@ -0,0 +1,36 @@
+# Reprojection Error Pose Graph Optimization
+
+![Reprojerr_Visualization](https://user-images.githubusercontent.com/47029019/257399825-2f47931c-adc8-494e-99c6-d0c2c5d7c306.gif)
+
+An example of pose graph optimization between adjacent frames, using a cropped trajectory from [the TartanAir dataset](https://theairlab.org/tartanair-dataset/) (Easy, abandoned factory, sequence P001).
+
+## Installation
+
+  * matplotlib
+  * opencv-python
+
+
+## Run
+
+```bash
+python examples/module/reprojpgo/reprojpgo.py
+```
+
+Or
+
+```bash
+python examples/module/reprojpgo/reprojpgo.py --device cuda --vectorize
+```
+
+* Other supported arguments:
+  ```
+    Pose Graph Optimization
+
+    optional arguments:
+      -h, --help           show this help message and exit
+      --dataroot DATAROOT  dataset location (default: ./examples/module/reprojpgo/save/)
+      --device DEVICE      cuda or cpu (default: cuda)
+      --vectorize          to accelerate computation (will use more RAM)
+      --dnoise DEPTH_NOISE noise level on point depth (default: 0.1)
+      --pnoise POSE_NOISE  noise level on initial pose (default: 0.1)
+  ```
diff --git a/examples/module/reprojpgo/reprojpgo.py b/examples/module/reprojpgo/reprojpgo.py
@@ -0,0 +1,87 @@
+import torch
+import argparse
+import pypose as pp
+from torch import nn
+from pathlib import Path
+from pypose.optim import LM
+from pypose.optim.kernel import Huber
+from pypose.optim.solver import Cholesky
+from pypose.optim.strategy import TrustRegion
+from pypose.optim.corrector import FastTriggs
+from pypose.optim.scheduler import StopOnPlateau
+from pypose.function.geometry import pixel2point, reprojerr
+from dataset import MiniTartanAir, visualize, report_pose_error
+
+
+class LocalBundleAdjustment(nn.Module):
+    def __init__(self, K, pts1, pts2, depth, init_T) -> None:
+        super().__init__()
+        self.register_buffer("K", K)
+        self.register_buffer("pts1", pts1)  # N x 2, uv coordinate
+        self.register_buffer("pts2", pts2)  # N x 2, uv coordinate
+
+        self.T = pp.Parameter(init_T)
+        self.depth = nn.Parameter(depth)
+
+    def forward(self) -> torch.Tensor:
+        pts3d = pixel2point(self.pts1, self.depth, self.K)
+        return reprojerr(pts3d, self.pts2, self.K, self.T.Inv(), reduction='none')
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(
+        description="Estimate camera motion by optimizing reprojerr graph "
+                    "between adjacent frames")
+    parser.add_argument("--dataroot", action="store",
+                        default="./examples/module/reprojpgo/save/",
+                        help="Root directory for the dataset")
+    parser.add_argument("--device", action="store", default="cuda",
+                        help="Device to run optimization (cuda / cpu)")
+    parser.add_argument("--vectorize", action="store_true", default=True,
+                        help="Vectorize when optimizing reprojerr graph.")
+    parser.add_argument("--dnoise", default=0.1, type=float,
+                        help="Noise level of the depth")
+    parser.add_argument("--pnoise", default=0.1, type=float,
+                        help="Noise level of the pose")
+    args = parser.parse_args()
+    dataroot = Path(args.dataroot)
+    device, vectorize = args.device, args.vectorize
+    K = torch.tensor([[320., 0., 320.], [0., 320., 240.], [0., 0., 1.]])
+
+    dataset = MiniTartanAir(dataroot=dataroot)
+
+    for img1, img2, depth, pts1, pts2, gt_motion in dataset:
+        # Noisy initial pose and depth noise ~ N(avg=0, std=args.pnoise)
+        init_T = (gt_motion * pp.randn_SE3(sigma=args.pnoise)).to(device)
+        depth = depth + torch.randn_like(depth) * args.dnoise
+
+        print('Initial Motion Error:')
+        report_pose_error(init_T, gt_motion.to(device))
+
+        graph = LocalBundleAdjustment(K, pts1, pts2, depth, init_T).to(device)
+        kernel = Huber(delta=0.1)
+        corrector = FastTriggs(kernel)
+        optimizer = LM(graph, solver=Cholesky(),
+                              strategy=TrustRegion(radius=1e3),
+                              kernel=kernel,
+                              corrector=corrector,
+                              min=1e-8,
+                              reject=128,
+                              vectorize=vectorize)
+        scheduler = StopOnPlateau(optimizer, steps=25,
+                                             patience=4,
+                                             decreasing=1e-6,
+                                             verbose=True)
+
+        # Optimize Reproject Pose Graph Optimization ###########################
+        while scheduler.continual():
+            loss = optimizer.step(input=())
+            visualize(img1, img2, pts1, pts2, graph, loss, scheduler.steps)
+            scheduler.step(loss)
+        ########################################################################
+
+        optimized_T = pp.SE3(graph.T.data.detach())
+
+        print('Optimized Motion Error')
+        report_pose_error(optimized_T, gt_motion.to(device))
+        print("\n\n")
diff --git a/pypose/_version.py b/pypose/_version.py
@@ -1 +1 @@
-__version__ = "0.6.1"
+__version__ = "0.6.2"
diff --git a/pypose/function/geometry.py b/pypose/function/geometry.py
@@ -111,6 +111,62 @@ def point2pixel(points, intrinsics, extrinsics=None):
     return homo2cart(points @ intrinsics.mT)
 
 
+def pixel2point(pixels, depth, intrinsics):
+    r'''
+    Convert batch of pixels with depth into points (in camera coordinate)
+
+    Args:
+        pixels: (``torch.Tensor``) The 2d coordinates of pixels in the camera
+            pixel coordinate.
+            Shape has to be (..., N, 2)
+
+        depth: (``torch.Tensor``) The depths of pixels with respect to the
+            sensor plane.
+            Shape has to be (..., N)
+
+        intrinsics: (``torch.Tensor``): The intrinsic parameters of cameras.
+            The shape has to be (..., 3, 3).
+
+    Returns:
+        ``torch.Tensor`` The associated 3D-points with shape (..., N, 3)
+
+    Example:
+        >>> import torch, pypose as pp
+        >>> f, (H, W) = 2, (9, 9) # focal length and image height, width
+        >>> intrinsics = torch.tensor([[f, 0, H / 2],
+        ...                            [0, f, W / 2],
+        ...                            [0, 0,   1  ]])
+        >>> pixels = torch.tensor([[0.5, 0.0],
+        ...                        [1.0, 0.0],
+        ...                        [0.0, 1.3],
+        ...                        [1.0, 0.0],
+        ...                        [0.5, 1.5],
+        ...                        [5.0, 1.5]])
+        >>> depths = torch.tensor([5.0, 3.0, 6.5, 2.0, 0.5, 0.7])
+        >>> points = pp.pixel2point(pixels, depths, intrinsics)
+        tensor([[-10.0000, -11.2500,   5.0000],
+                [ -5.2500,  -6.7500,   3.0000],
+                [-14.6250, -10.4000,   6.5000],
+                [ -3.5000,  -4.5000,   2.0000],
+                [ -1.0000,  -0.7500,   0.5000],
+                [  0.1750,  -1.0500,   0.7000]])
+    '''
+    assert pixels.size(-1) == 2, "Pixels shape incorrect"
+    assert depth.size(-1) == pixels.size(-2), "Depth shape does not match pixels"
+    assert intrinsics.size(-1) == intrinsics.size(-2) == 3, "Intrinsics shape incorrect."
+
+    fx, fy = intrinsics[..., 0, 0], intrinsics[..., 1, 1]
+    cx, cy = intrinsics[..., 0, 2], intrinsics[..., 1, 2]
+
+    assert not torch.any(fx == 0), "fx Cannot contain zero"
+    assert not torch.any(fy == 0), "fy Cannot contain zero"
+
+    pts3d_z = depth
+    pts3d_x = ((pixels[..., 0] - cx) * pts3d_z) / fx
+    pts3d_y = ((pixels[..., 1] - cy) * pts3d_z) / fy
+    return torch.stack([pts3d_x, pts3d_y, pts3d_z], dim=-1)
+
+
 def reprojerr(points, pixels, intrinsics, extrinsics=None, reduction='none'):
     r'''
     Calculates batched per-pixel reprojection error (pixel distance) for points either in

diff --git a/pypose/optim/optimizer.py b/pypose/optim/optimizer.py
@@ -46,7 +46,10 @@ def normalize_RWJ(self, R, weight, J):
             weight_diag = []
             for w, r in zip(weight, R):
                 ni = r.numel() * w.shape[-1] / w.numel()
-                weight_diag += [w] * int(ni)
+                w = w.view(*w.shape, 1, 1) if r.shape[-1] == 1 else w
+                ws = w.view(-1, w.shape[-2], w.shape[-1]).split(1, 0)
+                ws = [wsi.squeeze(0) for wsi in ws]
+                weight_diag += ws * int(ni)
             weight_diag = torch.block_diag(*weight_diag)
         R = [r.reshape(-1) for r in R]
         J = torch.cat(J) if isinstance(J, (tuple, list)) else J