Commit b91ae53d authored by Patrick Snape, committed by Facebook GitHub Bot

Change Fisheye62 projection to match perception models

Summary:
I wrote the attached unit test to triple-check that we were matching the perception cameras - but we were not. So I ported the code exactly, and now we match the perception cameras' behavior exactly.

Looking at the code, this seems to be a legitimate bug - and my mental model says it may make a significant difference when the radial distortion parameters are high (which they are in BTL). However, Rosetta continues to be an enigma to me, and in practice it seems to hardly make a difference...
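
As far as I can tell, the radial polynomial is only rewritten in an algebraically equivalent form; the behavioral differences are the FOV coefficient indices and the tangential term, which previously used the squared radius of the undistorted point rather than of the radially distorted one. A minimal standalone sketch of the tangential difference (not part of this diff; the coefficients and the point are made up, and the fov clamp is ignored for brevity):

```python
import torch as th

# Made-up Fisheye62 coefficients D = [k0, ..., k5, p0, p1] with strong radial terms,
# and a single made-up point on the unit (tangent) plane.
k = th.tensor([0.4, 0.1, 0.05, 0.01, 0.0, 0.0])
p0, p1 = 0.01, 0.02
x, y = 0.8, 0.6
r = (x * x + y * y) ** 0.5                      # undistorted radius
theta = th.atan(th.tensor(r))
theta_d = theta * (1 + sum(k[i] * theta ** (2 * (i + 1)) for i in range(6)))
x_r, y_r = x * theta_d / r, y * theta_d / r     # radially distorted point

# Old behavior: tangential term built from the *undistorted* radius r.
x_tan_old = p0 * (r ** 2 + 2 * x_r ** 2) + 2 * p1 * x_r * y_r
# Perception behavior: built from the radius of the *distorted* point.
r2_dist = x_r ** 2 + y_r ** 2
x_tan_new = p0 * (r2_dist + 2 * x_r ** 2) + 2 * p1 * x_r * y_r

print(float(x_tan_old), float(x_tan_new))       # the two terms diverge as the k's grow
```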

Differential Revision: D60927097

fbshipit-source-id: 15e04b50634d8c236bfaf89fcf6f43aeff1ede7d
parent b0810efa
@@ -162,7 +162,8 @@ def project_fisheye_distort_62(
fov: Optional[th.Tensor] = None,
) -> th.Tensor:
"""Project camera-space points to distort pixel-space points using the
OculusVisionFishEye62 distortion model.
Fisheye62 distortion model. See the perception camera model implementation
that this was copied from: https://fburl.com/code/oqpu8xdm
v_cam: N x V x 3
focal: N x 2 x 2
@@ -170,45 +171,60 @@
D: N x 8
fov: N x 1
"""
assert (
D.shape[1] == 8
), f"Fisheye62 model requires 8 distortion parameters: {D.shape}"
# See https://www.internalfb.com/code/fbsource/[188bdaeaad64]/arvr/projects/nimble/prod/pynimble/visualization/shaders.py?lines=103-123
# a more readable version: https://euratom-software.github.io/calcam/html/intro_theory.html
if fov is None:
with th.no_grad():
# TODO: bug.
# Fisheye62 uses 8 parameters, and the first 4 can be used
# by the same FOV estimation equation as fisheye distortion.
# However, the code takes the coeffs at indices -4, -3, -2,
# -1: which take the last 4 values, instead of the first 4.
fov = estimate_fisheye_fov(D)
z = v_cam[:, :, 2:3]
z = th.where(z < 0, z.clamp(max=-1e-8), z.clamp(min=1e-8))
v_proj = v_cam[:, :, :2] / z
r = v_proj.pow(2).sum(-1).sqrt() # rp
r = v_proj.pow(2).sum(-1).sqrt()
r = r.clamp(max=fov, min=1e-8 * th.ones_like(fov))
theta = th.atan(r)
theta_d = theta * (
1
+ D[:, 0:1] * theta.pow(2)
+ D[:, 1:2] * theta.pow(4)
+ D[:, 2:3] * theta.pow(6)
+ D[:, 3:4] * theta.pow(8)
+ D[:, 4:5] * theta.pow(10)
+ D[:, 5:6] * theta.pow(12)
theta2 = theta * theta
k0 = D[:, 0].unsqueeze(1)
k1 = D[:, 1].unsqueeze(1)
k2 = D[:, 2].unsqueeze(1)
k3 = D[:, 3].unsqueeze(1)
k4 = D[:, 4].unsqueeze(1)
k5 = D[:, 5].unsqueeze(1)
p0 = D[:, 6].unsqueeze(1)
p1 = D[:, 7].unsqueeze(1)
theta3 = theta2 * theta
theta5 = theta2 * theta3
theta7 = theta2 * theta5
theta9 = theta2 * theta7
theta11 = theta2 * theta9
theta13 = theta2 * theta11
thetad = (
theta
+ k0 * theta3
+ k1 * theta5
+ k2 * theta7
+ k3 * theta9
+ k4 * theta11
+ k5 * theta13
)
r = th.where(r < 0, r.clamp(max=-1e-8), r.clamp(min=1e-8))
v_proj_dist = v_proj * (theta_d / r)[..., None]
v_proj_dist = v_proj * (thetad / r)[..., None]
# Tangential Distortion
x = v_proj_dist[:, :, 0]
y = v_proj_dist[:, :, 1]
x_r = v_proj_dist[:, :, 0]
y_r = v_proj_dist[:, :, 1]
xtan = D[:, 6:7] * (r.pow(2) + 2 * x.pow(2)) + 2 * D[:, 7:8] * x * y
ytan = 2 * D[:, 6:7] * x * y + D[:, 7:8] * (r.pow(2) + 2 * y.pow(2))
rRadial2 = x_r * x_r + y_r * y_r
x_t = (2 * x_r * x_r + rRadial2) * p0 + (2 * x_r * y_r) * p1
y_t = (2 * x_r * y_r) * p0 + (2 * y_r * y_r + rRadial2) * p1
pTangential = th.cat([xtan[..., None], ytan[..., None]], dim=-1)
pTangential = th.cat([x_t[..., None], y_t[..., None]], dim=-1)
v_proj_dist = v_proj_dist + pTangential
@@ -275,13 +291,13 @@ def estimate_fisheye_fov(D: Union[np.ndarray, th.Tensor]) -> th.Tensor:
zeros = np.zeros_like(coefs[:, 0])
coefs = np.stack(
[
9 * coefs[:, -1],
9 * coefs[:, 3],
zeros,
7 * coefs[:, -2],
7 * coefs[:, 2],
zeros,
5 * coefs[:, -3],
5 * coefs[:, 1],
zeros,
3 * coefs[:, -4],
3 * coefs[:, 0],
zeros,
ones,
],
......
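
To spell out the estimate_fisheye_fov index fix above: a tiny standalone sketch (not part of this diff; the numbers are made up) of what the old negative indices selected from an 8-parameter Fisheye62 vector ordered [k0, ..., k5, p0, p1]:

```python
import numpy as np

# Hypothetical Fisheye62 distortion vector, ordered [k0, ..., k5, p0, p1].
D = np.array([[0.4, 0.1, 0.05, 0.01, 0.002, 0.001, 0.01, 0.02]])

# The FOV polynomial only needs the first four radial coefficients.
print(D[:, 0:4])   # k0, k1, k2, k3 -- what the derivative polynomial should use
print(D[:, -4:])   # k4, k5, p0, p1 -- what indices -4..-1 picked up before this fix
```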
# (c) Meta Platforms, Inc. and affiliates. Confidential and proprietary.
from unittest import TestCase
import numpy as np
import torch as th
from arvr.projects.facetracking.hmd.pythonbindings.engine import camera_operator
# @manual=fbsource//arvr/projects/codec_avatar/drtk:utils
from drtk.utils.projection import project_fisheye_distort_62
def get_meshgrid_vec(width: int, height: int) -> np.ndarray:
image_indices = np.meshgrid(np.arange(width), np.arange(height))
image_indices = np.stack(image_indices, axis=-1)
return image_indices.reshape(-1, 2).astype(np.float32)
def generate_unit_plane(
camera: camera_operator.CameraOperator, width: int, height: int
) -> np.ndarray:
image_indices_vec = get_meshgrid_vec(width, height)
uv_positions_2d = camera.unproject_unit_plane(
image_indices_vec, apply_undistortion=False
).astype(np.float64)
uv_positions_3d = np.concatenate(
[
uv_positions_2d,
np.ones([image_indices_vec.shape[0], 1], dtype=uv_positions_2d.dtype),
],
axis=1,
)
return uv_positions_3d
class PerceptionParityTest(TestCase):
def setUp(self):
np.random.seed(42)
def test_fisheye62(self) -> None:
# Hardcoded fisheye62 with no flips and no LUT
n_distortion_parameters = 8
width = 100
height = 200
random_intrinsics = np.eye(4, dtype=np.float64)
random_intrinsics[0, 0] = np.random.uniform(low=0.9, high=1.0) * max(
height, width
)
random_intrinsics[1, 1] = random_intrinsics[0, 0]
random_intrinsics[0, 2] = np.random.uniform(low=0.4, high=0.6) * width
random_intrinsics[1, 2] = np.random.uniform(low=0.4, high=0.6) * height
distortion = np.random.uniform(low=-0.1, high=0.1, size=n_distortion_parameters)
# Create the perception fisheye62 camera
fisheye = camera_operator.CameraOperator.init_with_fisheye(
extrinsic_matrix=np.eye(4).astype(np.float64),
intrinsic_matrix=random_intrinsics,
distortion=distortion,
width=width,
height=height,
name="test",
id=12,
)
self.assertEqual(fisheye.model_type, "FISHEYE62_WITH_BOTH_FOCAL")
# Create the unprojected points using the perception camera (these are
# effectively arbitrary)
unit_plane_points = generate_unit_plane(fisheye, width, height)
perception_output = fisheye.apply_intrinsic(
unit_plane_points, apply_distortion=True
)
# Compare with drtk
focal = th.tensor(fisheye.intrinsic_matrix[:2, :2], dtype=th.float)
drtk_output = project_fisheye_distort_62(
th.tensor(unit_plane_points, dtype=th.float).unsqueeze(0),
th.diag_embed(th.diagonal(focal)).unsqueeze(0),
th.tensor(
[
fisheye.principal_point_x,
fisheye.principal_point_y,
],
dtype=th.float,
).unsqueeze(0),
th.tensor(fisheye.distortion, dtype=th.float).unsqueeze(0),
)
np.testing.assert_allclose(
perception_output, drtk_output.squeeze(0).numpy(), atol=1e-4, rtol=1e-4
)