orthographic

fwilliams · fwilliams · commit 7e85a0e8ada3 · 2026-01-29T21:39:37.000-08:00
Signed-off-by: Francis Williams <francis@fwilliams.info>
diff --git a/src/fvdb/detail/ops/gsplat/GaussianProjectionUT.cu b/src/fvdb/detail/ops/gsplat/GaussianProjectionUT.cu
@@ -60,6 +60,17 @@ template <typename T> class OpenCVCameraModel {
         : K(K_in) {
         deviceAssertOrTrap(K != nullptr);
 
+        // Orthographic is a camera model choice; it is only supported for the undistorted pinhole
+        // math path (no OpenCV distortion).
+        orthographic = (cameraModel == CameraModel::ORTHOGRAPHIC);
+
+        if (cameraModel == CameraModel::ORTHOGRAPHIC) {
+            radial = tangential = thinPrism = nullptr;
+            numRadial = numTangential = numThinPrism = 0;
+            model                                    = Model::NONE;
+            return;
+        }
+
         if (cameraModel == CameraModel::PINHOLE) {
             radial = tangential = thinPrism = nullptr;
             numRadial = numTangential = numThinPrism = 0;
@@ -120,12 +131,17 @@ template <typename T> class OpenCVCameraModel {
     }
 
     // Project a 3D point in camera coordinates to pixel coordinates using this camera model
-    // (pinhole + distortion + intrinsics).
+    // (pinhole/orthographic + distortion + intrinsics).
     __device__ Vec2
     project(const Vec3 &p_cam) const {
-        // Normalize by depth.
-        const T z_inv = T(1) / max(p_cam[2], T(1e-6));
-        const Vec2 p_normalized(p_cam[0] * z_inv, p_cam[1] * z_inv);
+        // Normalize to camera plane.
+        Vec2 p_normalized;
+        if (orthographic) {
+            p_normalized = Vec2(p_cam[0], p_cam[1]);
+        } else {
+            const T z_inv = T(1) / max(p_cam[2], T(1e-6));
+            p_normalized  = Vec2(p_cam[0] * z_inv, p_cam[1] * z_inv);
+        }
 
         const Vec2 p_distorted = applyDistortion(p_normalized);
 
@@ -150,7 +166,8 @@ template <typename T> class OpenCVCameraModel {
 
     // Camera intrinsics pointer (typically points into shared memory).
     // This avoids copying a Mat3 into registers per-thread.
-    const Mat3 *K = nullptr;
+    const Mat3 *K     = nullptr;
+    bool orthographic = false;
 
     // Coefficients for the distortion model.
     const T *radial     = nullptr;     // k1..k6 (but k4..k6 only used in rational model)
@@ -283,7 +300,8 @@ template <typename ScalarType> struct WorldToPixelTransform {
                          const RigidTransform<ScalarType> &xf,
                          Vec2 &out_pix) const {
         const Vec3 p_cam = xf.apply(p_world);
-        // Perspective only (ortho is not meaningful for distorted camera models).
+        // Note: `CameraModel::ORTHOGRAPHIC` still uses the same behind-camera check, but does not
+        // divide by depth in the camera model projection step.
         if (p_cam[2] <= ScalarType(0)) {
             // Ensure deterministic output to avoid UB on callers that assign/read even on invalid
             // projections. This value is ignored when we treat BehindCamera as a hard reject.
@@ -803,8 +821,7 @@ dispatchGaussianProjectionForwardUT<torch::kCUDA>(
     const float nearPlane,
     const float farPlane,
     const float minRadius2d,
-    const bool calcCompensations,
-    const bool ortho) {
+    const bool calcCompensations) {
     FVDB_FUNC_RANGE();
 
     TORCH_CHECK_VALUE(means.is_cuda(), "means must be a CUDA tensor");
@@ -817,7 +834,7 @@ dispatchGaussianProjectionForwardUT<torch::kCUDA>(
     TORCH_CHECK_VALUE(projectionMatrices.is_cuda(), "projectionMatrices must be a CUDA tensor");
     TORCH_CHECK_VALUE(distortionCoeffs.is_cuda(), "distortionCoeffs must be a CUDA tensor");
     TORCH_CHECK_VALUE(distortionCoeffs.dim() == 2, "distortionCoeffs must be 2D");
-    if (cameraModel == CameraModel::PINHOLE) {
+    if (cameraModel == CameraModel::PINHOLE || cameraModel == CameraModel::ORTHOGRAPHIC) {
         // Accept any K (including 0); ignored.
     } else if (cameraModel == CameraModel::OPENCV_RADTAN_5 ||
                cameraModel == CameraModel::OPENCV_RATIONAL_8 ||
@@ -857,10 +874,7 @@ dispatchGaussianProjectionForwardUT<torch::kCUDA>(
     using scalar_t = float;
 
     const size_t NUM_BLOCKS = GET_BLOCKS(C * N, 256);
-    // This kernel currently implements the (distorted) perspective camera model.
-    // Keep parity with the reference kernel: orthographic is not supported here.
-    TORCH_CHECK_VALUE(!ortho,
-                      "GaussianProjectionForwardUT does not support orthographic projection");
+    // Orthographic projection is selected via CameraModel::ORTHOGRAPHIC (always undistorted).
 
     const size_t SHARED_MEM_SIZE = C * (3 * sizeof(nanovdb::math::Mat3<scalar_t>) +
                                         2 * sizeof(nanovdb::math::Vec3<scalar_t>)) +
@@ -915,8 +929,7 @@ dispatchGaussianProjectionForwardUT<torch::kCPU>(
     const float nearPlane,
     const float farPlane,
     const float minRadius2d,
-    const bool calcCompensations,
-    const bool ortho) {
+    const bool calcCompensations) {
     TORCH_CHECK_NOT_IMPLEMENTED(false, "GaussianProjectionForwardUT not implemented on the CPU");
 }
 
@@ -939,8 +952,7 @@ dispatchGaussianProjectionForwardUT<torch::kPrivateUse1>(
     const float nearPlane,
     const float farPlane,
     const float minRadius2d,
-    const bool calcCompensations,
-    const bool ortho) {
+    const bool calcCompensations) {
     TORCH_CHECK_NOT_IMPLEMENTED(false,
                                 "GaussianProjectionForwardUT not implemented for this device type");
 }
diff --git a/src/fvdb/detail/ops/gsplat/GaussianProjectionUT.h b/src/fvdb/detail/ops/gsplat/GaussianProjectionUT.h
@@ -25,6 +25,9 @@ enum class CameraModel : int32_t {
     // Pinhole intrinsics only (no distortion).
     PINHOLE = 0,
 
+    // Orthographic intrinsics (no distortion).
+    ORTHOGRAPHIC = 5,
+
     // OpenCV variants which are just pinhole intrinsics + optional distortion (all of them use the
     // same [C,12] distortion coefficients layout: [k1,k2,k3,k4,k5,k6,p1,p2,s1,s2,s3,s4]).
     OPENCV_RADTAN_5            = 1, // polynomial radial (k1,k2,k3) + tangential (p1,p2)).
@@ -83,6 +86,7 @@ struct UTParams {
 /// @param[in] cameraModel Camera model used to interpret `distortionCoeffs`.
 /// @param[in] distortionCoeffs Distortion coefficients for each camera.
 ///   - CameraModel::PINHOLE: ignored (use [C,0] or [C,K] tensor).
+///   - CameraModel::ORTHOGRAPHIC: ignored (use [C,0] or [C,K] tensor).
 ///   - CameraModel::OPENCV_*: expects [C,12] coefficients in the following order:
 ///       [k1,k2,k3,k4,k5,k6,p1,p2,s1,s2,s3,s4]
 ///     where k1..k6 are radial (rational), p1,p2 are tangential, and s1..s4 are thin-prism.
@@ -94,7 +98,6 @@ struct UTParams {
 /// @param[in] minRadius2d Minimum 2D radius threshold; Gaussians with projected radius <= this
 /// value are clipped/discarded
 /// @param[in] calcCompensations Whether to calculate view-dependent compensation factors
-/// @param[in] ortho Whether to use orthographic projection instead of perspective
 ///
 /// @return std::tuple containing:
 ///         - Radii of 2D Gaussians [C, N]
@@ -114,15 +117,14 @@ dispatchGaussianProjectionForwardUT(
     const RollingShutterType rollingShutterType,
     const UTParams &utParams,
     const CameraModel cameraModel,
-    const torch::Tensor &distortionCoeffs, // [C, 12] for OPENCV_*, or [C, 0] for NONE
+    const torch::Tensor &distortionCoeffs, // [C, 12] for OPENCV_*, or [C, 0] for PINHOLE/ORTHO
     const int64_t imageWidth,
     const int64_t imageHeight,
     const float eps2d,
     const float nearPlane,
     const float farPlane,
     const float minRadius2d,
-    const bool calcCompensations,
-    const bool ortho);
+    const bool calcCompensations);
 
 } // namespace ops
 } // namespace detail
diff --git a/src/tests/GaussianProjectionUTTest.cpp b/src/tests/GaussianProjectionUTTest.cpp
@@ -189,7 +189,6 @@ TEST_F(GaussianProjectionUTTestFixture, CenteredGaussian_NoDistortion_AnalyticMe
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto means2d_cpu = means2d.cpu();
@@ -219,6 +218,78 @@ TEST_F(GaussianProjectionUTTestFixture, CenteredGaussian_NoDistortion_AnalyticMe
     EXPECT_NEAR(conics_cpu[0][0][2].item<float>(), expected_c, 1e-3f);
 }
 
+TEST_F(GaussianProjectionUTTestFixture, Orthographic_NoDistortion_AnalyticMeanAndDepth) {
+    const int64_t C = 1;
+
+    const float x = 1.0f, y = -2.0f, z = 10.0f;
+    means     = torch::tensor({{x, y, z}}, torch::kFloat32);
+    quats     = torch::tensor({{1.0f, 0.0f, 0.0f, 0.0f}}, torch::kFloat32);
+    logScales = torch::log(torch::tensor({{0.2f, 0.3f, 0.4f}}, torch::kFloat32));
+
+    worldToCamMatricesStart =
+        torch::eye(4, torch::TensorOptions().dtype(torch::kFloat32)).unsqueeze(0).expand({C, 4, 4});
+    worldToCamMatricesEnd = worldToCamMatricesStart.clone();
+
+    const float fx = 123.0f, fy = 77.0f, cx = 320.0f, cy = 240.0f;
+    projectionMatrices = torch::zeros({C, 3, 3}, torch::TensorOptions().dtype(torch::kFloat32));
+    auto projectionMatricesAcc     = projectionMatrices.accessor<float, 3>();
+    projectionMatricesAcc[0][0][0] = fx;
+    projectionMatricesAcc[0][1][1] = fy;
+    projectionMatricesAcc[0][0][2] = cx;
+    projectionMatricesAcc[0][1][2] = cy;
+    projectionMatricesAcc[0][2][2] = 1.0f;
+
+    cameraModel      = CameraModel::ORTHOGRAPHIC;
+    distortionCoeffs = torch::zeros({C, 0}, torch::kFloat32);
+
+    imageWidth  = 640;
+    imageHeight = 480;
+    eps2d       = 0.3f;
+    nearPlane   = 0.1f;
+    farPlane    = 100.0f;
+    minRadius2d = 0.0f;
+
+    utParams                              = UTParams{};
+    utParams.inImageMargin                = 0.1f;
+    utParams.requireAllSigmaPointsInImage = true;
+
+    means                   = means.cuda();
+    quats                   = quats.cuda();
+    logScales               = logScales.cuda();
+    worldToCamMatricesStart = worldToCamMatricesStart.cuda();
+    worldToCamMatricesEnd   = worldToCamMatricesEnd.cuda();
+    projectionMatrices      = projectionMatrices.cuda();
+    distortionCoeffs        = distortionCoeffs.cuda();
+
+    const auto [radii, means2d, depths, conics, compensations] =
+        dispatchGaussianProjectionForwardUT<torch::kCUDA>(means,
+                                                          quats,
+                                                          logScales,
+                                                          worldToCamMatricesStart,
+                                                          worldToCamMatricesEnd,
+                                                          projectionMatrices,
+                                                          RollingShutterType::NONE,
+                                                          utParams,
+                                                          cameraModel,
+                                                          distortionCoeffs,
+                                                          imageWidth,
+                                                          imageHeight,
+                                                          eps2d,
+                                                          nearPlane,
+                                                          farPlane,
+                                                          minRadius2d,
+                                                          false);
+
+    auto means2d_cpu = means2d.cpu();
+    auto depths_cpu  = depths.cpu();
+    auto radii_cpu   = radii.cpu();
+
+    EXPECT_GT(radii_cpu[0][0].item<int32_t>(), 0);
+    EXPECT_NEAR(depths_cpu[0][0].item<float>(), z, 1e-4f);
+    EXPECT_NEAR(means2d_cpu[0][0][0].item<float>(), fx * x + cx, 1e-3f);
+    EXPECT_NEAR(means2d_cpu[0][0][1].item<float>(), fy * y + cy, 1e-3f);
+}
+
 TEST_F(GaussianProjectionUTTestFixture, OffAxisTinyGaussian_NoDistortion_MeanMatchesPinhole) {
     const int64_t C = 1;
 
@@ -283,7 +354,6 @@ TEST_F(GaussianProjectionUTTestFixture, OffAxisTinyGaussian_NoDistortion_MeanMat
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto means2d_cpu       = means2d.cpu();
@@ -379,7 +449,6 @@ TEST_F(GaussianProjectionUTTestFixture, MultiCamera_RadTanDistortion_PerCameraPa
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto radii_cpu   = radii.cpu();
@@ -475,7 +544,6 @@ TEST_F(GaussianProjectionUTTestFixture,
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto radii_cpu   = radii.cpu();
@@ -569,7 +637,6 @@ TEST_F(GaussianProjectionUTTestFixture,
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto radii_cpu   = radii.cpu();
@@ -671,7 +738,6 @@ TEST_F(GaussianProjectionUTTestFixture,
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto radii_cpu   = radii.cpu();
@@ -768,7 +834,6 @@ TEST_F(GaussianProjectionUTTestFixture,
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto radii_cpu   = radii.cpu();
@@ -837,7 +902,6 @@ TEST_F(GaussianProjectionUTTestFixture, RadTanThinPrism_IgnoresK456EvenIfNonZero
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto radii_cpu   = radii.cpu();
@@ -922,7 +986,6 @@ TEST_F(GaussianProjectionUTTestFixture,
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     // When the UT kernel discards a Gaussian, only radii are defined to be 0; other outputs are
@@ -997,7 +1060,6 @@ TEST_F(GaussianProjectionUTTestFixture,
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto radii_cpu = radii.cpu();
@@ -1069,7 +1131,6 @@ TEST_F(GaussianProjectionUTTestFixture, RollingShutterNone_DepthUsesStartPoseNot
                                                           nearPlane,
                                                           farPlane,
                                                           minRadius2d,
-                                                          false,
                                                           false);
 
     auto depths_cpu = depths.cpu();