openvdb · fwilliams · Feb 4, 2026 · Jan 20, 2026 · Jan 20, 2026 · Jan 20, 2026
@@ -110,6 +110,7 @@ set(FVDB_CU_FILES
     fvdb/detail/ops/gsplat/GaussianMCMCRelocation.cu
     fvdb/detail/ops/gsplat/GaussianProjectionBackward.cu
     fvdb/detail/ops/gsplat/GaussianProjectionForward.cu
+    fvdb/detail/ops/gsplat/GaussianProjectionUT.cu
     fvdb/detail/ops/gsplat/GaussianProjectionJaggedBackward.cu
     fvdb/detail/ops/gsplat/GaussianProjectionJaggedForward.cu
     fvdb/detail/ops/gsplat/GaussianRasterizeBackward.cu
@@ -171,7 +172,7 @@ set_target_properties(
     CXX_STANDARD 20
     CXX_STANDARD_REQUIRED ON
     CXX_EXTENSIONS ON
-    CUDA_STANDARD 20
+              CUDA_STANDARD 20
     CUDA_STANDARD_REQUIRED ON
     POSITION_INDEPENDENT_CODE ON
     INTERFACE_POSITION_INDEPENDENT_CODE ON)

@@ -1307,7 +1307,7 @@ GridBatchImpl::deserializeV0(const torch::Tensor &serialized) {
     };
 
     TORCH_CHECK(serialized.scalar_type() == torch::kInt8, "Serialized data must be of type int8");
-    TORCH_CHECK(serialized.numel() >= sizeof(V01Header),
+    TORCH_CHECK(serialized.numel() >= static_cast<int64_t>(sizeof(V01Header)),
                 "Serialized data is too small to be a valid grid handle");
 
     const int8_t *serializedPtr = serialized.data_ptr<int8_t>();
@@ -1316,7 +1316,7 @@ GridBatchImpl::deserializeV0(const torch::Tensor &serialized) {
     TORCH_CHECK(header->magic == 0x0F0F0F0F0F0F0F0F,
                 "Serialized data is not a valid grid handle. Bad magic.");
     TORCH_CHECK(header->version == 0, "Serialized data is not a valid grid handle. Bad version.");
-    TORCH_CHECK(serialized.numel() == header->totalBytes,
+    TORCH_CHECK(static_cast<uint64_t>(serialized.numel()) == header->totalBytes,
                 "Serialized data is not a valid grid handle. Bad total bytes.");
 
     const uint64_t numGrids = header->numGrids;
@@ -1752,7 +1752,7 @@ GridBatchImpl::dilate(const int64_t dilationAmount) {
 c10::intrusive_ptr<GridBatchImpl>
 GridBatchImpl::dilate(const std::vector<int64_t> dilationAmount) {
     c10::DeviceGuard guard(device());
-    TORCH_CHECK_VALUE(dilationAmount.size() == batchSize(),
+    TORCH_CHECK_VALUE(static_cast<int64_t>(dilationAmount.size()) == batchSize(),
                       "dilationAmount should have same size as batch size, got ",
                       dilationAmount.size(),
                       " != ",

@@ -91,15 +91,7 @@ template <typename T, bool Ortho> struct ProjectionForward {
           mOutDepthsAcc(outDepths.packed_accessor64<T, 2, torch::RestrictPtrTraits>()),
           mOutConicsAcc(outConics.packed_accessor64<T, 3, torch::RestrictPtrTraits>()),
           mOutCompensationsAcc(outCompensations.defined() ? outCompensations.data_ptr<T>()
-                                                          : nullptr) {
-        mMeansAcc     = means.packed_accessor64<T, 2, torch::RestrictPtrTraits>();
-        mQuatsAcc     = quats.packed_accessor64<T, 2, torch::RestrictPtrTraits>();
-        mLogScalesAcc = logScales.packed_accessor64<T, 2, torch::RestrictPtrTraits>();
-        mWorldToCamMatricesAcc =
-            worldToCamMatrices.packed_accessor32<T, 3, torch::RestrictPtrTraits>();
-        mProjectionMatricesAcc =
-            projectionMatrices.packed_accessor32<T, 3, torch::RestrictPtrTraits>();
-    }
+                                                          : nullptr) {}
 
     inline __device__ Mat3
     computeCovarianceMatrix(int64_t gid) const {

@@ -0,0 +1,121 @@
+// Copyright Contributors to the OpenVDB Project
+// SPDX-License-Identifier: Apache-2.0
+//
+#ifndef FVDB_DETAIL_OPS_GSPLAT_GAUSSIANPROJECTIONUT_H
+#define FVDB_DETAIL_OPS_GSPLAT_GAUSSIANPROJECTIONUT_H
+
+#include <ATen/core/TensorBody.h>
+#include <torch/types.h>
+
+#include <tuple>
+
+namespace fvdb {
+namespace detail {
+namespace ops {
+
+enum class RollingShutterType { NONE = 0, VERTICAL = 1, HORIZONTAL = 2 }; // rolling-shutter mode
+
+// Distortion model for camera projection in the Unscented Transform (UT) kernel.
+//
+// Distortion coefficients are supplied as a single tensor `distortionCoeffs` and interpreted
+// according to this enum.
+enum class DistortionModel : int32_t {
+    NONE = 0, // no distortion; `distortionCoeffs` is ignored
+
+    // OpenCV variants (all use the same [C,12] coefficient layout):
+    //   [k1,k2,k3,k4,k5,k6,p1,p2,s1,s2,s3,s4]
+    //
+    // The enum exists mostly for clarity and runtime validation of coefficient usage.
+    OPENCV_RADTAN_5            = 1, // polynomial radial (k1,k2,k3) + tangential (p1,p2)
+    OPENCV_RATIONAL_8          = 2, // rational radial (k1..k6) + tangential (p1,p2)
+    OPENCV_RADTAN_THIN_PRISM_9 = 3, // polynomial radial + tangential + thin-prism (s1..s4)
+    OPENCV_THIN_PRISM_12       = 4, // rational radial + tangential + thin-prism (s1..s4)
+};
+
+struct UTParams {
+    float alpha = 0.1f; // UT alpha (sigma-point spread in standard UT; confirm kernel usage)
+    float beta  = 2.0f; // UT beta (prior-distribution term in standard UT; confirm kernel usage)
+    float kappa = 0.0f; // UT kappa (secondary scaling term in standard UT; confirm kernel usage)
+    // For a 3D Unscented Transform with the standard 2D+1 formulation, D=3 => 7 sigma points.
+    // This implementation currently supports only this 3D case.
+    int numSigmaPoints  = 7;
+    float inImageMargin = 0.1f; // Margin for in-image check
+    bool requireAllSigmaPointsInImage =
+        true; // Require all sigma points to be in image to consider a Gaussian valid
+};
+
+/// @brief Project 3D Gaussians to 2D pixel coordinates via the Unscented Transform (UT)
+///
+/// This function transforms 3D Gaussians to 2D screen space by applying camera projections.
+/// It computes the 2D means, depths, 2D covariance matrices (conics), and optionally compensation
+/// factors to accurately represent the 3D Gaussians in 2D for later rasterization.
+///
+/// The origin of the 2D pixel coordinates is the top-left corner of the image, with positive x-axis
+/// pointing to the right and positive y-axis pointing downwards.
+///
+/// @attention The output radii of 3D Gaussians that are discarded (due to clipping or a projection
+/// that is too small) are set to zero, but the other output values of discarded Gaussians are
+/// uninitialized (undefined).
+///
+/// @tparam DeviceType Device type template parameter (torch::kCUDA or torch::kCPU)
+///
+/// @param[in] means 3D positions of Gaussians [N, 3] where N is number of Gaussians
+/// @param[in] quats Quaternion rotations of Gaussians [N, 4] in format (w, x, y, z)
+/// @param[in] logScales Log-scale factors of Gaussians [N, 3] (natural log), representing extent in
+/// each dimension
+/// @param[in] worldToCamMatricesStart Camera view matrices at the start of the frame. Shape [C, 4,
+/// 4] where C is number of cameras
+/// @param[in] worldToCamMatricesEnd Camera view matrices at the end of the frame. Shape [C, 4, 4]
+/// where C is number of cameras
+/// @param[in] projectionMatrices Camera intrinsic matrices [C, 3, 3]
+/// @param[in] rollingShutterType Type of rolling shutter effect to apply
+/// @param[in] utParams Unscented Transform parameters
+/// @param[in] distortionModel Distortion model used to interpret `distortionCoeffs`.
+/// @param[in] distortionCoeffs Distortion coefficients for each camera.
+///   - DistortionModel::NONE: ignored (use [C,0] or [C,K] tensor).
+///   - DistortionModel::OPENCV_*: expects [C,12] coefficients in the following order:
+///       [k1,k2,k3,k4,k5,k6,p1,p2,s1,s2,s3,s4]
+///     where k1..k6 are radial (rational), p1,p2 are tangential, and s1..s4 are thin-prism.
+/// @param[in] imageWidth Width of the output image in pixels
+/// @param[in] imageHeight Height of the output image in pixels
+/// @param[in] eps2d 2D projection epsilon for numerical stability
+/// @param[in] nearPlane Near clipping plane distance
+/// @param[in] farPlane Far clipping plane distance
+/// @param[in] minRadius2d Minimum 2D radius threshold; Gaussians with projected radius <= this
+/// value are clipped/discarded
+/// @param[in] calcCompensations Whether to calculate view-dependent compensation factors
+/// @param[in] ortho Whether to use orthographic projection instead of perspective
+///
+/// @return std::tuple containing:
+///         - Radii of 2D Gaussians [C, N]
+///         - 2D projected Gaussian centers [C, N, 2]
+///         - Depths of Gaussians [C, N]
+///         - Covariance matrices in conic form [C, N, 3] representing (a, b, c) in ax² + 2bxy + cy²
+///         - Compensation factors [C, N] (if calcCompensations is true, otherwise empty tensor)
+template <torch::DeviceType>
+std::tuple<torch::Tensor, torch::Tensor, torch::Tensor, torch::Tensor, torch::Tensor>
+dispatchGaussianProjectionForwardUT(
+    const torch::Tensor &means,                   // [N, 3]
+    const torch::Tensor &quats,                   // [N, 4]
+    const torch::Tensor &logScales,               // [N, 3]
+    const torch::Tensor &worldToCamMatricesStart, // [C, 4, 4]
+    const torch::Tensor &worldToCamMatricesEnd,   // [C, 4, 4]
+    const torch::Tensor &projectionMatrices,      // [C, 3, 3]
+    const RollingShutterType rollingShutterType,
+    const UTParams &utParams,
+    const DistortionModel distortionModel,
+    const torch::Tensor &distortionCoeffs, // [C, 12] for OPENCV_*, or [C, 0] for NONE
+    const int64_t imageWidth,
+    const int64_t imageHeight,
+    const float eps2d,
+    const float nearPlane,
+    const float farPlane,
+    const float minRadius2d,
+    const bool calcCompensations,
+    const bool ortho);
+
+} // namespace ops
+} // namespace detail
+} // namespace fvdb
+
+#endif // FVDB_DETAIL_OPS_GSPLAT_GAUSSIANPROJECTIONUT_H