File size: 13,629 Bytes

50a800c

"""
Core NKSR wrapper: high-level mesh reconstruction API.
"""

from __future__ import annotations

from dataclasses import dataclass
from pathlib import Path
from typing import Optional, Union, Callable
import warnings

import numpy as np
import torch


# NKSR is a hard dependency of this module.  Fail at import time with
# installation instructions instead of a bare ``ImportError``; the original
# exception is chained (``from exc``) so the underlying cause stays visible.
try:
    import nksr
except ImportError as exc:
    raise ImportError(
        "The `nksr` package is required but not installed. "
        "Please install it from https://github.com/nv-tlabs/NKSR:\n"
        "  git clone https://github.com/nv-tlabs/NKSR.git\n"
        "  cd NKSR && pip install --no-build-isolation package/\n"
        "See the README for environment setup details."
    ) from exc


@dataclass
class MeshResult:
    """
    Triangle mesh produced by a reconstruction run.

    Attributes
    ----------
    vertices : np.ndarray
        (V, 3) float array of mesh vertex positions.
    faces : np.ndarray
        (F, 3) int array of triangle face indices.
    vertex_colors : np.ndarray, optional
        (V, 3) float array of per-vertex colors, if texture was
        reconstructed; ``None`` otherwise.
    """

    vertices: np.ndarray
    faces: np.ndarray
    vertex_colors: Optional[np.ndarray] = None

    def save(self, path: Union[str, Path]) -> None:
        """
        Export the mesh to *path* through Trimesh.

        ``trimesh`` is imported inside the method, so it is only needed
        when a mesh is actually written out.
        """
        from trimesh import Trimesh

        mesh_kwargs = {
            "vertices": self.vertices,
            "faces": self.faces,
            "vertex_colors": self.vertex_colors,
        }
        Trimesh(**mesh_kwargs).export(str(path))


class NKSRMeshReconstructor:
    """
    High-level wrapper around the NKSR reconstructor.

    This class hides the internal complexity of NKSR and exposes a single
    ``reconstruct()`` call that takes a point cloud (with optional normals)
    and returns a watertight triangle mesh.

    Parameters
    ----------
    device : str or torch.device, optional
        PyTorch device to run inference on. Default ``"cuda:0"``.
    config : str, optional
        NKSR model configuration to load.  Default ``"ks"`` (kitchen-sink,
        general-purpose pretrained model).  Other options include ``"snet"``
        (ShapeNet objects with normals) and ``"snet-wonormal"`` (ShapeNet
        without normals).
    chunk_tmp_device : str or torch.device, optional
        Temporary offload device for finished chunks when reconstructing very
        large scenes.  Default ``"cpu"``.  Set to ``None`` to disable
        off-loading (keeps everything on *device*).
    """

    # Default number of query points handled per step of the brute-force
    # k-NN search used for normal estimation.
    _NORMAL_BATCH_SIZE = 4096

    # Upper bound on the number of pairwise distances materialised at once
    # (2**27 float32 values = 512 MiB).  The batch size shrinks for large
    # clouds so the (batch, N) distance matrix stays below this budget.
    _MAX_PAIRWISE_ELEMENTS = 1 << 27

    def __init__(
        self,
        device: Union[str, torch.device] = "cuda:0",
        config: str = "ks",
        chunk_tmp_device: Optional[Union[str, torch.device]] = "cpu",
    ):
        self.device = torch.device(device)
        self.reconstructor = nksr.Reconstructor(self.device, config=config)

        # Pin the off-load device explicitly so that ``None`` really means
        # "stay on *device*", independent of whatever NKSR defaults to.
        if chunk_tmp_device is None:
            self.reconstructor.chunk_tmp_device = self.device
        else:
            self.reconstructor.chunk_tmp_device = torch.device(chunk_tmp_device)

        self._config_name = config

    # ------------------------------------------------------------------ #
    #  Public API                                                        #
    # ------------------------------------------------------------------ #

    def reconstruct(
        self,
        points: np.ndarray,
        normals: Optional[np.ndarray] = None,
        sensor_positions: Optional[np.ndarray] = None,
        colors: Optional[np.ndarray] = None,
        *,
        detail_level: float = 1.0,
        voxel_size: Optional[float] = None,
        chunk_size: float = -1.0,
        overlap_ratio: float = 0.05,
        approx_kernel_grad: bool = False,
        solver_max_iter: int = 2000,
        solver_tol: float = 1e-5,
        nystrom_min_depth: int = 100,
        fused_mode: bool = True,
        mise_iter: int = 1,
        estimate_normals_if_missing: bool = True,
        normal_knn: int = 64,
        normal_drop_threshold_deg: float = 85.0,
    ) -> "MeshResult":
        """
        Reconstruct a watertight mesh from a point cloud.

        Parameters
        ----------
        points : np.ndarray
            (N, 3) array of point positions.
        normals : np.ndarray, optional
            (N, 3) array of **oriented** point normals.  If ``None`` and
            *sensor_positions* are also ``None``, normals are estimated on
            the fly (requires *estimate_normals_if_missing* = ``True``).
        sensor_positions : np.ndarray, optional
            (N, 3) array of per-point sensor/camera positions.  When normals
            are missing, NKSR can infer orientation from the point-to-sensor
            vector using the internal ``get_estimate_normal_preprocess_fn``.
            Whenever given, the positions are converted to a tensor on the
            target device and forwarded to NKSR.
        colors : np.ndarray, optional
            (N, 3) array of RGB colors in ``[0, 255]`` or ``[0, 1]``.  If
            provided, the returned mesh will contain per-vertex colors.
            Values are divided by 255 when the maximum exceeds ``1.0``.
        detail_level : float, default 1.0
            Trade-off between smoothness and detail.  ``0.0`` = very smooth,
            ``1.0`` = maximum detail (may over-fit noise).  Ignored when
            *chunk_size* > 0 or *voxel_size* is set.
        voxel_size : float, optional
            Explicit voxel size controlling the reconstruction resolution.
            Overrides *detail_level*.
        chunk_size : float, default -1.0
            Spatial extent of each chunk for out-of-core reconstruction.
            ``-1.0`` disables chunking (process everything at once).  Positive
            values are required for very large point clouds (> few million
            points) to avoid out-of-memory errors.
        overlap_ratio : float, default 0.05
            Overlap between adjacent chunks (as a fraction of *chunk_size*).
        approx_kernel_grad : bool, default False
            Whether to approximate kernel gradients — slightly faster but a
            bit less accurate.
        solver_max_iter : int, default 2000
            Maximum iterations for the sparse PCG linear solver.
        solver_tol : float, default 1e-5
            Convergence tolerance for the PCG solver.
        nystrom_min_depth : int, default 100
            Minimum depth for the Nyström low-rank approximation used by the
            kernel field.
        fused_mode : bool, default True
            Memory-efficient fusion mode when chunking is enabled.
        mise_iter : int, default 1
            Number of MISE (Multi-resolution IsoSurface Extraction) iterations.
            ``0`` = base grid resolution, each additional iteration doubles
            the effective resolution in subdivided cells.  Raised to ``2``
            (with a warning) when *colors* are given and the value is lower.
        estimate_normals_if_missing : bool, default True
            If ``True`` and no normals are provided, estimate them from the
            local geometry.  This only works well when the surface is
            sufficiently sampled.
        normal_knn : int, default 64
            k-NN neighborhood size for on-the-fly normal estimation.
        normal_drop_threshold_deg : float, default 85.0
            Maximum angle (in degrees) between the estimated normal and the
            point-to-sensor vector.  Points exceeding this are dropped.

        Returns
        -------
        MeshResult
            Container with ``vertices``, ``faces``, and optionally
            ``vertex_colors``.

        Raises
        ------
        ValueError
            If any input array is not of shape (N, 3), or if *normals*,
            *sensor_positions* or *colors* do not have one row per point.

        Notes
        -----
        1. **Normals matter.**  NKSR is designed for oriented normals.  If
           your input lacks them, the wrapper will try to estimate them, but
           orientation may be arbitrary (leading to inside-out meshes).
           Providing *sensor_positions* gives the best auto-orientation.
        2. **Scale.**  The default ``voxel_size`` in the ``"ks"`` config is
           ``0.1``.  If your point cloud is in metres and represents a
           room-scale scene, ``0.1`` = 10 cm, which is reasonable.  Adjust
           *voxel_size* or scale your data accordingly.
        3. **Chunking.**  When ``chunk_size > 0``, *detail_level* and
           *voxel_size* are ignored by the underlying NKSR code.  To control
           detail in chunked mode, pre-scale the point cloud by
           ``0.1 / desired_voxel_size``.
        """
        points = self._to_tensor(points, "points")
        num_points = points.shape[0]

        # ---- sensor positions -----------------------------------------------
        # Converted whenever present: they are forwarded to NKSR even when
        # explicit normals are supplied, so they must never stay a raw array.
        if sensor_positions is not None:
            sensor_positions = self._to_tensor(sensor_positions, "sensor_positions")
            self._check_point_count(sensor_positions, num_points, "sensor_positions")

        # ---- handle normals ------------------------------------------------
        preprocess_fn: Optional[Callable] = None

        if normals is not None:
            normals = self._to_tensor(normals, "normals")
            self._check_point_count(normals, num_points, "normals")
        elif sensor_positions is not None:
            # Let NKSR estimate and orient the normals from the sensor rays.
            preprocess_fn = nksr.get_estimate_normal_preprocess_fn(
                knn=normal_knn,
                drop_threshold_degrees=normal_drop_threshold_deg,
            )
        elif estimate_normals_if_missing:
            warnings.warn(
                "No normals or sensor positions provided. "
                "Estimating normals from geometry — orientation may be arbitrary. "
                "Consider providing sensor_positions for best results.",
                UserWarning,
                stacklevel=2,
            )
            normals = self._estimate_normals_from_points(points, normal_knn)

        # ---- colors ---------------------------------------------------------
        color_tensor: Optional[torch.Tensor] = None
        if colors is not None:
            colors = np.asarray(colors)
            # Heuristic range detection; ``size`` guard avoids ``max()`` on an
            # empty array, which would raise before shape validation.
            if colors.size and colors.max() > 1.0:
                colors = colors / 255.0
            color_tensor = self._to_tensor(colors, "colors")
            self._check_point_count(color_tensor, num_points, "colors")

        # ---- reconstruct ----------------------------------------------------
        field = self.reconstructor.reconstruct(
            xyz=points,
            normal=normals,
            sensor=sensor_positions,
            detail_level=detail_level,
            voxel_size=voxel_size,
            chunk_size=chunk_size,
            overlap_ratio=overlap_ratio,
            approx_kernel_grad=approx_kernel_grad,
            solver_max_iter=solver_max_iter,
            solver_tol=solver_tol,
            nystrom_min_depth=nystrom_min_depth,
            fused_mode=fused_mode,
            preprocess_fn=preprocess_fn,
        )

        # ---- optional texture ------------------------------------------------
        if color_tensor is not None:
            field.set_texture_field(nksr.fields.PCNNField(points, color_tensor))
            if mise_iter < 2:
                warnings.warn(
                    "Color reconstruction requested but mise_iter < 2. "
                    "Increasing to 2 for better color resolution.",
                    UserWarning,
                    stacklevel=2,
                )
                mise_iter = 2

        # ---- extract mesh ---------------------------------------------------
        mesh = field.extract_dual_mesh(mise_iter=mise_iter)

        mesh_colors = getattr(mesh, "c", None)
        return MeshResult(
            vertices=self._as_numpy(mesh.v),
            faces=self._as_numpy(mesh.f),
            vertex_colors=None if mesh_colors is None else self._as_numpy(mesh_colors),
        )

    # ------------------------------------------------------------------ #
    #  Helpers                                                           #
    # ------------------------------------------------------------------ #

    @staticmethod
    def _as_numpy(value) -> np.ndarray:
        """Return *value* (tensor or array-like) as a NumPy array on the host."""
        if isinstance(value, torch.Tensor):
            # ``detach`` keeps the conversion valid for tensors that track
            # gradients, for which ``.numpy()`` would otherwise raise.
            return value.detach().cpu().numpy()
        if hasattr(value, "cpu"):
            return value.cpu().numpy()
        return np.asarray(value)

    @staticmethod
    def _check_point_count(tensor: torch.Tensor, expected: int, name: str) -> None:
        """Raise ``ValueError`` unless *tensor* has exactly *expected* rows."""
        actual = tensor.shape[0]
        if actual != expected:
            raise ValueError(
                f"{name} must have the same number of rows as points "
                f"({expected}), got {actual}"
            )

    def _to_tensor(self, arr: np.ndarray, name: str) -> torch.Tensor:
        """
        Convert an array-like to a float32 tensor on the target device.

        Parameters
        ----------
        arr : array-like
            Data of shape (N, 3).
        name : str
            Argument name used in the error message.

        Raises
        ------
        ValueError
            If *arr* does not have shape (N, 3).
        """
        arr = np.asarray(arr)
        if arr.ndim != 2 or arr.shape[1] != 3:
            raise ValueError(
                f"{name} must have shape (N, 3), got {arr.shape}"
            )
        # ``torch.from_numpy`` rejects negative-stride views (e.g. ``a[::-1]``)
        # and some dtypes; casting to a contiguous float32 buffer on the
        # NumPy side first sidesteps both.
        arr = np.ascontiguousarray(arr, dtype=np.float32)
        return torch.from_numpy(arr).to(self.device)

    def _estimate_normals_from_points(
        self, points: torch.Tensor, k: int = 64
    ) -> torch.Tensor:
        """
        Fast PCA-based normal estimation using PyTorch (no Open3D dependency).

        This estimates **unoriented** normals.  Orientation is arbitrary,
        so the resulting mesh may be inside-out.  As a heuristic, normals
        are flipped to point away from the cloud centroid.

        Parameters
        ----------
        points : torch.Tensor
            (N, 3) point positions.
        k : int, default 64
            Neighborhood size; clamped to ``N`` for small clouds.

        Returns
        -------
        torch.Tensor
            (N, 3) tensor of estimated normals.

        Raises
        ------
        ValueError
            If *k* is smaller than 1.
        """
        if k < 1:
            raise ValueError(f"k must be a positive integer, got {k}")

        N = points.shape[0]
        if N == 0:
            # Nothing to estimate; avoids ``torch.cat`` on an empty list.
            return points.new_zeros((0, 3))

        # Simple k-NN with brute force — acceptable for moderate N (< 100k).
        # For larger clouds the user should pre-compute normals externally.
        if N > 100_000:
            warnings.warn(
                f"Point cloud has {N} points; on-the-fly normal estimation "
                f"may be slow. Consider pre-computing normals with Open3D.",
                UserWarning,
            )

        num_neighbors = min(k, N)
        # Each step materialises a (batch, N) distance matrix; shrink the
        # batch for large clouds so that matrix stays within the budget.
        batch_size = max(
            1, min(self._NORMAL_BATCH_SIZE, self._MAX_PAIRWISE_ELEMENTS // N)
        )

        per_batch_normals = []
        for start in range(0, N, batch_size):
            batch = points[start : start + batch_size]  # (B, 3)
            dists = torch.cdist(batch, points)  # (B, N)
            idx = torch.topk(
                dists, k=num_neighbors, dim=-1, largest=False
            ).indices  # (B, k)
            neighbors = points[idx]  # (B, k, 3)
            centered = neighbors - neighbors.mean(dim=1, keepdim=True)  # (B, k, 3)
            cov = centered.transpose(1, 2) @ centered  # (B, 3, 3)
            # ``eigh`` returns eigenvalues in ascending order, so column 0 is
            # the direction of least variance, i.e. the surface normal.
            _, eigvecs = torch.linalg.eigh(cov)
            per_batch_normals.append(eigvecs[:, :, 0])  # (B, 3)

        normals = torch.cat(per_batch_normals, dim=0)
        # arbitrary orientation — flip to point roughly outward from centroid
        centroid = points.mean(dim=0, keepdim=True)
        outward = points - centroid
        flip = (normals * outward).sum(dim=-1, keepdim=True) < 0
        return torch.where(flip, -normals, normals)