nvidia-holoscan · snknitheesh · May 30, 2026 · May 30, 2026 · May 30, 2026 · May 30, 2026
diff --git a/applications/CMakeLists.txt b/applications/CMakeLists.txt
@@ -49,6 +49,8 @@ add_holohub_application(deltacast_receiver DEPENDS
 
 add_holohub_application(depth_anything_v2)
 
+add_holohub_application(depth_to_point_cloud_demo DEPENDS OPERATORS depth_to_point_cloud)
+
 add_subdirectory(distributed)
 
 add_holohub_application(endoscopy_depth_estimation)

diff --git a/applications/depth_to_point_cloud_demo/CMakeLists.txt b/applications/depth_to_point_cloud_demo/CMakeLists.txt
@@ -0,0 +1,33 @@
+# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+project(depth_to_point_cloud_demo NONE)
+
+# Require a Holoscan SDK compatible with version 4.0.0, also searching these prefixes.
+find_package(holoscan 4.0.0 REQUIRED CONFIG
+  PATHS "/opt/nvidia/holoscan" "/workspace/holoscan-sdk/install")
+
+# Smoke test: run the demo for 10 frames and match its output against the regexes below.
+if(BUILD_TESTING)
+  add_test(
+    NAME depth_to_point_cloud_demo_python_test
+    COMMAND python3 ${CMAKE_CURRENT_SOURCE_DIR}/depth_to_point_cloud_demo.py --frames 10
+    WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR})
+
+  set_tests_properties(depth_to_point_cloud_demo_python_test PROPERTIES
+    ENVIRONMENT "PYTHONPATH=${GXF_LIB_DIR}/../python/lib:${CMAKE_BINARY_DIR}/python/lib"
+    PASS_REGULAR_EXPRESSION "valid="
+    FAIL_REGULAR_EXPRESSION "(^|[^a-z])Error;ERROR;Failed")
+endif()
diff --git a/applications/depth_to_point_cloud_demo/README.md b/applications/depth_to_point_cloud_demo/README.md
@@ -0,0 +1,87 @@
+# Depth to Point Cloud Demo
+
+A minimal, hardware-free demo of the [`depth_to_point_cloud`](../../operators/depth_to_point_cloud) operator.
+
+Here **hardware-free** means the input is produced by an on-GPU synthetic data generator
+(`SyntheticDepthGeneratorOp`) rather than a physical sensor: no depth camera, recorded dataset, or
+depth-estimation network is required, so the demo runs in CI on any GPU. The generator emits a
+synthetic organized depth image (a gently tilting plane) plus an aligned RGB image entirely on the
+GPU; the operator deprojects it into an organized `H x W x 3` point cloud, and the demo reports the
+valid-point count and Z range each frame.
+
+## Run
+
+```bash
+# Synthetic source (default, hardware-free, CI-friendly):
+./holohub run depth_to_point_cloud_demo
+# equivalently:
+./holohub run depth_to_point_cloud_demo synthetic
+
+# or directly:
+python3 applications/depth_to_point_cloud_demo/depth_to_point_cloud_demo.py --frames 100
+```
+
+Expected output (per frame):
+
+```text
+[depth_to_point_cloud_demo] points=307200 valid=307200 z=[x.xxx, x.xxx] m colors=(480, 640, 3)
+```
+
+### Sources (`--source` / run modes)
+
+The demo selects its input source with `--source`, exposed as HoloHub run modes:
+
+| Mode / `--source` | Description |
+| --- | --- |
+| `synthetic` (default) | On-GPU synthetic depth + RGB generator. No hardware, runs in CI. |
+| `realsense` | Live Intel RealSense camera (see caveat below). |
+
+### Interactive 3D visualization (`--visualize`)
+
+By default the demo ends in a headless, CI-friendly `PointCloudStatsOp` sink that just reports
+per-frame statistics. Pass `--visualize` to instead render the cloud in `HolovizOp` as 3D points:
+
+```bash
+python3 applications/depth_to_point_cloud_demo/depth_to_point_cloud_demo.py --visualize
+```
+
+With `--visualize`, the organized `H x W x 3` cloud is compacted to `N x 3` with invalid (NaN)
+points dropped before being handed to `HolovizOp` as a `points_3d` primitive. This path needs a
+display and is therefore disabled by default (the CI mode keeps the statistics sink).
+
+## Pipeline
+
+```text
+SyntheticDepthGeneratorOp  --depth-->  DepthToPointCloudOp  --point_cloud-->  PointCloudStatsOp
+                           --color-->                                         (or CloudToHolovizOp --> HolovizOp with --visualize)
+```
+
+## Using a real Intel RealSense camera
+
+`--source realsense` is scaffolded but **not yet runnable from this Python demo**. The
+[`realsense_camera`](../../operators/realsense_camera) operator is currently C++-only (it ships no
+Python bindings), and it emits its `depth_buffer` / `color_buffer` as GXF `VideoBuffer`s, whereas
+`DepthToPointCloudOp` consumes a GXF `Tensor`. Wiring them from Python therefore requires:
+
+1. Python bindings for `realsense_camera` (add an `operators/realsense_camera/python/` module).
+2. A `FormatConverterOp` between the camera and the operator to convert `VideoBuffer` → `Tensor`
+   (and `RGBA8` → `RGB8` for the color path).
+3. Feeding intrinsics — either statically (`fx/fy/cx/cy`) or by consuming the camera's
+   `depth_camera_model` output through the operator's optional `intrinsics` input.
+
+Selecting `--source realsense` today raises a clear `NotImplementedError` pointing here. The wiring,
+once the bindings exist, is:
+
+```python
+from holohub.realsense_camera import RealsenseCameraOp  # requires new Python bindings
+
+camera = RealsenseCameraOp(self, name="camera", allocator=...)
+# camera.depth_buffer / color_buffer are VideoBuffers -> convert to Tensor via FormatConverterOp,
+# then feed DepthToPointCloudOp. RealSense depth is float32 meters (units_transform applied), so
+# use depth_scale=1.0 — not 0.001 (the 0.001 uint16-millimeter value is only for raw Z16 sources).
+```
+
+## Requirements
+
+- Holoscan SDK ≥ 4.0.0, CUDA, CuPy. Builds the `depth_to_point_cloud` operator (declared as a
+  dependency). Platforms: `x86_64`, `aarch64`.
diff --git a/applications/depth_to_point_cloud_demo/depth_to_point_cloud_demo.py b/applications/depth_to_point_cloud_demo/depth_to_point_cloud_demo.py
@@ -0,0 +1,268 @@
+# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Demo for DepthToPointCloudOp.
+
+Selectable input source (``--source``):
+
+* ``synthetic`` (default) generates an organized depth image (a gently tilting plane) plus an
+  aligned RGB image entirely on the GPU. No camera or dataset is required, so the app runs in CI.
+* ``realsense`` is scaffolded for a live Intel RealSense camera but is not yet runnable from Python
+  (the ``realsense_camera`` operator ships no Python bindings and emits ``VideoBuffer``s rather than
+  the ``Tensor`` this operator consumes); selecting it raises ``NotImplementedError``. See README.md.
+
+The deprojected organized point cloud is either summarized by ``PointCloudStatsOp`` (default,
+CI-friendly) or rendered as 3D points by ``HolovizOp`` when ``--visualize`` is passed.
+"""
+
+import argparse
+
+import cupy as cp
+from holoscan.conditions import CountCondition
+from holoscan.core import Application, Operator, OperatorSpec
+from holoscan.operators import HolovizOp
+from holoscan.resources import BlockMemoryPool, MemoryStorageType
+
+from holohub.depth_to_point_cloud import DepthToPointCloudOp
+
+
+class SyntheticDepthGeneratorOp(Operator):
+    """Emit a synthetic float32 depth image (meters) and an aligned uint8 RGB image."""
+
+    def __init__(self, fragment, *args, width=640, height=480, **kwargs):
+        self.width = width
+        self.height = height
+        self.frame = 0
+        ys, xs = cp.meshgrid(
+            cp.arange(height, dtype=cp.float32),
+            cp.arange(width, dtype=cp.float32),
+            indexing="ij",
+        )
+        self._xs = xs
+        self._ys = ys
+        super().__init__(fragment, *args, **kwargs)
+
+    def setup(self, spec: OperatorSpec):
+        spec.output("depth")
+        spec.output("color")
+
+    def compute(self, op_input, op_output, context):
+        t = self.frame * 0.05
+        # A tilted plane in meters: ~1.0 m near the top-left, increasing across the frame,
+        # with a slow global oscillation so successive frames differ.
+        depth = (
+            1.0 + 0.5 * (self._xs / self.width) + 0.4 * (self._ys / self.height) + 0.3 * cp.sin(t)
+        ).astype(cp.float32)
+
+        r = (255.0 * self._xs / self.width).astype(cp.uint8)
+        g = (255.0 * self._ys / self.height).astype(cp.uint8)
+        b = cp.full_like(r, 128)
+        color = cp.ascontiguousarray(cp.stack([r, g, b], axis=-1))  # HxWx3 uint8
+
+        op_output.emit({"depth": depth}, "depth")
+        op_output.emit({"color": color}, "color")
+        self.frame += 1
+
+
+class PointCloudStatsOp(Operator):
+    """Pull the point cloud and report valid-point count and Z range (CI-friendly sink)."""
+
+    def setup(self, spec: OperatorSpec):
+        spec.input("in")
+
+    def compute(self, op_input, op_output, context):
+        msg = op_input.receive("in")
+        pc = cp.asarray(msg["point_cloud"])  # HxWx3 float32
+        z = pc[..., 2]
+        valid = ~cp.isnan(z)
+        n_valid = int(valid.sum().get())
+
+        # The colored path is connected, so a colors tensor must accompany the cloud and
+        # share its H x W footprint (3 uint8 channels).
+        colors = cp.asarray(msg["colors"])  # HxWx3 uint8
+        if colors.shape[:2] != pc.shape[:2] or colors.shape[2] != 3:
+            raise RuntimeError(
+                f"colors shape {colors.shape} does not match cloud {pc.shape[:2]} x 3"
+            )
+
+        if n_valid:
+            zmin = float(z[valid].min().get())
+            zmax = float(z[valid].max().get())
+            print(
+                f"[depth_to_point_cloud_demo] points={pc.shape[0] * pc.shape[1]} "
+                f"valid={n_valid} z=[{zmin:.3f}, {zmax:.3f}] m colors={tuple(colors.shape)}"
+            )
+        else:
+            print("[depth_to_point_cloud_demo] no valid points")
+
+
+class CloudToHolovizOp(Operator):
+    """Compact the organized H x W x 3 cloud to a flat N x 3 of finite points for HolovizOp.
+
+    HolovizOp renders a ``points_3d`` primitive from an ``(N, 3)`` coordinate tensor, so the
+    organized cloud is flattened and the invalid (NaN) pixels are dropped first, as recommended in
+    the README. The compaction stays on the GPU (CuPy), keeping the path device-resident.
+    """
+
+    def setup(self, spec: OperatorSpec):
+        spec.input("in")
+        spec.output("out")
+
+    def compute(self, op_input, op_output, context):
+        msg = op_input.receive("in")
+        pc = cp.asarray(msg["point_cloud"]).reshape(-1, 3)  # (H*W, 3) float32
+        valid = cp.isfinite(pc).all(axis=1)
+        pts = pc[valid]  # (N, 3)
+        # Holoviz expects at least one coordinate; emit a degenerate point if the frame is empty.
+        if pts.shape[0] == 0:
+            pts = cp.zeros((1, 3), dtype=cp.float32)
+        coords = cp.ascontiguousarray(pts.astype(cp.float32))  # (N, 3) as HolovizOp expects
+        op_output.emit({"point_cloud": coords}, "out")
+
+
+class DepthToPointCloudDemoApp(Application):
+    def __init__(self, frames=100, width=640, height=480, source="synthetic", visualize=False):
+        super().__init__()
+        self._frames = frames
+        self._width = width
+        self._height = height
+        self._source = source
+        self._visualize = visualize
+
+    def compose(self):
+        if self._source == "realsense":
+            raise NotImplementedError(
+                "--source realsense is not yet runnable from this Python demo: the "
+                "realsense_camera operator ships no Python bindings and emits VideoBuffers "
+                "rather than the Tensor DepthToPointCloudOp consumes. See the 'Using a real "
+                "Intel RealSense camera' section of README.md for the required wiring "
+                "(Python bindings + FormatConverterOp + intrinsics)."
+            )
+        if self._source != "synthetic":
+            raise ValueError(f"unknown source '{self._source}'")
+
+        generator = SyntheticDepthGeneratorOp(
+            self,
+            CountCondition(self, count=self._frames),
+            name="generator",
+            width=self._width,
+            height=self._height,
+        )
+
+        # Two device tensors per frame (HxWx3 float32 point cloud + HxWx3 uint8 colors) drawn
+        # from this pool; size each block for the larger (float32 XYZ) output and keep enough
+        # blocks for both tensors plus one frame of pipelining headroom.
+        out_blocks = 4
+        block_size = self._width * self._height * 3 * 4  # float32 XYZ is the larger output
+        cloud = DepthToPointCloudOp(
+            self,
+            name="point_cloud",
+            allocator=BlockMemoryPool(
+                self,
+                name="pool",
+                storage_type=MemoryStorageType.DEVICE,
+                block_size=block_size,
+                num_blocks=out_blocks,
+            ),
+            # Pinhole intrinsics for the synthetic camera: square pixels (fx == fy) with the
+            # principal point at the image center. A single focal length is used for both axes
+            # by design; the focal length is independent of the image aspect ratio.
+            fx=float(self._width) * 0.8,
+            fy=float(self._width) * 0.8,
+            cx=(self._width - 1) / 2.0,
+            cy=(self._height - 1) / 2.0,
+            depth_scale=1.0,  # synthetic depth is already in meters
+            depth_min=0.1,
+            depth_max=10.0,
+        )
+
+        self.add_flow(generator, cloud, {("depth", "depth")})
+        self.add_flow(generator, cloud, {("color", "color")})
+
+        if self._visualize:
+            # Compact the organized cloud to N x 3 finite points, then render as 3D points.
+            compact = CloudToHolovizOp(self, name="compact")
+            visualizer = HolovizOp(
+                self,
+                name="holoviz",
+                window_title="depth_to_point_cloud_demo",
+                width=1280,
+                height=720,
+                # The cloud lives in the camera optical frame (x-right, y-down, z-forward),
+                # centered near (0, 0, ~1.5 m). Place the camera in front of and above it (negative
+                # z is "in front", negative y is "up" in this frame) so the tilted plane is framed.
+                camera_eye=[1.5, -1.5, -1.0],
+                camera_look_at=[0.0, 0.0, 1.5],
+                camera_up=[0.0, -1.0, 0.0],
+                tensors=[
+                    dict(
+                        name="point_cloud",
+                        type="points_3d",
+                        color=[0.0, 1.0, 0.0, 1.0],
+                        point_size=3.0,
+                    ),
+                ],
+            )
+            self.add_flow(cloud, compact, {("point_cloud", "in")})
+            self.add_flow(compact, visualizer, {("out", "receivers")})
+        else:
+            sink = PointCloudStatsOp(self, name="stats")
+            self.add_flow(cloud, sink, {("point_cloud", "in")})
+
+
+def main():
+    parser = argparse.ArgumentParser(description="DepthToPointCloudOp demo")
+    parser.add_argument(
+        "-s",
+        "--source",
+        choices=["synthetic", "realsense"],
+        default="synthetic",
+        help=(
+            "Input source. 'synthetic' (default) uses an on-GPU depth+RGB generator (hardware-free, "
+            "CI-friendly); 'realsense' targets a live Intel RealSense camera (see README — not yet "
+            "runnable from Python)."
+        ),
+    )
+    parser.add_argument(
+        "--visualize",
+        action="store_true",
+        help="Render the cloud as 3D points in HolovizOp instead of the statistics sink "
+        "(requires a display).",
+    )
+    parser.add_argument("--frames", type=int, default=100, help="Number of frames to process")
+    parser.add_argument("--width", type=int, default=640)
+    parser.add_argument("--height", type=int, default=480)
+    args = parser.parse_args()
+
+    for name, value in (
+        ("--frames", args.frames),
+        ("--width", args.width),
+        ("--height", args.height),
+    ):
+        if value <= 0:
+            parser.error(f"{name} must be a positive integer (got {value})")
+
+    app = DepthToPointCloudDemoApp(
+        frames=args.frames,
+        width=args.width,
+        height=args.height,
+        source=args.source,
+        visualize=args.visualize,
+    )
+    app.run()
+
+
+if __name__ == "__main__":
+    main()