保存渲染图像和3D重投影#

这个指南与 run_usd_camera.py 脚本一起使用,位于 IsaacLab/source/standalone/tutorials/04_sensors 目录中。

run_usd_camera.py的代码
  1# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
  2# All rights reserved.
  3#
  4# SPDX-License-Identifier: BSD-3-Clause
  5
  6"""
  7This script shows how to use the camera sensor from the Isaac Lab framework.
  8
  9The camera sensor is created and interfaced through the Omniverse Replicator API. However, instead of using
 10the simulator or OpenGL convention for the camera, we use the robotics or ROS convention.
 11
 12.. code-block:: bash
 13
 14    # Usage with GUI
 15    ./isaaclab.sh -p source/standalone/tutorials/04_sensors/run_usd_camera.py --enable_cameras
 16
 17    # Usage with headless
 18    ./isaaclab.sh -p source/standalone/tutorials/04_sensors/run_usd_camera.py --headless --enable_cameras
 19
 20"""
 21
 22"""Launch Isaac Sim Simulator first."""
 23
 24import argparse
 25
 26from omni.isaac.lab.app import AppLauncher
 27
 28# add argparse arguments
 29parser = argparse.ArgumentParser(description="This script demonstrates how to use the camera sensor.")
 30parser.add_argument(
 31    "--draw",
 32    action="store_true",
 33    default=False,
 34    help="Draw the pointcloud from camera at index specified by ``--camera_id``.",
 35)
 36parser.add_argument(
 37    "--save",
 38    action="store_true",
 39    default=False,
 40    help="Save the data from camera at index specified by ``--camera_id``.",
 41)
 42parser.add_argument(
 43    "--camera_id",
 44    type=int,
 45    choices={0, 1},
 46    default=0,
 47    help=(
 48        "The camera ID to use for displaying points or saving the camera data. Default is 0."
 49        " The viewport will always initialize with the perspective of camera 0."
 50    ),
 51)
 52# append AppLauncher cli args
 53AppLauncher.add_app_launcher_args(parser)
 54# parse the arguments
 55args_cli = parser.parse_args()
 56
 57# launch omniverse app
 58app_launcher = AppLauncher(args_cli)
 59simulation_app = app_launcher.app
 60
 61"""Rest everything follows."""
 62
 63import numpy as np
 64import os
 65import random
 66import torch
 67
 68import omni.isaac.core.utils.prims as prim_utils
 69import omni.replicator.core as rep
 70
 71import omni.isaac.lab.sim as sim_utils
 72from omni.isaac.lab.assets import RigidObject, RigidObjectCfg
 73from omni.isaac.lab.markers import VisualizationMarkers
 74from omni.isaac.lab.markers.config import RAY_CASTER_MARKER_CFG
 75from omni.isaac.lab.sensors.camera import Camera, CameraCfg
 76from omni.isaac.lab.sensors.camera.utils import create_pointcloud_from_depth
 77from omni.isaac.lab.utils import convert_dict_to_backend
 78
 79
 80def define_sensor() -> Camera:
 81    """Defines the camera sensor to add to the scene."""
 82    # Setup camera sensor
 83    # In contrast to the ray-cast camera, we spawn the prim at these locations.
 84    # This means the camera sensor will be attached to these prims.
 85    prim_utils.create_prim("/World/Origin_00", "Xform")
 86    prim_utils.create_prim("/World/Origin_01", "Xform")
 87    camera_cfg = CameraCfg(
 88        prim_path="/World/Origin_.*/CameraSensor",
 89        update_period=0,
 90        height=480,
 91        width=640,
 92        data_types=[
 93            "rgb",
 94            "distance_to_image_plane",
 95            "normals",
 96            "semantic_segmentation",
 97            "instance_segmentation_fast",
 98            "instance_id_segmentation_fast",
 99        ],
100        colorize_semantic_segmentation=True,
101        colorize_instance_id_segmentation=True,
102        colorize_instance_segmentation=True,
103        spawn=sim_utils.PinholeCameraCfg(
104            focal_length=24.0, focus_distance=400.0, horizontal_aperture=20.955, clipping_range=(0.1, 1.0e5)
105        ),
106    )
107    # Create camera
108    camera = Camera(cfg=camera_cfg)
109
110    return camera
111
112
113def design_scene() -> dict:
114    """Design the scene."""
115    # Populate scene
116    # -- Ground-plane
117    cfg = sim_utils.GroundPlaneCfg()
118    cfg.func("/World/defaultGroundPlane", cfg)
119    # -- Lights
120    cfg = sim_utils.DistantLightCfg(intensity=3000.0, color=(0.75, 0.75, 0.75))
121    cfg.func("/World/Light", cfg)
122
123    # Create a dictionary for the scene entities
124    scene_entities = {}
125
126    # Xform to hold objects
127    prim_utils.create_prim("/World/Objects", "Xform")
128    # Random objects
129    for i in range(8):
130        # sample random position
131        position = np.random.rand(3) - np.asarray([0.05, 0.05, -1.0])
132        position *= np.asarray([1.5, 1.5, 0.5])
133        # sample random color
134        color = (random.random(), random.random(), random.random())
135        # choose random prim type
136        prim_type = random.choice(["Cube", "Cone", "Cylinder"])
137        common_properties = {
138            "rigid_props": sim_utils.RigidBodyPropertiesCfg(),
139            "mass_props": sim_utils.MassPropertiesCfg(mass=5.0),
140            "collision_props": sim_utils.CollisionPropertiesCfg(),
141            "visual_material": sim_utils.PreviewSurfaceCfg(diffuse_color=color, metallic=0.5),
142            "semantic_tags": [("class", prim_type)],
143        }
144        if prim_type == "Cube":
145            shape_cfg = sim_utils.CuboidCfg(size=(0.25, 0.25, 0.25), **common_properties)
146        elif prim_type == "Cone":
147            shape_cfg = sim_utils.ConeCfg(radius=0.1, height=0.25, **common_properties)
148        elif prim_type == "Cylinder":
149            shape_cfg = sim_utils.CylinderCfg(radius=0.25, height=0.25, **common_properties)
150        # Rigid Object
151        obj_cfg = RigidObjectCfg(
152            prim_path=f"/World/Objects/Obj_{i:02d}",
153            spawn=shape_cfg,
154            init_state=RigidObjectCfg.InitialStateCfg(pos=position),
155        )
156        scene_entities[f"rigid_object{i}"] = RigidObject(cfg=obj_cfg)
157
158    # Sensors
159    camera = define_sensor()
160
161    # return the scene information
162    scene_entities["camera"] = camera
163    return scene_entities
164
165
166def run_simulator(sim: sim_utils.SimulationContext, scene_entities: dict):
167    """Run the simulator."""
168    # extract entities for simplified notation
169    camera: Camera = scene_entities["camera"]
170
171    # Create replicator writer
172    output_dir = os.path.join(os.path.dirname(os.path.realpath(__file__)), "output", "camera")
173    rep_writer = rep.BasicWriter(
174        output_dir=output_dir,
175        frame_padding=0,
176        colorize_instance_id_segmentation=camera.cfg.colorize_instance_id_segmentation,
177        colorize_instance_segmentation=camera.cfg.colorize_instance_segmentation,
178        colorize_semantic_segmentation=camera.cfg.colorize_semantic_segmentation,
179    )
180
181    # Camera positions, targets, orientations
182    camera_positions = torch.tensor([[2.5, 2.5, 2.5], [-2.5, -2.5, 2.5]], device=sim.device)
183    camera_targets = torch.tensor([[0.0, 0.0, 0.0], [0.0, 0.0, 0.0]], device=sim.device)
184    # These orientations are in ROS-convention, and will position the cameras to view the origin
185    camera_orientations = torch.tensor(  # noqa: F841
186        [[-0.1759, 0.3399, 0.8205, -0.4247], [-0.4247, 0.8205, -0.3399, 0.1759]], device=sim.device
187    )
188
189    # Set pose: There are two ways to set the pose of the camera.
190    # -- Option-1: Set pose using view
191    camera.set_world_poses_from_view(camera_positions, camera_targets)
192    # -- Option-2: Set pose using ROS
193    # camera.set_world_poses(camera_positions, camera_orientations, convention="ros")
194
195    # Index of the camera to use for visualization and saving
196    camera_index = args_cli.camera_id
197
198    # Create the markers for the --draw option outside of is_running() loop
199    if sim.has_gui() and args_cli.draw:
200        cfg = RAY_CASTER_MARKER_CFG.replace(prim_path="/Visuals/CameraPointCloud")
201        cfg.markers["hit"].radius = 0.002
202        pc_markers = VisualizationMarkers(cfg)
203
204    # Simulate physics
205    while simulation_app.is_running():
206        # Step simulation
207        sim.step()
208        # Update camera data
209        camera.update(dt=sim.get_physics_dt())
210
211        # Print camera info
212        print(camera)
213        if "rgb" in camera.data.output.keys():
214            print("Received shape of rgb image        : ", camera.data.output["rgb"].shape)
215        if "distance_to_image_plane" in camera.data.output.keys():
216            print("Received shape of depth image      : ", camera.data.output["distance_to_image_plane"].shape)
217        if "normals" in camera.data.output.keys():
218            print("Received shape of normals          : ", camera.data.output["normals"].shape)
219        if "semantic_segmentation" in camera.data.output.keys():
220            print("Received shape of semantic segm.   : ", camera.data.output["semantic_segmentation"].shape)
221        if "instance_segmentation_fast" in camera.data.output.keys():
222            print("Received shape of instance segm.   : ", camera.data.output["instance_segmentation_fast"].shape)
223        if "instance_id_segmentation_fast" in camera.data.output.keys():
224            print("Received shape of instance id segm.: ", camera.data.output["instance_id_segmentation_fast"].shape)
225        print("-------------------------------")
226
227        # Extract camera data
228        if args_cli.save:
229            # Save images from camera at camera_index
230            # note: BasicWriter only supports saving data in numpy format, so we need to convert the data to numpy.
231            single_cam_data = convert_dict_to_backend(
232                {k: v[camera_index] for k, v in camera.data.output.items()}, backend="numpy"
233            )
234
235            # Extract the other information
236            single_cam_info = camera.data.info[camera_index]
237
238            # Pack data back into replicator format to save them using its writer
239            rep_output = {"annotators": {}}
240            for key, data, info in zip(single_cam_data.keys(), single_cam_data.values(), single_cam_info.values()):
241                if info is not None:
242                    rep_output["annotators"][key] = {"render_product": {"data": data, **info}}
243                else:
244                    rep_output["annotators"][key] = {"render_product": {"data": data}}
245            # Save images
246            # Note: We need to provide On-time data for Replicator to save the images.
247            rep_output["trigger_outputs"] = {"on_time": camera.frame[camera_index]}
248            rep_writer.write(rep_output)
249
250        # Draw pointcloud if there is a GUI and --draw has been passed
251        if sim.has_gui() and args_cli.draw and "distance_to_image_plane" in camera.data.output.keys():
252            # Derive pointcloud from camera at camera_index
253            pointcloud = create_pointcloud_from_depth(
254                intrinsic_matrix=camera.data.intrinsic_matrices[camera_index],
255                depth=camera.data.output[camera_index]["distance_to_image_plane"],
256                position=camera.data.pos_w[camera_index],
257                orientation=camera.data.quat_w_ros[camera_index],
258                device=sim.device,
259            )
260
261            # In the first few steps, things are still being instanced and Camera.data
262            # can be empty. If we attempt to visualize an empty pointcloud it will crash
263            # the sim, so we check that the pointcloud is not empty.
264            if pointcloud.size()[0] > 0:
265                pc_markers.visualize(translations=pointcloud)
266
267
268def main():
269    """Main function."""
270    # Load simulation context
271    sim_cfg = sim_utils.SimulationCfg(device=args_cli.device)
272    sim = sim_utils.SimulationContext(sim_cfg)
273    # Set main camera
274    sim.set_camera_view([2.5, 2.5, 2.5], [0.0, 0.0, 0.0])
275    # design the scene
276    scene_entities = design_scene()
277    # Play simulator
278    sim.reset()
279    # Now we are ready!
280    print("[INFO]: Setup complete...")
281    # Run simulator
282    run_simulator(sim, scene_entities)
283
284
285if __name__ == "__main__":
286    # run the main function
287    main()
288    # close sim app
289    simulation_app.close()

使用复制器基本写入器进行保存#

为了保存摄像机输出,我们使用Omniverse Replicator中的基本写入类。该类允许我们以numpy格式保存图像。有关基本写入器的更多信息,请参阅 文档

    rep_writer = rep.BasicWriter(
        output_dir=output_dir,
        frame_padding=0,
        colorize_instance_id_segmentation=camera.cfg.colorize_instance_id_segmentation,
        colorize_instance_segmentation=camera.cfg.colorize_instance_segmentation,
        colorize_semantic_segmentation=camera.cfg.colorize_semantic_segmentation,
    )

在模拟器运行时,图像可以保存到已定义的文件夹中。由于BasicWriter仅支持使用NumPy格式保存数据,因此我们首先需要将PyTorch传感器转换为NumPy数组,然后将其打包到字典中。

            # Save images from camera at camera_index
            # note: BasicWriter only supports saving data in numpy format, so we need to convert the data to numpy.
            single_cam_data = convert_dict_to_backend(
                {k: v[camera_index] for k, v in camera.data.output.items()}, backend="numpy"
            )

            # Extract the other information
            single_cam_info = camera.data.info[camera_index]

完成此步骤后,我们可以使用BasicWriter保存图像。

            # Pack data back into replicator format to save them using its writer
            rep_output = {"annotators": {}}
            for key, data, info in zip(single_cam_data.keys(), single_cam_data.values(), single_cam_info.values()):
                if info is not None:
                    rep_output["annotators"][key] = {"render_product": {"data": data, **info}}
                else:
                    rep_output["annotators"][key] = {"render_product": {"data": data}}
            # Save images
            # Note: We need to provide On-time data for Replicator to save the images.
            rep_output["trigger_outputs"] = {"on_time": camera.frame[camera_index]}
            rep_writer.write(rep_output)

投影到3D空间#

我们包含实用程序来将深度图像投影到3D空间。重新投影操作使用PyTorch操作来进行,这可以加快计算速度。

from omni.isaac.lab.utils.math import transform_points, unproject_depth

# Pointcloud in world frame
points_3d_cam = unproject_depth(
   camera.data.output["distance_to_image_plane"], camera.data.intrinsic_matrices
)

points_3d_world = transform_points(points_3d_cam, camera.data.pos_w, camera.data.quat_w_ros)

或者,我们可以使用 omni.isaac.lab.sensors.camera.utils.create_pointcloud_from_depth() 函数从深度图像创建点云,并将其转换为世界框架。

            # Derive pointcloud from camera at camera_index
            pointcloud = create_pointcloud_from_depth(
                intrinsic_matrix=camera.data.intrinsic_matrices[camera_index],
                depth=camera.data.output[camera_index]["distance_to_image_plane"],
                position=camera.data.pos_w[camera_index],
                orientation=camera.data.quat_w_ros[camera_index],
                device=sim.device,
            )

使用Isaac Sim中的 omni.isaac.debug_draw 扩展,可以将结果点云可视化。这样可以轻松在3D空间中可视化点云。

            # In the first few steps, things are still being instanced and Camera.data
            # can be empty. If we attempt to visualize an empty pointcloud it will crash
            # the sim, so we check that the pointcloud is not empty.
            if pointcloud.size()[0] > 0:
                pc_markers.visualize(translations=pointcloud)

执行脚本#

要运行附带的脚本,请执行以下命令:

# Usage with saving and drawing
./isaaclab.sh -p source/standalone/tutorials/04_sensors/run_usd_camera.py --save --draw --enable_cameras

# Usage with saving only in headless mode
./isaaclab.sh -p source/standalone/tutorials/04_sensors/run_usd_camera.py --save --headless --enable_cameras

模拟应该开始运行,你可以观察到不同的物体掉落。在 IsaacLab/source/standalone/tutorials/04_sensors 目录中会创建一个输出文件夹,其中将保存图像。此外,你应该看到绘制在视口上的3D空间中的点云。

要停止模拟,关闭窗口,或在终端中使用 Ctrl+C