Source code for mani_skill.envs.scene

from dataclasses import dataclass
from functools import cached_property
from typing import Any, Mapping, Optional, Tuple, Union, cast

import numpy as np
import sapien
import sapien.physx as physx
import sapien.render
import torch
from sapien.render import RenderCameraComponent

import mani_skill.render.utils as render_utils
from mani_skill.envs.utils.system.backend import BackendInfo
from mani_skill.render import SAPIEN_RENDER_SYSTEM
from mani_skill.sensors.base_sensor import BaseSensor
from mani_skill.sensors.camera import Camera
from mani_skill.utils import common, sapien_utils
from mani_skill.utils.structs.actor import Actor
from mani_skill.utils.structs.articulation import Articulation
from mani_skill.utils.structs.drive import Drive
from mani_skill.utils.structs.link import Link
from mani_skill.utils.structs.pose import Pose
from mani_skill.utils.structs.render_camera import RenderCamera
from mani_skill.utils.structs.types import Array, Device, SimConfig

# try and determine which render system is used by the installed sapien package
if SAPIEN_RENDER_SYSTEM == "3.1":
    from sapien.wrapper.scene import (
        get_camera_shader_pack,  # pyright: ignore[reportAttributeAccessIssue]
    )


[docs]
    GlobalShaderPack = None

    sapien.render.RenderCameraGroup = "oldtype"


@dataclass

[docs]
class StateDictRegistry:

[docs]
    actors: dict[str, Actor]


[docs]
    articulations: dict[str, Articulation]





[docs]
class ManiSkillScene:
    """
    Class that manages a list of sub-scenes (sapien.Scene). In CPU simulation there should only be one sub-scene.
    In GPU simulation, there can be many sub-scenes, and this wrapper ensures that use calls to many of the original sapien.Scene API
    are applied to all sub-scenes. This includes calls to change object poses, velocities, drive targets etc.

    This wrapper also helps manage GPU states if GPU simulation is used
    """

    def __init__(
        self,
        sub_scenes: Optional[list[sapien.Scene]] = None,
        sim_config: SimConfig = SimConfig(),
        device: Optional[Device] = None,
        parallel_in_single_scene: bool = False,
        backend: Optional[BackendInfo] = None,
    ):
        assert device is not None, "device argument is required"
        assert backend is not None, "backend argument is required"
        if sub_scenes is None:
            sub_scenes = [sapien.Scene()]

[docs]
        self.sub_scenes = sub_scenes


[docs]
        self.px: physx.PhysxSystem = self.sub_scenes[0].physx_system

        assert all(
            isinstance(s.physx_system, type(self.px)) for s in self.sub_scenes
        ), "all sub-scenes must use the same simulation backend"

[docs]
        self.gpu_sim_enabled = (
            True if isinstance(self.px, physx.PhysxGpuSystem) else False
        )

        """whether the sub scenes are using the GPU or CPU backend"""

[docs]
        self.sim_config = sim_config


[docs]
        self._gpu_sim_initialized = False

        if isinstance(device, str):
            device = torch.device(device)

[docs]
        self.device = device


[docs]
        self.backend = backend  # references the backend object stored in BaseEnv class



[docs]
        self.camera_groups: dict[str, sapien.render.RenderCameraGroup] = dict()


[docs]
        self.render_system_group: sapien.render.RenderSystemGroup = (
            None  # pyright: ignore[reportAttributeAccessIssue]
        )



[docs]
        self.actors: dict[str, Actor] = dict()


[docs]
        self.articulations: dict[str, Articulation] = dict()



[docs]
        self.actor_views: dict[str, Actor] = dict()

        """views of actors in any sub-scenes created by using Actor.merge and queryable as if it were a single Actor"""

[docs]
        self.articulation_views: dict[str, Articulation] = dict()

        """views of articulations in any sub-scenes created by using Articulation.merge and queryable as if it were a single Articulation"""


[docs]
        self.sensors: dict[str, BaseSensor] = dict()


[docs]
        self.human_render_cameras: dict[str, Camera] = dict()


[docs]
        self._sensors_initialized = False


[docs]
        self._human_render_cameras_initialized = False



[docs]
        self._reset_mask = torch.ones(
            len(sub_scenes), dtype=torch.bool, device=self.device
        )

        """Used internally by various objects like Actor, Link, and Controllers to auto mask out sub-scenes so they do not get modified during
        partial env resets"""


[docs]
        self._needs_fetch = False

        """Used internally to raise some errors ahead of time of when there may be undefined behaviors"""


[docs]
        self.pairwise_contact_queries: dict[
            str, physx.PhysxGpuContactPairImpulseQuery
        ] = dict()

        """dictionary mapping pairwise contact query keys to GPU contact queries. Used in GPU simulation only to cache queries as
        query creation will pause any GPU sim computation"""

[docs]
        self._pairwise_contact_query_unique_hashes: dict[str, int] = dict()

        """maps keys in self.pairwise_contact_queries to unique hashes dependent on the actual objects involved in the query.
        This is used to determine automatically when to rebuild contact queries as keys for self.pairwise_contact_queries are kept
        non-unique between episode resets in order to be easily rebuilt and deallocate old queries. This essentially acts as a way
        to invalidate the cached queries."""


[docs]
        self.parallel_in_single_scene: bool = parallel_in_single_scene

        """Whether rendering all parallel scenes in the viewer/gui is enabled"""


[docs]
        self.state_dict_registry: StateDictRegistry = StateDictRegistry(
            actors=dict(), articulations=dict()
        )

        """state dict registry that map actor/articulation names to Actor/Articulation struct references. Only these structs are used for the environment state"""


[docs]
    def can_render(self):
        """Whether or not this Scene object permits rendering, depending on the rendering device selected"""
        return render_utils.can_render(self.backend.render_device)


    # -------------------------------------------------------------------------- #
    # Functions from sapien.Scene
    # -------------------------------------------------------------------------- #
    @property

[docs]
    def timestep(self):
        """The current simulation timestep"""
        return self.px.timestep


    @timestep.setter
    def timestep(self, timestep):
        self.px.timestep = timestep


[docs]
    def set_timestep(self, timestep):
        """Sets the current simulation timestep"""
        self.timestep = timestep



[docs]
    def get_timestep(self):
        """Returns the current simulation timestep"""
        return self.timestep



[docs]
    def create_actor_builder(self):
        """Creates an ActorBuilder object that can be used to build actors in this scene"""
        from ..utils.building.actor_builder import ActorBuilder

        return ActorBuilder().set_scene(self)



[docs]
    def create_articulation_builder(self):
        """Creates an ArticulationBuilder object that can be used to build articulations in this scene"""
        from ..utils.building.articulation_builder import ArticulationBuilder

        return ArticulationBuilder().set_scene(self)



[docs]
    def create_urdf_loader(self):
        """Creates a URDFLoader object that can be used to load URDF files into this scene"""
        from ..utils.building.urdf_loader import URDFLoader

        loader = URDFLoader()
        loader.set_scene(self)
        return loader



[docs]
    def create_mjcf_loader(self):
        """Creates a MJCFLoader object that can be used to load MJCF files into this scene"""
        from ..utils.building.mjcf_loader import MJCFLoader

        loader = MJCFLoader()
        loader.set_scene(self)
        return loader


    # def create_physical_material(
    #     self, static_friction: float, dynamic_friction: float, restitution: float
    # ):
    #     return physx.PhysxMaterial(static_friction, dynamic_friction, restitution)


[docs]
    def remove_actor(self, actor: Actor):
        """Removes an actor from the scene. Only works in CPU simulation."""
        if self.gpu_sim_enabled:
            raise NotImplementedError(
                "Cannot remove actors after creating them in GPU sim at the moment"
            )
        else:
            self.sub_scenes[0].remove_entity(actor._objs[0])
            self.actors.pop(actor.name)



[docs]
    def remove_articulation(self, articulation: Articulation):
        """Removes an articulation from the scene. Only works in CPU simulation."""
        if self.gpu_sim_enabled:
            raise NotImplementedError(
                "Cannot remove articulations after creating them in GPU sim at the moment"
            )
        else:
            entities = [l.entity for l in articulation._objs[0].links]
            for e in entities:
                self.sub_scenes[0].remove_entity(e)
            self.articulations.pop(articulation.name)



[docs]
    def add_camera(
        self,
        name,
        pose,
        width,
        height,
        near,
        far,
        fovy: Union[float, list, None] = None,
        intrinsic: Union[Array, None] = None,
        mount: Union[Actor, Link, None] = None,
    ) -> RenderCamera:
        """Add's a (mounted) camera to the scene"""
        if SAPIEN_RENDER_SYSTEM == "3.1":
            return self._sapien_31_add_camera(
                name, pose, width, height, near, far, fovy, intrinsic, mount
            )
        else:
            return self._sapien_add_camera(
                name, pose, width, height, near, far, fovy, intrinsic, mount
            )



[docs]
    def _sapien_add_camera(
        self,
        name,
        pose,
        width,
        height,
        near,
        far,
        fovy: Union[float, list, None] = None,
        intrinsic: Union[Array, None] = None,
        mount: Union[Actor, Link, None] = None,
    ) -> RenderCamera:
        """internal helper function to add (mounted) cameras"""
        cameras = []
        pose = Pose.create(pose)
        # TODO (stao): support scene idxs property for cameras in the future
        # move intrinsic to np and batch intrinsic if it is not batched
        if intrinsic is not None:
            intrinsic = common.to_numpy(intrinsic)
            if len(intrinsic.shape) == 2:
                intrinsic = intrinsic[None, :]
                if len(self.sub_scenes) > 1:
                    # repeat the intrinsic along batch dim
                    intrinsic = intrinsic.repeat(len(self.sub_scenes), 0)
            assert len(intrinsic) == len(
                self.sub_scenes
            ), "intrinsic matrix batch dim not equal to the number of sub-scenes"
        for i, scene in enumerate(self.sub_scenes):
            # Create camera component
            camera = RenderCameraComponent(width, height)
            if fovy is not None:
                if isinstance(fovy, float) or isinstance(fovy, int):
                    camera.set_fovy(fovy, compute_x=True)
                else:
                    camera.set_fovy(fovy[i], compute_x=True)
            elif intrinsic is not None:
                camera.set_focal_lengths(intrinsic[i, 0, 0], intrinsic[i, 1, 1])
                camera.set_principal_point(intrinsic[i, 0, 2], intrinsic[i, 1, 2])
            if isinstance(near, float) or isinstance(near, int):
                camera.near = near
            else:
                camera.near = near[i]
            if isinstance(far, float) or isinstance(far, int):
                camera.far = far
            else:
                camera.far = far[i]

            # mount camera to actor/link
            if mount is not None:
                if self.gpu_sim_enabled:
                    if isinstance(mount, Actor):
                        camera.set_gpu_pose_batch_index(
                            cast(
                                physx.PhysxRigidDynamicComponent,
                                mount._objs[i].find_component_by_type(
                                    physx.PhysxRigidDynamicComponent
                                ),
                            ).gpu_pose_index
                        )
                    elif isinstance(mount, Link):
                        camera.set_gpu_pose_batch_index(mount._objs[i].gpu_pose_index)
                    else:
                        raise ValueError(
                            f"Tried to mount camera on object of type {mount.__class__}"
                        )
                if isinstance(mount, Link):
                    mount._objs[i].entity.add_component(camera)
                else:
                    mount._objs[i].add_component(camera)
            else:
                camera_mount = sapien.Entity()
                camera_mount.add_component(camera)
                scene.add_entity(camera_mount)
                camera_mount.name = f"scene-{i}_{name}"
            if len(pose) == 1:
                camera.local_pose = pose.sp
            else:
                camera.local_pose = pose[i].sp
            camera.name = f"scene-{i}_{name}"
            cameras.append(camera)
        return RenderCamera.create(cameras, self, mount=mount)



[docs]
    def _sapien_31_add_camera(
        self,
        name,
        pose,
        width,
        height,
        near,
        far,
        fovy: Union[float, list, None] = None,
        intrinsic: Union[Array, None] = None,
        mount: Union[Actor, Link, None] = None,
    ) -> RenderCamera:
        """internal helper function to add (mounted) cameras"""
        cameras = []
        pose = Pose.create(pose)
        # TODO (stao): support scene idxs property for cameras in the future
        # move intrinsic to np and batch intrinsic if it is not batched
        if intrinsic is not None:
            intrinsic = common.to_numpy(intrinsic)
            if len(intrinsic.shape) == 2:
                intrinsic = intrinsic[None, :]
                if len(self.sub_scenes) > 1:
                    # repeat the intrinsic along batch dim
                    intrinsic = intrinsic.repeat(len(self.sub_scenes), 0)
            assert len(intrinsic) == len(
                self.sub_scenes
            ), "intrinsic matrix batch dim not equal to the number of sub-scenes"

        for i, scene in enumerate(self.sub_scenes):
            # Create camera component
            camera = RenderCameraComponent(
                width, height, GlobalShaderPack or get_camera_shader_pack()
            )
            if fovy is not None:
                if isinstance(fovy, (float, int)):
                    camera.set_fovy(fovy, compute_x=True)
                else:
                    camera.set_fovy(fovy[i], compute_x=True)
            elif intrinsic is not None:
                camera.set_focal_lengths(intrinsic[i, 0, 0], intrinsic[i, 1, 1])
                camera.set_principal_point(intrinsic[i, 0, 2], intrinsic[i, 1, 2])
            if isinstance(near, (float, int)):
                camera.near = near
            else:
                camera.near = near[i]
            if isinstance(far, (float, int)):
                camera.far = far
            else:
                camera.far = far[i]

            # mount camera to actor/link
            if mount is not None:
                if isinstance(mount, Link):
                    mount._objs[i].entity.add_component(camera)
                else:
                    mount._objs[i].add_component(camera)
            else:
                camera_mount = sapien.Entity()
                camera_mount.set_pose(sapien.Pose([0, 0, 0]))
                camera_mount.add_component(camera)
                camera_mount.name = f"scene-{i}_{name}"
                scene.add_entity(camera_mount)
            if len(pose) == 1:
                camera.local_pose = pose.sp
            else:
                camera.local_pose = pose[i].sp
            camera.name = f"scene-{i}_{name}"
            cameras.append(camera)
            scene.update_render()
        return RenderCamera.create(cameras, self, mount=mount)


    # def remove_camera(self, camera):
    #     self.remove_entity(camera.entity)

    # def get_cameras(self):
    #     return self.render_system.cameras

    # def get_mounted_cameras(self):
    #     return self.get_cameras()


[docs]
    def step(self):
        self.px.step()



[docs]
    def update_render(
        self, update_sensors: bool = True, update_human_render_cameras: bool = True
    ):
        """
        Updates the renderer based on the current simulation state. Note that on the first call if a sensor/human render camera is required to be updated,
        GPU memory will be allocated for the sensor/human render camera respectively.

        Arguments:
            update_sensors (bool): Whether to update the sensors.
            update_human_render_cameras (bool): Whether to update the human render cameras.
        """
        if SAPIEN_RENDER_SYSTEM == "3.1":
            self._sapien_31_update_render(
                update_sensors=update_sensors,
                update_human_render_cameras=update_human_render_cameras,
            )
        else:
            self._sapien_update_render(
                update_sensors=update_sensors,
                update_human_render_cameras=update_human_render_cameras,
            )



[docs]
    def _sapien_update_render(
        self, update_sensors: bool = True, update_human_render_cameras: bool = True
    ):
        # note that this design is such that no GPU memory is allocated for memory unless requested for, which can occur
        # after the e.g. physx GPU simulation is initialized.
        if self.gpu_sim_enabled:
            if not self.parallel_in_single_scene:
                if self.render_system_group is None:
                    self._setup_gpu_rendering()
                if not self._sensors_initialized and update_sensors:
                    self._gpu_setup_sensors(self.sensors)
                    self._sensors_initialized = True
                if (
                    not self._human_render_cameras_initialized
                    and update_human_render_cameras
                ):
                    self._gpu_setup_sensors(self.human_render_cameras)
                    self._human_render_cameras_initialized = True
                self.render_system_group.update_render()
            else:
                assert isinstance(self.px, physx.PhysxGpuSystem)
                self.px.sync_poses_gpu_to_cpu()
                self.sub_scenes[0].update_render()
        else:
            self.sub_scenes[0].update_render()



[docs]
    def _sapien_31_update_render(
        self, update_sensors: bool = True, update_human_render_cameras: bool = True
    ):
        if self.gpu_sim_enabled:
            if self.render_system_group is None:
                # TODO (stao): for new render system support the parallel in single scene rendering option
                for scene in self.sub_scenes:
                    scene.update_render()
                self._setup_gpu_rendering()
            if not self._sensors_initialized and update_sensors:
                self._gpu_setup_sensors(self.sensors)
                self._sensors_initialized = True
            if (
                not self._human_render_cameras_initialized
                and update_human_render_cameras
            ):
                self._gpu_setup_sensors(self.human_render_cameras)
                self._human_render_cameras_initialized = True

            manager: sapien.render.GpuSyncManager = (  # pyright: ignore[reportAttributeAccessIssue]
                self.render_system_group
            )
            manager.sync()
        else:
            self.sub_scenes[0].update_render()



[docs]
    def get_contacts(self):
        if self.gpu_sim_enabled:
            raise NotImplementedError(
                "get_contacts is not available for GPU simulation"
            )
        else:
            assert isinstance(self.px, physx.PhysxCpuSystem)
            return self.px.get_contacts()



[docs]
    def get_all_actors(self):
        """
        Returns list of all sapien.Entity objects that have rigid dynamic and static components across all sub scenes
        """
        return [
            c.entity
            for c in self.px.rigid_dynamic_components + self.px.rigid_static_components
        ]



[docs]
    def get_all_articulations(self):
        """
        Returns list of all physx articulation objects across all sub scenes
        """
        return [
            c.articulation for c in self.px.articulation_link_components if c.is_root
        ]



[docs]
    def create_drive(
        self,
        body0: Union[Actor, Link],
        pose0: Union[sapien.Pose, Pose],
        body1: Union[Actor, Link],
        pose1: Union[sapien.Pose, Pose],
    ):
        # body0 and body1 should be in parallel.
        return Drive.create_from_actors_or_links(
            self, body0, pose0, body1, pose1, body0._scene_idxs
        )


    # def create_connection(
    #     self,
    #     body0: Optional[Union[sapien.Entity, physx.PhysxRigidBaseComponent]],
    #     pose0: sapien.Pose,
    #     body1: Union[sapien.Entity, physx.PhysxRigidBaseComponent],
    #     pose1: sapien.Pose,
    # ):
    #     if body0 is None:
    #         c0 = None
    #     elif isinstance(body0, sapien.Entity):
    #         c0 = next(
    #             c
    #             for c in body0.components
    #             if isinstance(c, physx.PhysxRigidBaseComponent)
    #         )
    #     else:
    #         c0 = body0

    #     assert body1 is not None
    #     if isinstance(body1, sapien.Entity):
    #         e1 = body1
    #         c1 = next(
    #             c
    #             for c in body1.components
    #             if isinstance(c, physx.PhysxRigidBaseComponent)
    #         )
    #     else:
    #         e1 = body1.entity
    #         c1 = body1

    #     connection = physx.PhysxDistanceJointComponent(c1)
    #     connection.parent = c0
    #     connection.pose_in_child = pose1
    #     connection.pose_in_parent = pose0
    #     e1.add_component(connection)
    #     connection.set_limit(0, 0)
    #     return connection

    # def create_gear(
    #     self,
    #     body0: Optional[Union[sapien.Entity, physx.PhysxRigidBaseComponent]],
    #     pose0: sapien.Pose,
    #     body1: Union[sapien.Entity, physx.PhysxRigidBaseComponent],
    #     pose1: sapien.Pose,
    # ):
    #     if body0 is None:
    #         c0 = None
    #     elif isinstance(body0, sapien.Entity):
    #         c0 = next(
    #             c
    #             for c in body0.components
    #             if isinstance(c, physx.PhysxRigidBaseComponent)
    #         )
    #     else:
    #         c0 = body0

    #     assert body1 is not None
    #     if isinstance(body1, sapien.Entity):
    #         e1 = body1
    #         c1 = next(
    #             c
    #             for c in body1.components
    #             if isinstance(c, physx.PhysxRigidBaseComponent)
    #         )
    #     else:
    #         e1 = body1.entity
    #         c1 = body1

    #     gear = physx.PhysxGearComponent(c1)
    #     gear.parent = c0
    #     gear.pose_in_child = pose1
    #     gear.pose_in_parent = pose0
    #     e1.add_component(gear)
    #     return gear

    # @property
    # def render_id_to_visual_name(self):
    #     # TODO
    #     return

    @property

[docs]
    def ambient_light(self):
        return self.sub_scenes[0].ambient_light


    @ambient_light.setter
    def ambient_light(self, color):
        for scene in self.sub_scenes:
            scene.render_system.ambient_light = color


[docs]
    def set_ambient_light(self, color):
        self.ambient_light = color



[docs]
    def add_point_light(
        self,
        position,
        color,
        shadow=False,
        shadow_near=0.1,
        shadow_far=10.0,
        shadow_map_size=2048,
        scene_idxs: Optional[list[int]] = None,
    ):
        if scene_idxs is None:
            scene_idxs = list(range(len(self.sub_scenes)))
        for scene_idx in scene_idxs:
            if self.parallel_in_single_scene:
                scene = self.sub_scenes[0]
            else:
                scene = self.sub_scenes[scene_idx]
            entity = sapien.Entity()
            entity.name = "point_light"
            light = sapien.render.RenderPointLightComponent()
            entity.add_component(light)
            light.color = color
            light.shadow = shadow
            light.shadow_near = shadow_near
            light.shadow_far = shadow_far
            light.shadow_map_size = shadow_map_size
            if self.parallel_in_single_scene:
                light.pose = sapien.Pose(position + self.scene_offsets_np[scene_idx])
            else:
                light.pose = sapien.Pose(position)

            scene.add_entity(entity)
        return light



[docs]
    def add_directional_light(
        self,
        direction,
        color,
        shadow=False,
        position=[0, 0, 0],
        shadow_scale=10.0,
        shadow_near=-10.0,
        shadow_far=10.0,
        shadow_map_size=2048,
        scene_idxs: Optional[list[int]] = None,
    ):
        if scene_idxs is None:
            scene_idxs = list(range(len(self.sub_scenes)))
        for scene_idx in scene_idxs:
            if self.parallel_in_single_scene:
                scene = self.sub_scenes[0]
            else:
                scene = self.sub_scenes[scene_idx]
            entity = sapien.Entity()
            entity.name = "directional_light"
            light = sapien.render.RenderDirectionalLightComponent()
            entity.add_component(light)
            light.color = color
            light.shadow = shadow
            light.shadow_near = shadow_near
            light.shadow_far = shadow_far
            light.shadow_half_size = shadow_scale
            light.shadow_map_size = shadow_map_size
            if self.parallel_in_single_scene:
                light_position = position + self.scene_offsets_np[scene_idx]
            else:
                light_position = position
            light.pose = sapien.Pose(
                light_position,
                sapien.math.shortest_rotation(
                    [1, 0, 0], direction  # pyright: ignore[reportArgumentType]
                ),
            )
            scene.add_entity(entity)
            if self.parallel_in_single_scene:
                # for directional lights adding multiple does not make much sense
                # and for parallel gui rendering setup accurate lighting does not matter as it is only
                # for demo purposes
                break
        return



[docs]
    def add_spot_light(
        self,
        position,
        direction,
        inner_fov: float,
        outer_fov: float,
        color,
        shadow=False,
        shadow_near=0.1,
        shadow_far=10.0,
        shadow_map_size=2048,
        scene_idxs: Optional[list[int]] = None,
    ):
        if scene_idxs is None:
            scene_idxs = list(range(len(self.sub_scenes)))
        for scene_idx in scene_idxs:
            if self.parallel_in_single_scene:
                scene = self.sub_scenes[0]
            else:
                scene = self.sub_scenes[scene_idx]
            entity = sapien.Entity()
            entity.name = "spot_light"
            light = sapien.render.RenderSpotLightComponent()
            entity.add_component(light)
            light.color = color
            light.shadow = shadow
            light.shadow_near = shadow_near
            light.shadow_far = shadow_far
            light.shadow_map_size = shadow_map_size
            light.inner_fov = inner_fov
            light.outer_fov = outer_fov
            if self.parallel_in_single_scene:
                light_position = position + self.scene_offsets_np[scene_idx]
            else:
                light_position = position
            light.pose = sapien.Pose(
                light_position,
                sapien.math.shortest_rotation(
                    [1, 0, 0], direction  # pyright: ignore[reportArgumentType]
                ),
            )
            scene.add_entity(entity)
        return



[docs]
    def add_area_light_for_ray_tracing(
        self,
        pose: sapien.Pose,
        color,
        half_width: float,
        half_height: float,
        scene_idxs=None,
    ):
        lighting_scenes = (
            self.sub_scenes
            if scene_idxs is None
            else [self.sub_scenes[i] for i in scene_idxs]
        )
        for scene in lighting_scenes:
            entity = sapien.Entity()
            light = sapien.render.RenderParallelogramLightComponent()
            entity.add_component(light)
            light.set_shape(half_width, half_height)
            light.color = color
            light.pose = pose
            scene.add_entity(entity)
        return


    # def remove_light(self, light):
    #     self.remove_entity(light.entity)

    # def set_environment_map(self, cubemap: str):
    #     if isinstance(cubemap, str):
    #         self.render_system.cubemap = sapien.render.RenderCubemap(cubemap)
    #     else:
    #         self.render_system.cubemap = cubemap

    # def set_environment_map_from_files(
    #     self, px: str, nx: str, py: str, ny: str, pz: str, nz: str
    # ):
    #     self.render_system.cubemap = sapien.render.RenderCubemap(px, nx, py, ny, pz, nz)

    # ---------------------------------------------------------------------------- #
    # Additional useful properties / functions
    # ---------------------------------------------------------------------------- #
    @property

[docs]
    def num_envs(self):
        return len(self.sub_scenes)



[docs]
    def get_pairwise_contact_impulses(
        self, obj1: Union[Actor, Link], obj2: Union[Actor, Link]
    ):
        """
        Get the impulse vectors between two actors/links. Returns impulse vector of shape (N, 3)
        where N is the number of environments and 3 is the dimension of the impulse vector itself,
        representing x, y, and z direction of impulse.

        Note that dividing the impulse value by self.px.timestep yields the pairwise contact force in Newtons. The equivalent API for that
        is self.get_pairwise_contact_force(obj1, obj2). It is generally recommended to use the force values since they are independent of the
        timestep (dt = 1 / sim_freq) of the simulation.

        Args:
            obj1: Actor | Link
            obj2: Actor | Link
        """
        # TODO (stao): Is there any optimization improvement when putting all queries all together and fetched together
        # vs multiple smaller queries? If so, might be worth exposing a helpful API for that instead of having user
        # write this code below themselves.
        if self.gpu_sim_enabled:
            assert isinstance(self.px, physx.PhysxGpuSystem)
            query_hash = hash((obj1, obj2))
            query_key = obj1.name + obj2.name

            # we rebuild the potentially expensive contact query if it has not existed previously
            # or if it has, the managed objects are a different set
            rebuild_query = (query_key not in self.pairwise_contact_queries) or (
                query_key in self._pairwise_contact_query_unique_hashes
                and self._pairwise_contact_query_unique_hashes[query_key] != query_hash
            )
            if rebuild_query:
                body_pairs = cast(
                    list[
                        tuple[
                            physx.PhysxRigidBaseComponent, physx.PhysxRigidBaseComponent
                        ]
                    ],
                    list(zip(obj1._bodies, obj2._bodies)),
                )
                self.pairwise_contact_queries[
                    query_key
                ] = self.px.gpu_create_contact_pair_impulse_query(body_pairs)
                self._pairwise_contact_query_unique_hashes[query_key] = query_hash

            query = self.pairwise_contact_queries[query_key]
            self.px.gpu_query_contact_pair_impulses(query)
            # query.cuda_impulses is shape (num_unique_pairs * num_envs, 3)
            pairwise_contact_impulses = query.cuda_impulses.torch().clone()
            return pairwise_contact_impulses
        else:
            assert isinstance(self.px, physx.PhysxCpuSystem)
            contacts = cast(physx.PhysxCpuSystem, self.px).get_contacts()
            pairwise_contact_impulses = sapien_utils.get_pairwise_contact_impulse(
                contacts, obj1._bodies[0].entity, obj2._bodies[0].entity
            )
            return common.to_tensor(pairwise_contact_impulses)[None, :]



[docs]
    def get_pairwise_contact_forces(
        self, obj1: Union[Actor, Link], obj2: Union[Actor, Link]
    ):
        """
        Get the force vectors between two actors/links. Returns force vector of shape (N, 3)
        where N is the number of environments and 3 is the dimension of the force vector itself,
        representing x, y, and z direction of force.

        Args:
            obj1: Actor | Link
            obj2: Actor | Link
        """
        return self.get_pairwise_contact_impulses(obj1, obj2) / self.px.timestep


    @cached_property

[docs]
    def scene_offsets(self):
        """torch tensor of shape (num_envs, 3) representing the offset of each scene in the world frame"""
        if self.gpu_sim_enabled:
            assert isinstance(self.px, physx.PhysxGpuSystem)
            return torch.tensor(
                np.array(
                    [
                        self.px.get_scene_offset(sub_scene)
                        for sub_scene in self.sub_scenes
                    ]
                ),
                device=self.device,
            )
        else:
            raise NotImplementedError(
                "scene_offsets is not available for CPU simulation"
            )


    @cached_property

[docs]
    def scene_offsets_np(self):
        """numpy array of shape (num_envs, 3) representing the offset of each scene in the world frame"""
        if self.gpu_sim_enabled:
            assert isinstance(self.px, physx.PhysxGpuSystem)
            return np.array(
                [self.px.get_scene_offset(sub_scene) for sub_scene in self.sub_scenes]
            )
        else:
            raise NotImplementedError(
                "scene_offsets_np is not available for CPU simulation"
            )


    # -------------------------------------------------------------------------- #
    # Simulation state (required for MPC)
    # -------------------------------------------------------------------------- #


[docs]
    def add_to_state_dict_registry(self, object: Union[Actor, Articulation]):
        if isinstance(object, Actor):
            assert (
                object.name not in self.state_dict_registry.actors
            ), f"Object {object.name} already in state dict registry"
            self.state_dict_registry.actors[object.name] = object
        elif isinstance(object, Articulation):
            assert (
                object.name not in self.state_dict_registry.articulations
            ), f"Object {object.name} already in state dict registry"
            self.state_dict_registry.articulations[object.name] = object
        else:
            raise ValueError(f"Expected Actor or Articulation, got {object}")



[docs]
    def remove_from_state_dict_registry(self, object: Union[Actor, Articulation]):
        if isinstance(object, Actor):
            assert (
                object.name in self.state_dict_registry.actors
            ), f"Object {object.name} not in state dict registry"
            del self.state_dict_registry.actors[object.name]
        elif isinstance(object, Articulation):
            assert (
                object.name in self.state_dict_registry.articulations
            ), f"Object {object.name} not in state dict registry"
            del self.state_dict_registry.articulations[object.name]
        else:
            raise ValueError(f"Expected Actor or Articulation, got {object}")



[docs]
    def get_sim_state(self) -> dict[str, dict[str, torch.Tensor]]:
        """Get simulation state. Returns a dictionary with two nested dictionaries "actors" and "articulations".
        In the nested dictionaries they map the actor/articulation name to a vector of shape (N, D) for N parallel
        environments and D dimensions of padded state per environment.

        Note that static actor data are not included. It is expected that an environment reconstructs itself in a deterministic manner such that
        the same static actors always have the same states"""
        state_dict = dict()
        state_dict["actors"] = dict()
        state_dict["articulations"] = dict()
        for actor in self.state_dict_registry.actors.values():
            if actor.px_body_type == "static":
                continue
            state_dict["actors"][actor.name] = actor.get_state().clone()
        for articulation in self.state_dict_registry.articulations.values():
            state_dict["articulations"][
                articulation.name
            ] = articulation.get_state().clone()
        if len(state_dict["actors"]) == 0:
            del state_dict["actors"]
        if len(state_dict["articulations"]) == 0:
            del state_dict["articulations"]
        return state_dict



[docs]
    def set_sim_state(self, state: dict, env_idx: Optional[torch.Tensor] = None):
        if env_idx is not None:
            prev_reset_mask = self._reset_mask.clone()
            # safe guard against setting the wrong states
            self._reset_mask[:] = False
            self._reset_mask[env_idx] = True

        if "actors" in state:
            for actor_id, actor_state in state["actors"].items():
                if len(actor_state.shape) == 1:
                    actor_state = actor_state[None, :]
                # do not pass in env_idx to avoid redundant reset mask changes
                self.state_dict_registry.actors[actor_id].set_state(actor_state, None)
        if "articulations" in state:
            for art_id, art_state in state["articulations"].items():
                if len(art_state.shape) == 1:
                    art_state = art_state[None, :]
                self.state_dict_registry.articulations[art_id].set_state(
                    art_state, None
                )
        if env_idx is not None:
            self._reset_mask = prev_reset_mask


    # ---------------------------------------------------------------------------- #
    # GPU Simulation Management
    # ---------------------------------------------------------------------------- #

[docs]
    def _setup(self, enable_gpu: bool):
        """
        Start the CPU/GPU simulation and allocate all buffers and initialize objects
        """
        if enable_gpu:
            assert isinstance(self.px, physx.PhysxGpuSystem)
            if SAPIEN_RENDER_SYSTEM == "3.1":
                for scene in self.sub_scenes:
                    scene.update_render()
            self.px.gpu_init()
        self.non_static_actors: list[Actor] = []
        # find non static actors, and set data indices that are now available after gpu_init was called
        for actor in self.actors.values():
            if actor.px_body_type == "static":
                continue
            self.non_static_actors.append(actor)
            if enable_gpu:
                actor._body_data_index  # only need to access this attribute to populate it

        for articulation in self.articulations.values():
            articulation._data_index
            for link in articulation.links:
                link._body_data_index
        for actor in self.non_static_actors:
            actor.set_pose(actor.initial_pose)
        for articulation in self.articulations.values():
            articulation.set_pose(articulation.initial_pose)

        if enable_gpu:
            assert isinstance(self.px, physx.PhysxGpuSystem)
            self.px.cuda_rigid_body_data.torch()[:, 7:] = torch.zeros_like(
                self.px.cuda_rigid_body_data.torch()[:, 7:]
            )  # zero out all velocities
            self.px.cuda_articulation_qvel.torch()[:, :] = torch.zeros_like(
                self.px.cuda_articulation_qvel.torch()
            )  # zero out all q velocities
            self.px.cuda_articulation_qf.torch()[:, :] = torch.zeros_like(
                self.px.cuda_articulation_qf.torch()
            )  # zero out all qf

            self.px.gpu_apply_rigid_dynamic_data()
            self.px.gpu_apply_articulation_root_pose()
            self.px.gpu_apply_articulation_root_velocity()
            self.px.gpu_apply_articulation_qvel()
            self.px.gpu_apply_articulation_qf()

            self._gpu_sim_initialized = True
            self.px.gpu_update_articulation_kinematics()
            self._gpu_fetch_all()



[docs]
    def _gpu_apply_all(self):
        """
        Calls gpu_apply to update all body data, qpos, qvel, qf, and root poses
        """
        assert (
            not self._needs_fetch
        ), "Once _gpu_apply_all is called, you must call _gpu_fetch_all before calling _gpu_apply_all again\
            as otherwise there is undefined behavior that is likely impossible to debug"
        assert isinstance(self.px, physx.PhysxGpuSystem)
        self.px.gpu_apply_rigid_dynamic_data()
        self.px.gpu_apply_articulation_qpos()
        self.px.gpu_apply_articulation_qvel()
        self.px.gpu_apply_articulation_qf()
        self.px.gpu_apply_articulation_root_pose()
        self.px.gpu_apply_articulation_root_velocity()
        self.px.gpu_apply_articulation_target_position()
        self.px.gpu_apply_articulation_target_velocity()
        self._needs_fetch = True



[docs]
    def _gpu_fetch_all(self):
        """
        Queries simulation for all relevant GPU data. Note that this has some overhead.
        Should only be called at most once per simulation step as this automatically queries all data for all
        objects built in the scene.
        """
        assert isinstance(self.px, physx.PhysxGpuSystem)
        if len(self.non_static_actors) > 0:
            self.px.gpu_fetch_rigid_dynamic_data()

        if len(self.articulations) > 0:
            self.px.gpu_fetch_articulation_link_pose()
            self.px.gpu_fetch_articulation_link_velocity()
            self.px.gpu_fetch_articulation_qpos()
            self.px.gpu_fetch_articulation_qvel()
            self.px.gpu_fetch_articulation_qacc()
            self.px.gpu_fetch_articulation_target_qpos()
            self.px.gpu_fetch_articulation_target_qvel()

        self._needs_fetch = False


    # ---------------------------------------------------------------------------- #
    # CPU/GPU sim Rendering Code
    # ---------------------------------------------------------------------------- #

[docs]
    def _get_all_render_bodies(
        self,
    ) -> list[Tuple[sapien.render.RenderBodyComponent, int]]:
        all_render_bodies = []
        for actor in self.actors.values():
            if actor.px_body_type == "static":
                continue
            all_render_bodies += [
                (
                    entity.find_component_by_type(sapien.render.RenderBodyComponent),
                    cast(
                        physx.PhysxRigidDynamicComponent,
                        entity.find_component_by_type(physx.PhysxRigidDynamicComponent),
                    ).gpu_pose_index,
                )
                for entity in actor._objs
            ]
        for articulation in self.articulations.values():
            all_render_bodies += [
                (
                    px_link.entity.find_component_by_type(
                        sapien.render.RenderBodyComponent
                    ),
                    px_link.gpu_pose_index,
                )
                for link in articulation.links
                for px_link in link._objs
            ]
        return all_render_bodies



[docs]
    def _setup_gpu_rendering(self):
        if SAPIEN_RENDER_SYSTEM == "3.1":
            self._sapien_31_setup_gpu_rendering()
        else:
            self._sapien_setup_gpu_rendering()



[docs]
    def _sapien_setup_gpu_rendering(self):
        """
        Prepares the scene for GPU parallelized rendering to enable taking e.g. RGB images
        """
        assert isinstance(self.px, physx.PhysxGpuSystem)
        for rb, gpu_pose_index in self._get_all_render_bodies():
            if rb is not None:
                for s in rb.render_shapes:
                    s.set_gpu_pose_batch_index(gpu_pose_index)
        self.render_system_group = sapien.render.RenderSystemGroup(
            [s.render_system for s in self.sub_scenes]
        )
        self.render_system_group.set_cuda_poses(self.px.cuda_rigid_body_data)



[docs]
    def _sapien_31_setup_gpu_rendering(self):
        """
        Prepares the scene for GPU parallelized rendering to enable taking e.g. RGB images
        """
        assert isinstance(self.px, physx.PhysxGpuSystem)
        px = self.px

        shape_pose_indices = []
        shapes = []
        scene_id = 0
        for scene in self.sub_scenes:
            scene_id += 1
            for body in scene.render_system.render_bodies:
                b = body.entity.find_component_by_type(
                    sapien.physx.PhysxRigidBodyComponent
                )
                if b is None:
                    continue
                for s in body.render_shapes:
                    shape_pose_indices.append(
                        b.gpu_pose_index  # pyright: ignore[reportAttributeAccessIssue]
                    )
                    shapes.append(s)

        cam_pose_indices = []
        cams = []
        for cameras in self.sensors.values():
            assert isinstance(cameras, Camera), f"Expected Camera, got {cameras}"
            for c in cameras.camera._render_cameras:
                b = c.entity.find_component_by_type(
                    sapien.physx.PhysxRigidBodyComponent
                )
                if b is None:
                    continue
                cam_pose_indices.append(
                    b.gpu_pose_index  # pyright: ignore[reportAttributeAccessIssue]
                )
                cams.append(c)

        sync_manager = (
            sapien.render.GpuSyncManager()  # pyright: ignore[reportAttributeAccessIssue]
        )
        sync_manager.set_cuda_poses(px.cuda_rigid_body_data)
        sync_manager.set_render_shapes(shape_pose_indices, shapes)
        sync_manager.set_cameras(cam_pose_indices, cams)

        self.render_system_group = sync_manager



[docs]
    def _gpu_setup_sensors(self, sensors: Mapping[str, BaseSensor]):
        if SAPIEN_RENDER_SYSTEM == "3.1":
            self._sapien_31_gpu_setup_sensors(sensors)
        else:
            self._sapien_gpu_setup_sensors(sensors)



[docs]
    def _sapien_gpu_setup_sensors(self, sensors: Mapping[str, BaseSensor]):
        for name, sensor in sensors.items():
            if isinstance(sensor, Camera):
                try:
                    camera_group = self.render_system_group.create_camera_group(
                        sensor.camera._render_cameras,
                        list(
                            sensor.config.shader_config.texture_names.keys()  # pyright: ignore[reportOptionalMemberAccess]
                        ),
                    )
                except RuntimeError as e:
                    raise RuntimeError(
                        "Unable to create GPU parallelized camera group. "
                        "If the error is about being unable to create a buffer, you are likely using too many Cameras. "
                        "Either use less cameras (via less parallel envs) and/or reduce the size of the cameras. "
                        "Another common cause is using a memory intensive shader, you can try using the 'minimal' shader "
                        "which optimizes for GPU memory but disables some advanced functionalities. "
                        "Another option is to avoid rendering with the rgb_array mode / using the human render cameras as "
                        "they can be more memory intensive as they typically have higher resolutions for the purposes of visualization."
                    ) from e
                sensor.camera.camera_group = camera_group
                self.camera_groups[name] = camera_group
            else:
                raise NotImplementedError(
                    f"This sensor {sensor} of type {sensor.__class__} has not been implemented yet on the GPU"
                )



[docs]
    def _sapien_31_gpu_setup_sensors(self, sensors: Mapping[str, BaseSensor]):
        for name, sensor in sensors.items():
            if isinstance(sensor, Camera):
                batch_renderer = sapien.render.RenderManager(  # pyright: ignore[reportAttributeAccessIssue]
                    sapien.render.get_shader_pack(  # pyright: ignore[reportAttributeAccessIssue]
                        sensor.config.shader_config.shader_pack  # pyright: ignore[reportOptionalMemberAccess]
                    )
                )
                batch_renderer.set_size(sensor.config.width, sensor.config.height)
                batch_renderer.set_cameras(sensor.camera._render_cameras)
                sensor.camera.camera_group = self.camera_groups[name] = batch_renderer
            else:
                raise NotImplementedError(
                    f"This sensor {sensor} of type {sensor.__class__} has not bget_picture_cuda implemented yet on the GPU"
                )



[docs]
    def get_sensor_images(
        self, obs: dict[str, Any]
    ) -> dict[str, dict[str, torch.Tensor]]:
        """Get raw sensor data as images for visualization purposes."""
        sensor_data = dict()
        for name, sensor in self.sensors.items():
            sensor_data[name] = sensor.get_images(obs[name])
        return sensor_data



[docs]
    def get_human_render_camera_images(
        self, camera_name: Optional[str] = None
    ) -> dict[str, torch.Tensor]:
        image_data = dict()
        if self.gpu_sim_enabled:
            if self.parallel_in_single_scene:
                for name, camera in self.human_render_cameras.items():
                    camera.camera._render_cameras[0].take_picture()
                    rgb = camera.get_obs(
                        rgb=True, depth=False, segmentation=False, position=False
                    )["rgb"]
                    image_data[name] = rgb
            else:
                for name, camera in self.human_render_cameras.items():
                    if camera_name is not None and name != camera_name:
                        continue
                    assert (
                        camera.config.shader_config.shader_pack  # pyright: ignore[reportOptionalMemberAccess]
                        not in [
                            "rt",
                            "rt-fast",
                            "rt-med",
                        ]
                    ), "ray tracing shaders do not work with parallel rendering"
                    camera.capture()
                    rgb = camera.get_obs(
                        rgb=True, depth=False, segmentation=False, position=False
                    )["rgb"]
                    image_data[name] = rgb
        else:
            for name, camera in self.human_render_cameras.items():
                if camera_name is not None and name != camera_name:
                    continue
                camera.capture()
                rgb = camera.get_obs(
                    rgb=True, depth=False, segmentation=False, position=False
                )["rgb"]
                image_data[name] = rgb
        return image_data