Skip to content

collision_reward

CollisionReward

Bases: BaseRewardFunction

Collision reward Penalize robot collision. Typically collision_reward_weight is negative. Note that we ignore collisions with any floor objects.

Parameters:

Name Type Description Default
robot_idn int

robot identifier to evaluate collision penalty with. Default is 0, corresponding to the first robot added to the scene

0
ignore_self_collisions bool

Whether to ignore robot self-collisions or not

True
r_collision float

Penalty value (>0) to penalize collisions

0.1
Source code in omnigibson/reward_functions/collision_reward.py
class CollisionReward(BaseRewardFunction):
    """
    Collision reward
    Penalize robot collision. Typically collision_reward_weight is negative. Note that we ignore collisions with any
    floor objects.

    Args:
        robot_idn (int): robot identifier to evaluate collision penalty with. Default is 0, corresponding to the first
            robot added to the scene
        ignore_self_collisions (bool): Whether to ignore robot self-collisions or not
        r_collision (float): Penalty value (>0) to penalize collisions
    """

    def __init__(self, robot_idn=0, ignore_self_collisions=True, r_collision=0.1):
        # Store internal vars
        assert r_collision > 0, f"r_collision must be positive, got: {r_collision}!"
        self._robot_idn = robot_idn
        self._ignore_self_collisions = ignore_self_collisions
        self._r_collision = r_collision

        # Run super
        super().__init__()

    def _step(self, task, env, action):
        # Penalty is Reward is -self._r_collision if there were any collisions in the last timestep
        robot = env.robots[self._robot_idn]
        # Ignore floors and potentially robot's own prims as well
        floors = list(env.scene.object_registry("category", "floors", []))
        ignore_objs = floors if self._ignore_self_collisions is None else floors + [robot]
        in_contact = len(env.robots[self._robot_idn].states[ContactBodies].get_value(ignore_objs=tuple(ignore_objs))) > 0
        reward = float(in_contact) * -self._r_collision
        return reward, {}