Source code for gym_jiminy.common.blocks.motor_safety_limit

"""Implementation of basic Proportional-Derivative controller block compatible
with gym_jiminy reinforcement learning pipeline environment design.
"""
import warnings
from typing import List

import numpy as np
import numba as nb

from jiminy_py.core import EncoderSensor  # pylint: disable=no-name-in-module

from .proportional_derivative_controller import get_encoder_to_motor_map

from ..bases import (BaseObs,
                     InterfaceJiminyEnv,
                     BaseControllerBlock,
                     BasePipelineWrapper,
                     ControlledJiminyEnv)


[docs] @nb.jit(nopython=True, cache=True, fastmath=True) def apply_safety_limits(command: np.ndarray, q_measured: np.ndarray, v_measured: np.ndarray, kp: np.ndarray, kd: np.ndarray, motors_soft_position_lower: np.ndarray, motors_soft_position_upper: np.ndarray, motors_velocity_limit: np.ndarray, motors_effort_limit: np.ndarray, out: np.ndarray) -> None: """Clip the command torque to ensure safe operation. It acts on each actuator independently and only activate close to the position or velocity limits. Basically, the idea to the avoid moving faster when some prescribed velocity limit or exceeding soft position bounds by forcing the command torque to act against it. Still, it may not be enough to prevent such issue in practice as the command torque is bounded. .. warning:: All the input arguments must be in motor order, including the measured position and velocity of the actuators. In practice, those measurements comes from the encoder sensors. If so, then the measurements must be re-ordered if necessary to match motor order instead of sensor order. .. seealso:: See `MotorSafetyLimit` documentation for details. :param command: Desired command to will be updated in-place if necessary. :param q_measured: Current position of the actuators. :param v_measured: Current velocity of the actuators. :param kp: Scale of the velocity bound triggered by position limits. :param kd: Scale of the effort bound triggered by velocity limits. :param motors_soft_position_lower: Soft lower position limit of the actuators. :param motors_soft_position_upper: Soft upper position limit of the actuators. :param motors_velocity_limit: Maximum velocity of the actuators. :param motors_effort_limit: Maximum effort that the actuators can output. The command torque cannot exceed this limits, not even if needed to enforce safe operation. :param out: Pre-allocated memory to store the command motor torques. """ # Computes velocity bounds based on margin from soft joint limit if any safe_velocity_lower = motors_velocity_limit * np.minimum(np.maximum( -kp * (q_measured - motors_soft_position_lower), -1.0), 1.0) safe_velocity_upper = motors_velocity_limit * np.minimum(np.maximum( -kp * (q_measured - motors_soft_position_upper), -1.0), 1.0) # Computes effort bounds based on velocity and effort bounds safe_effort_lower = motors_effort_limit * np.minimum(np.maximum( -kd * (v_measured - safe_velocity_lower), -1.0), 1.0) safe_effort_upper = motors_effort_limit * np.minimum(np.maximum( -kd * (v_measured - safe_velocity_upper), -1.0), 1.0) # Clip command according to safe effort bounds out[:] = np.minimum(np.maximum( command, safe_effort_lower), safe_effort_upper)
[docs] class MotorSafetyLimit( BaseControllerBlock[np.ndarray, np.ndarray, BaseObs, np.ndarray]): """Safety mechanism primarily designed to prevent hardware damage and premature wear, but also to temper violent, sporadic and dangerous motions. A velocity limit v+ is enforced by bounding the commanded effort such that no effort can be applied to push the joint beyond the velocity limit, and a damping effort is applied if the joint is moving at a velocity beyond the limit, ie -kd * (v - v+). When the joint is near the soft limits x+/-, the velocities are bounded to keep the position from crossing the soft limits. The k_position term determines the scale of the bound on velocity, ie v+/- = -kp * (x - x+/-). These bounds on velocity are the ones determining the bounds on effort. The output command would never exceed the maximum effort, not even if needed to enforce safe operation. .. note:: The prescribed position and velocity limits may be more respective that the actual hardware specification of the robot. .. warning:: It must be connected directly to the environment without any other intermediary controller. .. seealso:: See official ROS documentation and implementation for details: https://wiki.ros.org/pr2_controller_manager/safety_limits https://github.com/PR2/pr2_mechanism/blob/melodic-devel/pr2_mechanism_model/src/joint.cpp """ # noqa: E501 # pylint: disable=line-too-long def __init__(self, name: str, env: InterfaceJiminyEnv[BaseObs, np.ndarray], *, kp: float, kd: float, soft_position_margin: float, soft_velocity_max: float, soft_effort_rel_max: float = 1.0) -> None: """ :param name: Name of the block. :param env: Environment to connect with. :param kp: Scale of the velocity bound triggered by position limits. :param kd: Scale of the effort bound triggered by velocity limits. :param soft_position_margin: Minimum distance of the current joint positions from their respective bounds before starting to break. :param soft_velocity_max: Maximum velocity of the joint before starting to break. :param soft_effort_rel_max: Maximum effort of the motor before applying artificial saturation on it. This limitation is ignored in evaluation mode. Optional: 1.0 by default. """ # Make sure that the parameters are valid if soft_position_margin < 0.0: raise ValueError("Soft position margin must be positive.") if soft_velocity_max < 0.0: raise ValueError("Soft maximum velocity must be positive.") if soft_effort_rel_max < 0.0 or soft_effort_rel_max > 1.0: raise ValueError( "Soft relative maximum torque must be between 0.0 and 1.0.") # Make sure that no other controller has been added prior to this block env_unwrapped: InterfaceJiminyEnv = env while isinstance(env_unwrapped, BasePipelineWrapper): if isinstance(env_unwrapped, ControlledJiminyEnv): raise TypeError( "No other control block must be added prior to this one.") env_unwrapped = env_unwrapped.env # Backup some user argument(s) self.kp = kp self.kd = kd # Extract mechanical reduction ratio # FIXME: Is it considered invariant ? If not, it should be refreshed in # `_setup`, as done for `DeformationEstimator`. encoder_to_joint_ratio = [] for motor in env.robot.motors: motor_options = motor.get_options() encoder_to_joint_ratio.append(motor_options["mechanicalReduction"]) # Define buffers storing information about the motors for efficiency self.motors_position_lower = np.array([ motor.position_limit_lower + ratio * soft_position_margin for motor, ratio in zip(env.robot.motors, encoder_to_joint_ratio)]) self.motors_position_upper = np.array([ motor.position_limit_upper - ratio * soft_position_margin for motor, ratio in zip(env.robot.motors, encoder_to_joint_ratio)]) self.motors_velocity_limit = np.array([ min(motor.velocity_limit, ratio * soft_velocity_max) for motor, ratio in zip(env.robot.motors, encoder_to_joint_ratio)]) self.motors_effort_limit_true = np.array([ motor.effort_limit for motor in env.robot.motors]) self.motors_effort_limit_true[ self.motors_position_lower > self.motors_position_upper] = 0.0 self.motors_effort_limit_soft = ( self.motors_effort_limit_true * soft_effort_rel_max) # Mapping from motors to encoders self.encoder_to_motor_map = get_encoder_to_motor_map(env.robot) # Whether stored reference to encoder measurements are already in the # same order as the motors, allowing skipping re-ordering entirely. self._is_same_order = isinstance(self.encoder_to_motor_map, slice) if not self._is_same_order: warnings.warn( "Consider using the same ordering for encoders and motors for " "optimal performance.") # Extract measured motor positions and velocities for fast access self.q_measured, self.v_measured = ( env.measurement["measurements"][EncoderSensor.type]) # Initialize the controller super().__init__(name, env, update_ratio=1) # Whether to enforce soft effort limits self._enable_limit_soft = True def _initialize_action_space(self) -> None: """Configure the action space of the controller. The action spaces corresponds to the command motors efforts. """ self.action_space = self.env.action_space @property def fieldnames(self) -> List[str]: return [f"currentMotorTorque{motor.name}" for motor in self.env.robot.motors] def _setup(self) -> None: # Call base implementation super()._setup() # Unbounded effort limits in evaluation mode. # Note that training/evaluation cannot be changed at this point. self._enable_limit_soft = self.env.training
[docs] def compute_command(self, action: np.ndarray, command: np.ndarray) -> None: """Apply safety limits to the desired motor torques right before sending it to the robot so as to avoid exceeded prescribed position and velocity limits. :param action: Desired motor torques to apply on the robot. :param command: Current motor torques that will be updated in-place. """ # Extract motor positions and velocity from encoder data q_measured, v_measured = self.q_measured, self.v_measured if not self._is_same_order: q_measured = q_measured[self.encoder_to_motor_map] v_measured = v_measured[self.encoder_to_motor_map] # Pick the right effort limits depending on training / evaluation mode if self._enable_limit_soft: motors_effort_limit = self.motors_effort_limit_soft else: motors_effort_limit = self.motors_effort_limit_true # Clip command according to safe effort bounds apply_safety_limits(action, q_measured, v_measured, self.kp, self.kd, self.motors_position_lower, self.motors_position_upper, self.motors_velocity_limit, motors_effort_limit, command)