Gymnasium/gym/envs/robotics/hand/manipulate_touch_sensors.py

import os
import numpy as np

from gym import utils, error, spaces
from gym.envs.robotics.hand import manipulate

# Ensure we get the path separator correct on windows
MANIPULATE_BLOCK_XML = os.path.join('hand', 'manipulate_block_touch_sensors.xml')
MANIPULATE_EGG_XML = os.path.join('hand', 'manipulate_egg_touch_sensors.xml')
MANIPULATE_PEN_XML = os.path.join('hand', 'manipulate_pen_touch_sensors.xml')


class ManipulateTouchSensorsEnv(manipulate.ManipulateEnv, utils.EzPickle):
    def __init__(
        self, model_path, target_position, target_rotation,
        target_position_range, reward_type, initial_qpos={},
        randomize_initial_position=True, randomize_initial_rotation=True,
        distance_threshold=0.01, rotation_threshold=0.1, n_substeps=20, relative_control=False,
        ignore_z_target_rotation=False, touch_visualisation="on_touch", touch_get_obs="boolean",
    ):
        """Initializes a new Hand manipulation environment with touch sensors.

        Args:
            touch_visualisation (string): how touch sensor sites are visualised
                - "on_touch": shows touch sensor sites only when touch values > 0
                - "always": always shows touch sensor sites
                - "off" or else: does not show touch sensor sites
            touch_get_obs (string): touch sensor readings
                - "boolean": returns 1 if touch sensor reading != 0.0 else 0
                - "log": returns log(x+1) touch sensor readings from self.sim.data.sensordata[]
                - "off" or else: does not add touch sensor readings to the observation

        """
        self.touch_visualisation = touch_visualisation
        self.touch_get_obs = touch_get_obs
        self._touch_sensor_id_site_id = []
        self.touch_color = [1, 0, 0, 0.4]
        self.notouch_color = [0, 0.5, 0, 0.3]

        manipulate.ManipulateEnv.__init__(
            self, model_path, target_position, target_rotation,
            target_position_range, reward_type, initial_qpos=initial_qpos,
            randomize_initial_position=randomize_initial_position, randomize_initial_rotation=randomize_initial_rotation,
            distance_threshold=distance_threshold, rotation_threshold=rotation_threshold, n_substeps=n_substeps, relative_control=relative_control,
            ignore_z_target_rotation=ignore_z_target_rotation,
        )
        utils.EzPickle.__init__(self)

        for k, v in self.sim.model._sensor_name2id.items():  # get touch sensor ids and their site names
            if 'robot0:TS_' in k:
                self._touch_sensor_id_site_id.append((v, self.sim.model._site_name2id[k.replace('robot0:TS_', 'robot0:T_')]))

        if self.touch_visualisation == 'off':  # set touch sensors rgba values
            for touch_sensor_id, site_id in self._touch_sensor_id_site_id:
                self.sim.model.site_rgba[site_id][3] = 0.0
        elif self.touch_visualisation == 'always':
            pass

        obs = self._get_obs()
        self.observation_space = spaces.Dict(dict(
            desired_goal=spaces.Box(-np.inf, np.inf, shape=obs['achieved_goal'].shape, dtype='float32'),
            achieved_goal=spaces.Box(-np.inf, np.inf, shape=obs['achieved_goal'].shape, dtype='float32'),
            observation=spaces.Box(-np.inf, np.inf, shape=obs['observation'].shape, dtype='float32'),
        ))

    def _render_callback(self):
        super(ManipulateTouchSensorsEnv, self)._render_callback()
        if self.touch_visualisation == 'on_touch':
            for touch_sensor_id, site_id in self._touch_sensor_id_site_id:
                if self.sim.data.sensordata[touch_sensor_id] != 0.0:
                    self.sim.model.site_rgba[site_id] = self.touch_color
                else:
                    self.sim.model.site_rgba[site_id] = self.notouch_color

    def _get_obs(self):
        robot_qpos, robot_qvel = manipulate.robot_get_obs(self.sim)
        object_qvel = self.sim.data.get_joint_qvel('object:joint')
        achieved_goal = self._get_achieved_goal().ravel()  # this contains the object position + rotation
        touch_values = []  # get touch sensor readings. if there is one, set value to 1
        if self.touch_get_obs == 'boolean':
            for touch_sensor_id, site_id in self._touch_sensor_id_site_id:
                value = 1.0 if self.sim.data.sensordata[touch_sensor_id] != 0.0 else 0.0
                touch_values.append(value)
        elif self.touch_get_obs == 'log':
            for touch_sensor_id, site_id in self._touch_sensor_id_site_id:
                value = self.sim.data.sensordata[touch_sensor_id]
                touch_values.append(value)
            if len(touch_values) > 0:
                touch_values = np.log(np.array(touch_values) + 1.0)
        observation = np.concatenate([robot_qpos, robot_qvel, object_qvel, touch_values, achieved_goal])

        return {
            'observation': observation.copy(),
            'achieved_goal': achieved_goal.copy(),
            'desired_goal': self.goal.ravel().copy(),
        }


class HandBlockTouchSensorsEnv(ManipulateTouchSensorsEnv):
    def __init__(self, target_position='random', target_rotation='xyz', reward_type='sparse'):
        super(HandBlockTouchSensorsEnv, self).__init__(
            model_path=MANIPULATE_BLOCK_XML, target_position=target_position,
            target_rotation=target_rotation,
            target_position_range=np.array([(-0.04, 0.04), (-0.06, 0.02), (0.0, 0.06)]),
            reward_type=reward_type)


class HandEggTouchSensorsEnv(ManipulateTouchSensorsEnv):
    def __init__(self, target_position='random', target_rotation='xyz', reward_type='sparse'):
        super(HandEggTouchSensorsEnv, self).__init__(
            model_path=MANIPULATE_EGG_XML, target_position=target_position,
            target_rotation=target_rotation,
            target_position_range=np.array([(-0.04, 0.04), (-0.06, 0.02), (0.0, 0.06)]),
            reward_type=reward_type)


class HandPenTouchSensorsEnv(ManipulateTouchSensorsEnv):
    def __init__(self, target_position='random', target_rotation='xyz', reward_type='sparse'):
        super(HandPenTouchSensorsEnv, self).__init__(
            model_path=MANIPULATE_PEN_XML, target_position=target_position,
            target_rotation=target_rotation,
            target_position_range=np.array([(-0.04, 0.04), (-0.06, 0.02), (0.0, 0.06)]),
            randomize_initial_rotation=False, reward_type=reward_type,
            ignore_z_target_rotation=True, distance_threshold=0.05)
Add optional touch sensors for hand environments (#1299) * extending robotics shadow hand with touch sensors * extending robotics shadow hand with touch sensors * extending robotics shadow hand with touch sensors * extending robotics shadow hand with touch sensors * extending robotics shadow hand with touch sensors * extending robotics shadow hand with touch sensors * extending robotics shadow hand with touch sensors Co-authored-by: Luca Lach <llach@techfak.uni-bielefeld.de> * add touch sensors layout * add touch sensors layout * extending robotics shadow hand with touch sensors Co-authored-by: Luca Lach <llach@techfak.uni-bielefeld.de> * extending robotics shadow hand with touch sensors * add touch sensors layout Co-authored-by: Luca Lach <llach@techfak.uni-bielefeld.de> * update touch sensors layout 85 Co-authored-by: Luca Lach <llach@techfak.uni-bielefeld.de> * add manipulate_egg_touch_sensors_85.xml & manipulate_pen_touch_sensors_85.xml; ManipulateTouchSensorsEnv._render_callback() Co-authored-by: Luca Lach <llach@techfak.uni-bielefeld.de> * add shared_touch_sensors_92.xml; solve pytest . failure Co-authored-by: Luca Lach <llach@techfak.uni-bielefeld.de> 2019-02-09 01:00:19 +01:00			`import os`
			`import numpy as np`

			`from gym import utils, error, spaces`
			`from gym.envs.robotics.hand import manipulate`

			`# Ensure we get the path separator correct on windows`
			`MANIPULATE_BLOCK_XML = os.path.join('hand', 'manipulate_block_touch_sensors.xml')`
			`MANIPULATE_EGG_XML = os.path.join('hand', 'manipulate_egg_touch_sensors.xml')`
			`MANIPULATE_PEN_XML = os.path.join('hand', 'manipulate_pen_touch_sensors.xml')`


			`class ManipulateTouchSensorsEnv(manipulate.ManipulateEnv, utils.EzPickle):`
			`def __init__(`
			`self, model_path, target_position, target_rotation,`
			`target_position_range, reward_type, initial_qpos={},`
			`randomize_initial_position=True, randomize_initial_rotation=True,`
			`distance_threshold=0.01, rotation_threshold=0.1, n_substeps=20, relative_control=False,`
			`ignore_z_target_rotation=False, touch_visualisation="on_touch", touch_get_obs="boolean",`
			`):`
			`"""Initializes a new Hand manipulation environment with touch sensors.`

			`Args:`
			`touch_visualisation (string): how touch sensor sites are visualised`
			`- "on_touch": shows touch sensor sites only when touch values > 0`
			`- "always": always shows touch sensor sites`
			`- "off" or else: does not show touch sensor sites`
			`touch_get_obs (string): touch sensor readings`
			`- "boolean": returns 1 if touch sensor reading != 0.0 else 0`
			`- "log": returns log(x+1) touch sensor readings from self.sim.data.sensordata[]`
			`- "off" or else: does not add touch sensor readings to the observation`

			`"""`
			`self.touch_visualisation = touch_visualisation`
			`self.touch_get_obs = touch_get_obs`
			`self._touch_sensor_id_site_id = []`
			`self.touch_color = [1, 0, 0, 0.4]`
			`self.notouch_color = [0, 0.5, 0, 0.3]`

			`manipulate.ManipulateEnv.__init__(`
			`self, model_path, target_position, target_rotation,`
			`target_position_range, reward_type, initial_qpos=initial_qpos,`
			`randomize_initial_position=randomize_initial_position, randomize_initial_rotation=randomize_initial_rotation,`
			`distance_threshold=distance_threshold, rotation_threshold=rotation_threshold, n_substeps=n_substeps, relative_control=relative_control,`
			`ignore_z_target_rotation=ignore_z_target_rotation,`
			`)`
			`utils.EzPickle.__init__(self)`

			`for k, v in self.sim.model._sensor_name2id.items(): # get touch sensor ids and their site names`
			`if 'robot0:TS_' in k:`
			`self._touch_sensor_id_site_id.append((v, self.sim.model._site_name2id[k.replace('robot0:TS_', 'robot0:T_')]))`

			`if self.touch_visualisation == 'off': # set touch sensors rgba values`
			`for touch_sensor_id, site_id in self._touch_sensor_id_site_id:`
			`self.sim.model.site_rgba[site_id][3] = 0.0`
			`elif self.touch_visualisation == 'always':`
			`pass`

			`obs = self._get_obs()`
			`self.observation_space = spaces.Dict(dict(`
			`desired_goal=spaces.Box(-np.inf, np.inf, shape=obs['achieved_goal'].shape, dtype='float32'),`
			`achieved_goal=spaces.Box(-np.inf, np.inf, shape=obs['achieved_goal'].shape, dtype='float32'),`
			`observation=spaces.Box(-np.inf, np.inf, shape=obs['observation'].shape, dtype='float32'),`
			`))`

			`def _render_callback(self):`
			`super(ManipulateTouchSensorsEnv, self)._render_callback()`
			`if self.touch_visualisation == 'on_touch':`
			`for touch_sensor_id, site_id in self._touch_sensor_id_site_id:`
			`if self.sim.data.sensordata[touch_sensor_id] != 0.0:`
			`self.sim.model.site_rgba[site_id] = self.touch_color`
			`else:`
			`self.sim.model.site_rgba[site_id] = self.notouch_color`

			`def _get_obs(self):`
			`robot_qpos, robot_qvel = manipulate.robot_get_obs(self.sim)`
			`object_qvel = self.sim.data.get_joint_qvel('object:joint')`
			`achieved_goal = self._get_achieved_goal().ravel() # this contains the object position + rotation`
			`touch_values = [] # get touch sensor readings. if there is one, set value to 1`
			`if self.touch_get_obs == 'boolean':`
			`for touch_sensor_id, site_id in self._touch_sensor_id_site_id:`
			`value = 1.0 if self.sim.data.sensordata[touch_sensor_id] != 0.0 else 0.0`
			`touch_values.append(value)`
			`elif self.touch_get_obs == 'log':`
			`for touch_sensor_id, site_id in self._touch_sensor_id_site_id:`
			`value = self.sim.data.sensordata[touch_sensor_id]`
			`touch_values.append(value)`
			`if len(touch_values) > 0:`
			`touch_values = np.log(np.array(touch_values) + 1.0)`
			`observation = np.concatenate([robot_qpos, robot_qvel, object_qvel, touch_values, achieved_goal])`

			`return {`
			`'observation': observation.copy(),`
			`'achieved_goal': achieved_goal.copy(),`
			`'desired_goal': self.goal.ravel().copy(),`
			`}`


			`class HandBlockTouchSensorsEnv(ManipulateTouchSensorsEnv):`
			`def __init__(self, target_position='random', target_rotation='xyz', reward_type='sparse'):`
			`super(HandBlockTouchSensorsEnv, self).__init__(`
			`model_path=MANIPULATE_BLOCK_XML, target_position=target_position,`
			`target_rotation=target_rotation,`
			`target_position_range=np.array([(-0.04, 0.04), (-0.06, 0.02), (0.0, 0.06)]),`
			`reward_type=reward_type)`


			`class HandEggTouchSensorsEnv(ManipulateTouchSensorsEnv):`
			`def __init__(self, target_position='random', target_rotation='xyz', reward_type='sparse'):`
			`super(HandEggTouchSensorsEnv, self).__init__(`
			`model_path=MANIPULATE_EGG_XML, target_position=target_position,`
			`target_rotation=target_rotation,`
			`target_position_range=np.array([(-0.04, 0.04), (-0.06, 0.02), (0.0, 0.06)]),`
			`reward_type=reward_type)`


			`class HandPenTouchSensorsEnv(ManipulateTouchSensorsEnv):`
			`def __init__(self, target_position='random', target_rotation='xyz', reward_type='sparse'):`
			`super(HandPenTouchSensorsEnv, self).__init__(`
			`model_path=MANIPULATE_PEN_XML, target_position=target_position,`
			`target_rotation=target_rotation,`
			`target_position_range=np.array([(-0.04, 0.04), (-0.06, 0.02), (0.0, 0.06)]),`
			`randomize_initial_rotation=False, reward_type=reward_type,`
			`ignore_z_target_rotation=True, distance_threshold=0.05)`