Source code for rofunc.learning.RofuncRL.tasks.isaacgymenv.base.curi_base_task

# Copyright 2023, Junjia LIU, jjliu@mae.cuhk.edu.hk
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from isaacgym import gymtorch, gymapi
from isaacgym.torch_utils import *

from rofunc.learning.RofuncRL.tasks.isaacgymenv.base.vec_task import VecTask


[docs]class CURIBaseTask(VecTask): def __init__(self, cfg, rl_device, sim_device, graphics_device_id, headless, virtual_screen_capture, force_render): self.cfg = cfg self.max_episode_length = self.cfg["env"]["episodeLength"] self.action_scale = self.cfg["env"]["actionScale"] self.start_position_noise = self.cfg["env"]["startPositionNoise"] self.start_rotation_noise = self.cfg["env"]["startRotationNoise"] self.num_props = self.cfg["env"]["numProps"] self.aggregate_mode = self.cfg["env"]["aggregateMode"] self.dof_vel_scale = self.cfg["env"]["dofVelocityScale"] self.dist_reward_scale = self.cfg["env"]["distRewardScale"] self.rot_reward_scale = self.cfg["env"]["rotRewardScale"] self.around_handle_reward_scale = self.cfg["env"]["aroundHandleRewardScale"] self.open_reward_scale = self.cfg["env"]["openRewardScale"] self.finger_dist_reward_scale = self.cfg["env"]["fingerDistRewardScale"] self.action_penalty_scale = self.cfg["env"]["actionPenaltyScale"] self.debug_viz = self.cfg["env"]["enableDebugVis"] self.up_axis = "z" self.up_axis_idx = 2 self.distX_offset = 0.04 self.dt = 1 / 60. # prop dimensions self.prop_width = 0.08 self.prop_height = 0.08 self.prop_length = 0.08 self.prop_spacing = 0.09 super().__init__(config=self.cfg, rl_device=rl_device, sim_device=sim_device, graphics_device_id=graphics_device_id, headless=headless, virtual_screen_capture=virtual_screen_capture, force_render=force_render)
[docs] def create_sim(self): self.sim_params.up_axis = gymapi.UP_AXIS_Z self.sim_params.gravity.x = 0 self.sim_params.gravity.y = 0 self.sim_params.gravity.z = -9.81 self.sim = super().create_sim(self.device_id, self.graphics_device_id, self.physics_engine, self.sim_params) self._create_ground_plane() self._create_envs(self.num_envs, self.cfg["env"]['envSpacing'], int(np.sqrt(self.num_envs)))
def _create_ground_plane(self): plane_params = gymapi.PlaneParams() plane_params.normal = gymapi.Vec3(0.0, 0.0, 1.0) self.gym.add_ground(self.sim, plane_params)
[docs] def pre_physics_step(self, actions): self.actions = actions.clone().to(self.device) targets = self.curi_dof_targets[:, :self.num_curi_dofs] + self.curi_dof_speed_scales * self.dt * self.actions * self.action_scale self.curi_dof_targets[:, :self.num_curi_dofs] = tensor_clamp( targets, self.curi_dof_lower_limits, self.curi_dof_upper_limits) env_ids_int32 = torch.arange(self.num_envs, dtype=torch.int32, device=self.device) self.gym.set_dof_position_target_tensor(self.sim, gymtorch.unwrap_tensor(self.curi_dof_targets))