Legged Robot

The document outlines the implementation of a LeggedRobot class in a simulation environment, detailing its initialization, action application, and observation computation. It includes methods for handling physics steps, computing rewards, and managing environment resets. The class is designed to facilitate the training of legged robots using the Isaac Gym framework.

# SPDX-FileCopyrightText: Copyright (c) 2021 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: BSD-3-Clause
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# 1. Redistributions of source code must retain the above copyright notice, this
# list of conditions and the following disclaimer.
#
# 2. Redistributions in binary form must reproduce the above copyright notice,
# this list of conditions and the following disclaimer in the documentation
# and/or other materials provided with the distribution.
#
# 3. Neither the name of the copyright holder nor the names of its
# contributors may be used to endorse or promote products derived from
# this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#
# Copyright (c) 2021 ETH Zurich, Nikita Rudin

from legged_gym import LEGGED_GYM_ROOT_DIR, envs


from time import time
from warnings import WarningMessage
import numpy as np
import os

from isaacgym.torch_utils import *


from isaacgym import gymtorch, gymapi, gymutil

import torch
from torch import Tensor
from typing import Tuple, Dict

from legged_gym import LEGGED_GYM_ROOT_DIR


from legged_gym.envs.base.base_task import BaseTask
from legged_gym.utils.terrain import Terrain
from legged_gym.utils.math import quat_apply_yaw, wrap_to_pi, torch_rand_sqrt_float
from legged_gym.utils.helpers import class_to_dict
from .legged_robot_config import LeggedRobotCfg

class LeggedRobot(BaseTask):
def __init__(self, cfg: LeggedRobotCfg, sim_params, physics_engine, sim_device,
headless):
""" Parses the provided config file,
calls create_sim() (which creates the simulation, terrain and environments),
initializes pytorch buffers used during training
Args:
cfg (Dict): Environment config file
sim_params (gymapi.SimParams): simulation parameters
physics_engine (gymapi.SimType): gymapi.SIM_PHYSX (must be PhysX)
sim_device (string): device for the simulation, e.g. 'cuda:0' or 'cpu'
headless (bool): Run without rendering if True
"""
self.cfg = cfg
self.sim_params = sim_params
self.height_samples = None
self.debug_viz = False
self.init_done = False
self._parse_cfg(self.cfg)
super().__init__(self.cfg, sim_params, physics_engine, sim_device,
headless)
self.num_one_step_obs = self.cfg.env.num_one_step_observations
self.num_one_step_privileged_obs = self.cfg.env.num_one_step_privileged_obs
self.history_length = int(self.num_obs / self.num_one_step_obs)
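# Note: the stacked observation is a rolling history, so num_obs is expected
# to be an integer multiple of num_one_step_observations; compute_observations()
# prepends the newest one-step slice and drops the oldest. For example, a
# 45-dim one-step observation with num_obs = 270 spans 6 control steps
# (illustrative numbers; the actual sizes come from the cfg).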

if not self.headless:
self.set_camera(self.cfg.viewer.pos, self.cfg.viewer.lookat)
self._init_buffers()
self._prepare_reward_function()
self.init_done = True

def step(self, actions):


""" Apply actions, simulate, call self.post_physics_step()

Args:
actions (torch.Tensor): Tensor of shape (num_envs, num_actions_per_env)
"""
clip_actions = self.cfg.normalization.clip_actions
self.actions = torch.clip(actions, -clip_actions,
clip_actions).to(self.device)

self.delayed_actions = self.actions.clone().view(self.num_envs, 1,
self.num_actions).repeat(1, self.cfg.control.decimation, 1)
delay_steps = torch.randint(0, self.cfg.control.decimation, (self.num_envs,
1), device=self.device)
if self.cfg.domain_rand.delay:
for i in range(self.cfg.control.decimation):
self.delayed_actions[:, i] = self.last_actions + (self.actions -
self.last_actions) * (i >= delay_steps)
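# With domain_rand.delay enabled, each env draws delay_steps uniformly from
# [0, decimation): sub-steps with i < delay_steps keep applying last_actions,
# and the new action takes over once i >= delay_steps, emulating a randomized
# actuation latency of up to one policy step.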
# step physics and render each frame
self.render()
for i in range(self.cfg.control.decimation):
self.torques = self._compute_torques(self.delayed_actions[:, i]).view(self.torques.shape)
self.gym.set_dof_actuation_force_tensor(self.sim,
gymtorch.unwrap_tensor(self.torques))
self.gym.simulate(self.sim)
if self.device == 'cpu':
self.gym.fetch_results(self.sim, True)
self.gym.refresh_dof_state_tensor(self.sim)
termination_ids, termination_privileged_obs = self.post_physics_step()

# return clipped obs, clipped states (None), rewards, dones and infos
clip_obs = self.cfg.normalization.clip_observations
self.obs_buf = torch.clip(self.obs_buf, -clip_obs, clip_obs)
if self.privileged_obs_buf is not None:
self.privileged_obs_buf = torch.clip(self.privileged_obs_buf, -
clip_obs, clip_obs)
return self.obs_buf, self.privileged_obs_buf, self.rew_buf, self.reset_buf, self.extras, termination_ids, termination_privileged_obs

def post_physics_step(self):
""" check terminations, compute observations and rewards
calls self._post_physics_step_callback() for common computations
calls self._draw_debug_vis() if needed
"""
self.gym.refresh_actor_root_state_tensor(self.sim)
self.gym.refresh_net_contact_force_tensor(self.sim)
self.gym.refresh_rigid_body_state_tensor(self.sim)

self.episode_length_buf += 1
self.common_step_counter += 1

# prepare quantities
self.base_quat[:] = self.root_states[:, 3:7]
self.base_lin_vel[:] = quat_rotate_inverse(self.base_quat,
self.root_states[:, 7:10])
self.base_ang_vel[:] = quat_rotate_inverse(self.base_quat,
self.root_states[:, 10:13])
self.projected_gravity[:] = quat_rotate_inverse(self.base_quat,
self.gravity_vec)

self.feet_pos = self.rigid_body_states.view(self.num_envs, self.num_bodies, 13)[:, self.feet_indices, 0:3]
self.feet_vel = self.rigid_body_states.view(self.num_envs, self.num_bodies,
13)[:, self.feet_indices, 7:10]
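# Each rigid body state holds 13 floats: position (0:3), quaternion (3:7),
# linear velocity (7:10) and angular velocity (10:13), hence the slices above.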

self._post_physics_step_callback()

# compute observations, rewards, resets, ...


self.check_termination()
self.compute_reward()
env_ids = self.reset_buf.nonzero(as_tuple=False).flatten()
termination_privileged_obs = self.compute_termination_observations(env_ids)
self.reset_idx(env_ids)
self.compute_observations() # in some cases a simulation step might be required to refresh some obs (for example body positions)

self.disturbance[:, :, :] = 0.0
self.last_last_actions[:] = self.last_actions[:]
self.last_actions[:] = self.actions[:]
self.last_dof_vel[:] = self.dof_vel[:]
self.last_root_vel[:] = self.root_states[:, 7:13]

if self.viewer and self.enable_viewer_sync and self.debug_viz:


self._draw_debug_vis()

return env_ids, termination_privileged_obs

def check_termination(self):
""" Check if environments need to be reset
"""
self.reset_buf = torch.any(torch.norm(self.contact_forces[:,
self.termination_contact_indices, :], dim=-1) > 1., dim=1)
self.time_out_buf = self.episode_length_buf > self.max_episode_length # no terminal reward for time-outs
self.reset_buf |= self.time_out_buf

def reset_idx(self, env_ids):


""" Reset some environments.
Calls self._reset_dofs(env_ids), self._reset_root_states(env_ids), and
self._resample_commands(env_ids)
[Optional] calls self._update_terrain_curriculum(env_ids) and self.update_command_curriculum(env_ids)
Logs episode info
Resets some buffers

Args:
env_ids (list[int]): List of environment ids which must be reset
"""
if len(env_ids) == 0:
return
# update curriculum
if self.cfg.terrain.curriculum:
self._update_terrain_curriculum(env_ids)
# avoid updating command curriculum at each step since the maximum command is common to all envs
if self.cfg.commands.curriculum and (self.common_step_counter %
self.max_episode_length==0):
self.update_command_curriculum(env_ids)

# reset robot states


self._reset_dofs(env_ids)
self._reset_root_states(env_ids)

self._resample_commands(env_ids)

# reset buffers
self.last_actions[env_ids] = 0.
self.last_last_actions[env_ids] = 0.
self.last_dof_vel[env_ids] = 0.
self.feet_air_time[env_ids] = 0.
self.reset_buf[env_ids] = 1

# update height measurements


if self.cfg.terrain.measure_heights:
self.measured_heights = self._get_heights()

#reset randomized prop


if self.cfg.domain_rand.randomize_kp:
self.Kp_factors[env_ids] = torch_rand_float(self.cfg.domain_rand.kp_range[0], self.cfg.domain_rand.kp_range[1], (len(env_ids), 1), device=self.device)
if self.cfg.domain_rand.randomize_kd:
self.Kd_factors[env_ids] = torch_rand_float(self.cfg.domain_rand.kd_range[0], self.cfg.domain_rand.kd_range[1], (len(env_ids), 1), device=self.device)
if self.cfg.domain_rand.randomize_motor_strength:
self.motor_strength_factors[env_ids] = torch_rand_float(self.cfg.domain_rand.motor_strength_range[0], self.cfg.domain_rand.motor_strength_range[1], (len(env_ids), 1), device=self.device)
self.refresh_actor_rigid_shape_props(env_ids)

# fill extras
self.extras["episode"] = {}
for key in self.episode_sums.keys():
self.extras["episode"]['rew_' + key] = torch.mean(self.episode_sums[key][env_ids] / torch.clip(self.episode_length_buf[env_ids], min=1) / self.dt)
self.episode_sums[key][env_ids] = 0.
# log additional curriculum info
if self.cfg.terrain.curriculum:
self.extras["episode"]["terrain_level"] = torch.mean(self.terrain_levels.float())
if self.cfg.commands.curriculum:
self.extras["episode"]["max_command_x"] = self.command_ranges["lin_vel_x"][1]
# send timeout info to the algorithm
if self.cfg.env.send_timeouts:
self.extras["time_outs"] = self.time_out_buf

self.episode_length_buf[env_ids] = 0

def compute_reward(self):
""" Compute rewards
Calls each reward function which had a non-zero scale (processed in
self._prepare_reward_function())
adds each terms to the episode sums and to the total reward
"""
self.rew_buf[:] = 0.
for i in range(len(self.reward_functions)):
name = self.reward_names[i]
rew = self.reward_functions[i]() * self.reward_scales[name]
self.rew_buf += rew
self.episode_sums[name] += rew
if self.cfg.rewards.only_positive_rewards:
self.rew_buf[:] = torch.clip(self.rew_buf[:], min=0.)
# add termination reward after clipping
if "termination" in self.reward_scales:
rew = self._reward_termination() * self.reward_scales["termination"]
self.rew_buf += rew
self.episode_sums["termination"] += rew

def compute_observations(self):
""" Computes observations
"""
current_obs = torch.cat(( self.commands[:, :3] * self.commands_scale,
self.base_ang_vel * self.obs_scales.ang_vel,
self.projected_gravity,
(self.dof_pos - self.default_dof_pos) *
self.obs_scales.dof_pos,
self.dof_vel * self.obs_scales.dof_vel,
self.actions
),dim=-1)
# add noise if needed
if self.add_noise:
current_obs += (2 * torch.rand_like(current_obs) - 1) * self.noise_scale_vec[0:(9 + 3 * self.num_actions)]
# add perceptive inputs if not blind
current_obs = torch.cat((current_obs, self.base_lin_vel *
self.obs_scales.lin_vel, self.disturbance[:, 0, :]), dim=-1)
if self.cfg.terrain.measure_heights:
heights = torch.clip(self.root_states[:, 2].unsqueeze(1) - 0.5 -
self.measured_heights, -1, 1.) * self.obs_scales.height_measurements
heights += (2 * torch.rand_like(heights) - 1) * self.noise_scale_vec[(9
+ 3 * self.num_actions):(9 + 3 * self.num_actions+187)]
current_obs = torch.cat((current_obs, heights), dim=-1)

self.obs_buf = torch.cat((current_obs[:, :self.num_one_step_obs], self.obs_buf[:, :-self.num_one_step_obs]), dim=-1)
self.privileged_obs_buf = torch.cat((current_obs[:, :self.num_one_step_privileged_obs], self.privileged_obs_buf[:, :-self.num_one_step_privileged_obs]), dim=-1)

def get_current_obs(self):
current_obs = torch.cat(( self.commands[:, :3] * self.commands_scale,
self.base_ang_vel * self.obs_scales.ang_vel,
self.projected_gravity,
(self.dof_pos - self.default_dof_pos) *
self.obs_scales.dof_pos,
self.dof_vel * self.obs_scales.dof_vel,
self.actions
),dim=-1)
# add noise if needed
if self.add_noise:
current_obs += (2 * torch.rand_like(current_obs) - 1) * self.noise_scale_vec[0:(9 + 3 * self.num_actions)]

# add perceptive inputs if not blind


current_obs = torch.cat((current_obs, self.base_lin_vel *
self.obs_scales.lin_vel, self.disturbance[:, 0, :]), dim=-1)
if self.cfg.terrain.measure_heights:
heights = torch.clip(self.root_states[:, 2].unsqueeze(1) - 0.5 -
self.measured_heights, -1, 1.) * self.obs_scales.height_measurements
heights += (2 * torch.rand_like(heights) - 1) * self.noise_scale_vec[(9
+ 3 * self.num_actions):(9 + 3 * self.num_actions+187)]
current_obs = torch.cat((current_obs, heights), dim=-1)

return current_obs

def compute_termination_observations(self, env_ids):


""" Computes observations
"""
current_obs = torch.cat(( self.commands[:, :3] * self.commands_scale,
self.base_ang_vel * self.obs_scales.ang_vel,
self.projected_gravity,
(self.dof_pos - self.default_dof_pos) *
self.obs_scales.dof_pos,
self.dof_vel * self.obs_scales.dof_vel,
self.actions
),dim=-1)
# add noise if needed
if self.add_noise:
current_obs += (2 * torch.rand_like(current_obs) - 1) * self.noise_scale_vec[0:(9 + 3 * self.num_actions)]

# add perceptive inputs if not blind


current_obs = torch.cat((current_obs, self.base_lin_vel *
self.obs_scales.lin_vel, self.disturbance[:, 0, :]), dim=-1)
if self.cfg.terrain.measure_heights:
heights = torch.clip(self.root_states[:, 2].unsqueeze(1) - 0.5 -
self.measured_heights, -1, 1.) * self.obs_scales.height_measurements
heights += (2 * torch.rand_like(heights) - 1) * self.noise_scale_vec[(9
+ 3 * self.num_actions):(9 + 3 * self.num_actions+187)]
current_obs = torch.cat((current_obs, heights), dim=-1)

return torch.cat((current_obs[:, :self.num_one_step_privileged_obs], self.privileged_obs_buf[:, :-self.num_one_step_privileged_obs]), dim=-1)[env_ids]

def create_sim(self):
""" Creates simulation, terrain and environments
"""
self.up_axis_idx = 2 # 2 for z, 1 for y -> adapt gravity accordingly
self.sim = self.gym.create_sim(self.sim_device_id, self.graphics_device_id,
self.physics_engine, self.sim_params)
mesh_type = self.cfg.terrain.mesh_type
if mesh_type in ['heightfield', 'trimesh']:
self.terrain = Terrain(self.cfg.terrain, self.num_envs)
if mesh_type=='plane':
self._create_ground_plane()
elif mesh_type=='heightfield':
self._create_heightfield()
elif mesh_type=='trimesh':
self._create_trimesh()
elif mesh_type is not None:
raise ValueError("Terrain mesh type not recognised. Allowed types are [None, plane, heightfield, trimesh]")
self._create_envs()

def set_camera(self, position, lookat):


""" Set camera position and direction
"""
cam_pos = gymapi.Vec3(position[0], position[1], position[2])
cam_target = gymapi.Vec3(lookat[0], lookat[1], lookat[2])
self.gym.viewer_camera_look_at(self.viewer, None, cam_pos, cam_target)

#------------- Callbacks --------------


def _process_rigid_shape_props(self, props, env_id):
""" Callback allowing to store/change/randomize the rigid shape properties
of each environment.
Called During environment creation.
Base behavior: randomizes the friction of each environment

Args:
props (List[gymapi.RigidShapeProperties]): Properties of each shape of
the asset
env_id (int): Environment id

Returns:
[List[gymapi.RigidShapeProperties]]: Modified rigid shape properties
"""
if self.cfg.domain_rand.randomize_friction:
if env_id==0:
# prepare friction randomization
friction_range = self.cfg.domain_rand.friction_range
self.friction_coeffs = torch_rand_float(friction_range[0],
friction_range[1], (self.num_envs,1), device=self.device)

for s in range(len(props)):
props[s].friction = self.friction_coeffs[env_id]

if self.cfg.domain_rand.randomize_restitution:
if env_id==0:
# prepare restitution randomization
restitution_range = self.cfg.domain_rand.restitution_range
self.restitution_coeffs = torch_rand_float(restitution_range[0],
restitution_range[1], (self.num_envs,1), device=self.device)

for s in range(len(props)):
props[s].restitution = self.restitution_coeffs[env_id]

return props

def refresh_actor_rigid_shape_props(self, env_ids):


if self.cfg.domain_rand.randomize_friction:
self.friction_coeffs[env_ids] = torch_rand_float(self.cfg.domain_rand.friction_range[0], self.cfg.domain_rand.friction_range[1], (len(env_ids), 1), device=self.device)
if self.cfg.domain_rand.randomize_restitution:
self.restitution_coeffs[env_ids] = torch_rand_float(self.cfg.domain_rand.restitution_range[0], self.cfg.domain_rand.restitution_range[1], (len(env_ids), 1), device=self.device)

for env_id in env_ids:
rigid_shape_props = self.gym.get_actor_rigid_shape_properties(self.envs[env_id], 0)

for i in range(len(rigid_shape_props)):
rigid_shape_props[i].friction = self.friction_coeffs[env_id, 0]
rigid_shape_props[i].restitution = self.restitution_coeffs[env_id,
0]

self.gym.set_actor_rigid_shape_properties(self.envs[env_id], 0,
rigid_shape_props)

def _process_dof_props(self, props, env_id):


""" Callback allowing to store/change/randomize the DOF properties of each
environment.
Called During environment creation.
Base behavior: stores position, velocity and torques limits defined in
the URDF

Args:
props (numpy.array): Properties of each DOF of the asset
env_id (int): Environment id

Returns:
[numpy.array]: Modified DOF properties
"""
if env_id==0:
self.dof_pos_limits = torch.zeros(self.num_dof, 2, dtype=torch.float,
device=self.device, requires_grad=False)
self.dof_vel_limits = torch.zeros(self.num_dof, dtype=torch.float,
device=self.device, requires_grad=False)
self.torque_limits = torch.zeros(self.num_dof, dtype=torch.float,
device=self.device, requires_grad=False)
for i in range(len(props)):
self.dof_pos_limits[i, 0] = props["lower"][i].item()
self.dof_pos_limits[i, 1] = props["upper"][i].item()
self.dof_vel_limits[i] = props["velocity"][i].item()
self.torque_limits[i] = props["effort"][i].item()
# soft limits
m = (self.dof_pos_limits[i, 0] + self.dof_pos_limits[i, 1]) / 2
r = self.dof_pos_limits[i, 1] - self.dof_pos_limits[i, 0]
self.dof_pos_limits[i, 0] = m - 0.5 * r * self.cfg.rewards.soft_dof_pos_limit
self.dof_pos_limits[i, 1] = m + 0.5 * r * self.cfg.rewards.soft_dof_pos_limit
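# Worked example: a joint with URDF limits [-1.0, 1.0] rad and
# soft_dof_pos_limit = 0.9 gets soft limits m +/- 0.5*r*0.9 = [-0.9, 0.9]
# (m = 0, r = 2); _reward_dof_pos_limits penalizes positions beyond these.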
return props

def _process_rigid_body_props(self, props, env_id):


# if env_id==0:
# sum = 0
# for i, p in enumerate(props):
# sum += p.mass
# print(f"Mass of body {i}: {p.mass} (before randomization)")
# print(f"Total mass {sum} (before randomization)")
# randomize base mass
if self.cfg.domain_rand.randomize_payload_mass:
props[0].mass = self.default_rigid_body_mass[0] + self.payload[env_id,
0]

if self.cfg.domain_rand.randomize_com_displacement:
props[0].com = gymapi.Vec3(self.com_displacement[env_id, 0],
self.com_displacement[env_id, 1], self.com_displacement[env_id, 2])

if self.cfg.domain_rand.randomize_link_mass:
rng = self.cfg.domain_rand.link_mass_range
for i in range(1, len(props)):
scale = np.random.uniform(rng[0], rng[1])
props[i].mass = scale * self.default_rigid_body_mass[i]

return props

def _post_physics_step_callback(self):
""" Callback called before computing terminations, rewards, and
observations
Default behaviour: Compute ang vel command based on target and heading,
compute measured terrain heights and randomly push robots
"""
#
env_ids = (self.episode_length_buf %
int(self.cfg.commands.resampling_time /
self.dt)==0).nonzero(as_tuple=False).flatten()
self._resample_commands(env_ids)
if self.cfg.commands.heading_command:
forward = quat_apply(self.base_quat, self.forward_vec)
heading = torch.atan2(forward[:, 1], forward[:, 0])
self.commands[:, 2] = torch.clip(0.5*wrap_to_pi(self.commands[:, 3] -
heading), -2., 2.)

if self.cfg.terrain.measure_heights:
self.measured_heights = self._get_heights()
if self.cfg.domain_rand.push_robots and (self.common_step_counter %
self.cfg.domain_rand.push_interval == 0):
self._push_robots()
if self.cfg.domain_rand.disturbance and (self.common_step_counter %
self.cfg.domain_rand.disturbance_interval == 0):
self._disturbance_robots()

def _resample_commands(self, env_ids):
""" Randomly select commands of some environments

Args:
env_ids (List[int]): Environments ids for which new commands are needed
"""
self.commands[env_ids, 0] = torch_rand_float(-1.0, 1.0, (len(env_ids), 1),
device=self.device).squeeze(1)
self.commands[env_ids, 1] = torch_rand_float(self.command_ranges["lin_vel_y"][0], self.command_ranges["lin_vel_y"][1], (len(env_ids), 1), device=self.device).squeeze(1)
if self.cfg.commands.heading_command:
self.commands[env_ids, 3] = torch_rand_float(self.command_ranges["heading"][0], self.command_ranges["heading"][1], (len(env_ids), 1), device=self.device).squeeze(1)
else:
self.commands[env_ids, 2] = torch_rand_float(self.command_ranges["ang_vel_yaw"][0], self.command_ranges["ang_vel_yaw"][1], (len(env_ids), 1), device=self.device).squeeze(1)

high_vel_env_ids = (env_ids < (self.num_envs * 0.2))
high_vel_env_ids = env_ids[high_vel_env_ids.nonzero(as_tuple=True)]
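# Envs with id below 20% of num_envs are treated as "high velocity" envs:
# their x commands are re-sampled below from the full lin_vel_x range,
# replacing the [-1, 1] sample drawn above.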

self.commands[high_vel_env_ids, 0] = torch_rand_float(self.command_ranges["lin_vel_x"][0], self.command_ranges["lin_vel_x"][1], (len(high_vel_env_ids), 1), device=self.device).squeeze(1)

# set y commands of high vel envs to zero
self.commands[high_vel_env_ids, 1:2] *= (torch.norm(self.commands[high_vel_env_ids, 0:1], dim=1) < 1.0).unsqueeze(1)

# set small commands to zero
self.commands[env_ids, :2] *= (torch.norm(self.commands[env_ids, :2], dim=1) > 0.2).unsqueeze(1)

def _compute_torques(self, actions):


""" Compute torques from actions.
Actions can be interpreted as position or velocity targets given to a
PD controller, or directly as scaled torques.
[NOTE]: torques must have the same dimension as the number of DOFs,
even if some DOFs are not actuated.

Args:
actions (torch.Tensor): Actions

Returns:
[torch.Tensor]: Torques sent to the simulation
"""
#pd controller
actions_scaled = actions * self.cfg.control.action_scale
actions_scaled[:, [0, 3, 6, 9]] *= self.cfg.control.hip_reduction
self.joint_pos_target = self.default_dof_pos + actions_scaled
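# PD law used for control_type "P" below (before clipping to torque limits):
# torques = p_gains * Kp_factors * (joint_pos_target - dof_pos)
#           - d_gains * Kd_factors * dof_vel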

control_type = self.cfg.control.control_type
if control_type=="P":
torques = self.p_gains * self.Kp_factors * (self.joint_pos_target -
self.dof_pos) - self.d_gains * self.Kd_factors * self.dof_vel
elif control_type=="V":
torques = self.p_gains*(actions_scaled - self.dof_vel) - self.d_gains*(self.dof_vel - self.last_dof_vel)/self.sim_params.dt
elif control_type=="T":
torques = actions_scaled
else:
raise NameError(f"Unknown controller type: {control_type}")
return torch.clip(torques, -self.torque_limits, self.torque_limits)

def _reset_dofs(self, env_ids):
""" Resets DOF position and velocities of selected environments
Positions are randomly selected within 0.5:1.5 x default positions.
Velocities are set to zero.

Args:
env_ids (List[int]): Environment ids
"""
self.dof_pos[env_ids] = self.default_dof_pos * torch_rand_float(0.5, 1.5,
(len(env_ids), self.num_dof), device=self.device)
self.dof_vel[env_ids] = 0.

env_ids_int32 = env_ids.to(dtype=torch.int32)
self.gym.set_dof_state_tensor_indexed(self.sim, gymtorch.unwrap_tensor(self.dof_state), gymtorch.unwrap_tensor(env_ids_int32), len(env_ids_int32))

def _reset_root_states(self, env_ids):
""" Resets ROOT states position and velocities of selected environments
Sets base position based on the curriculum
Selects randomized base velocities within -0.5:0.5 [m/s, rad/s]
Args:
env_ids (List[int]): Environment ids
"""
# base position
if self.custom_origins:
self.root_states[env_ids] = self.base_init_state
self.root_states[env_ids, :3] += self.env_origins[env_ids]
self.root_states[env_ids, :2] += torch_rand_float(-1., 1.,
(len(env_ids), 2), device=self.device) # xy position within 1m of the center
else:
self.root_states[env_ids] = self.base_init_state
self.root_states[env_ids, :3] += self.env_origins[env_ids]
# base velocities
self.root_states[env_ids, 7:13] = torch_rand_float(-0.5, 0.5,
(len(env_ids), 6), device=self.device) # [7:10]: lin vel, [10:13]: ang vel
env_ids_int32 = env_ids.to(dtype=torch.int32)
self.gym.set_actor_root_state_tensor_indexed(self.sim, gymtorch.unwrap_tensor(self.root_states), gymtorch.unwrap_tensor(env_ids_int32), len(env_ids_int32))

def _push_robots(self):
""" Randomly pushes the robots. Emulates an impulse by setting a randomized base velocity.
"""
max_vel = self.cfg.domain_rand.max_push_vel_xy
self.root_states[:, 7:9] = torch_rand_float(-max_vel, max_vel,
(self.num_envs, 2), device=self.device) # lin vel x/y
self.gym.set_actor_root_state_tensor(self.sim,
gymtorch.unwrap_tensor(self.root_states))

def _disturbance_robots(self):
""" Randomly adds a disturbance force to the robots.
"""
disturbance = torch_rand_float(self.cfg.domain_rand.disturbance_range[0],
self.cfg.domain_rand.disturbance_range[1], (self.num_envs, 3), device=self.device)
self.disturbance[:, 0, :] = disturbance
self.gym.apply_rigid_body_force_tensors(self.sim,
forceTensor=gymtorch.unwrap_tensor(self.disturbance),
space=gymapi.CoordinateSpace.LOCAL_SPACE)

def _update_terrain_curriculum(self, env_ids):


""" Implements the game-inspired curriculum.

Args:
env_ids (List[int]): ids of environments being reset
"""
# Implement Terrain curriculum
if not self.init_done:
# don't change on initial reset
return
distance = torch.norm(self.root_states[env_ids, :2] -
self.env_origins[env_ids, :2], dim=1)
# robots that walked far enough progress to harder terrains
move_up = distance > self.terrain.env_length / 2
# robots that walked less than half of their required distance go to simpler terrains
move_down = (distance < torch.norm(self.commands[env_ids, :2],
dim=1)*self.max_episode_length_s*0.5) * ~move_up
self.terrain_levels[env_ids] += 1 * move_up - 1 * move_down
# Robots that solve the last level are sent to a random one
self.terrain_levels[env_ids] = torch.where(self.terrain_levels[env_ids]>=self.max_terrain_level,
torch.randint_like(self.terrain_levels[env_ids], self.max_terrain_level),
torch.clip(self.terrain_levels[env_ids], 0)) # (the minimum level is zero)
self.env_origins[env_ids] = self.terrain_origins[self.terrain_levels[env_ids], self.terrain_types[env_ids]]

def update_command_curriculum(self, env_ids):


""" Implements a curriculum of increasing commands

Args:
env_ids (List[int]): ids of environments being reset
"""
low_vel_env_ids = (env_ids > (self.num_envs * 0.2))
high_vel_env_ids = (env_ids < (self.num_envs * 0.2))
low_vel_env_ids = env_ids[low_vel_env_ids.nonzero(as_tuple=True)]
high_vel_env_ids = env_ids[high_vel_env_ids.nonzero(as_tuple=True)]
# If the tracking reward is above 80% of the maximum, increase the range of commands
if (torch.mean(self.episode_sums["tracking_lin_vel"][low_vel_env_ids]) / self.max_episode_length > 0.8 * self.reward_scales["tracking_lin_vel"]) and (torch.mean(self.episode_sums["tracking_lin_vel"][high_vel_env_ids]) / self.max_episode_length > 0.8 * self.reward_scales["tracking_lin_vel"]):
self.command_ranges["lin_vel_x"][0] = np.clip(self.command_ranges["lin_vel_x"][0] - 0.2, -self.cfg.commands.max_curriculum, 0.)
self.command_ranges["lin_vel_x"][1] = np.clip(self.command_ranges["lin_vel_x"][1] + 0.2, 0., self.cfg.commands.max_curriculum)

def _get_noise_scale_vec(self, cfg):


""" Sets a vector used to scale the noise added to the observations.
[NOTE]: Must be adapted when changing the observations structure

Args:
cfg (Dict): Environment config file

Returns:
[torch.Tensor]: Vector of scales used to multiply a uniform
distribution in [-1, 1]
"""
# noise_vec = torch.zeros_like(self.obs_buf[0])
if self.cfg.terrain.measure_heights:
noise_vec = torch.zeros(9 + 3*self.num_actions + 187,
device=self.device)
else:
noise_vec = torch.zeros(9 + 3*self.num_actions, device=self.device)
self.add_noise = self.cfg.noise.add_noise
noise_scales = self.cfg.noise.noise_scales
noise_level = self.cfg.noise.noise_level
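# Layout of the one-step observation, which this noise vector mirrors
# (na = num_actions):
# [0:3] commands, [3:6] base ang vel, [6:9] projected gravity,
# [9:9+na] dof pos, [9+na:9+2na] dof vel, [9+2na:9+3na] previous actions,
# plus 187 height measurements when terrain.measure_heights is enabled
# (187 presumably matches the measured_points_x/y grid defined in the cfg).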
noise_vec[0:3] = 0. # commands
noise_vec[3:6] = noise_scales.ang_vel * noise_level * self.obs_scales.ang_vel
noise_vec[6:9] = noise_scales.gravity * noise_level
noise_vec[9:(9 + self.num_actions)] = noise_scales.dof_pos * noise_level * self.obs_scales.dof_pos
noise_vec[(9 + self.num_actions):(9 + 2 * self.num_actions)] = noise_scales.dof_vel * noise_level * self.obs_scales.dof_vel
noise_vec[(9 + 2 * self.num_actions):(9 + 3 * self.num_actions)] = 0. # previous actions
if self.cfg.terrain.measure_heights:
noise_vec[(9 + 3 * self.num_actions):(9 + 3 * self.num_actions + 187)] = noise_scales.height_measurements * noise_level * self.obs_scales.height_measurements
#noise_vec[232:] = 0
return noise_vec

#----------------------------------------
def _init_buffers(self):
""" Initialize torch tensors which will contain simulation states and
processed quantities
"""
# get gym GPU state tensors
actor_root_state = self.gym.acquire_actor_root_state_tensor(self.sim)
dof_state_tensor = self.gym.acquire_dof_state_tensor(self.sim)
net_contact_forces = self.gym.acquire_net_contact_force_tensor(self.sim)
rigid_body_state = self.gym.acquire_rigid_body_state_tensor(self.sim)
self.gym.refresh_dof_state_tensor(self.sim)
self.gym.refresh_actor_root_state_tensor(self.sim)
self.gym.refresh_net_contact_force_tensor(self.sim)
self.gym.refresh_rigid_body_state_tensor(self.sim)

# create some wrapper tensors for different slices


self.root_states = gymtorch.wrap_tensor(actor_root_state)
self.dof_state = gymtorch.wrap_tensor(dof_state_tensor)
self.rigid_body_states = gymtorch.wrap_tensor(rigid_body_state)
self.dof_pos = self.dof_state.view(self.num_envs, self.num_dof, 2)[..., 0]
self.dof_vel = self.dof_state.view(self.num_envs, self.num_dof, 2)[..., 1]
self.base_quat = self.root_states[:, 3:7]
self.feet_pos = self.rigid_body_states.view(self.num_envs, self.num_bodies,
13)[:, self.feet_indices, 0:3]
self.feet_vel = self.rigid_body_states.view(self.num_envs, self.num_bodies,
13)[:, self.feet_indices, 7:10]

self.contact_forces = gymtorch.wrap_tensor(net_contact_forces).view(self.num_envs, -1, 3) # shape: num_envs, num_bodies, xyz axis

# initialize some data used later on


self.common_step_counter = 0
self.extras = {}
self.noise_scale_vec = self._get_noise_scale_vec(self.cfg)
self.gravity_vec = to_torch(get_axis_params(-1., self.up_axis_idx),
device=self.device).repeat((self.num_envs, 1))
self.forward_vec = to_torch([1., 0., 0.],
device=self.device).repeat((self.num_envs, 1))
self.torques = torch.zeros(self.num_envs, self.num_actions,
dtype=torch.float, device=self.device, requires_grad=False)
self.p_gains = torch.zeros(self.num_actions, dtype=torch.float,
device=self.device, requires_grad=False)
self.d_gains = torch.zeros(self.num_actions, dtype=torch.float,
device=self.device, requires_grad=False)
self.actions = torch.zeros(self.num_envs, self.num_actions,
dtype=torch.float, device=self.device, requires_grad=False)
self.last_actions = torch.zeros(self.num_envs, self.num_actions,
dtype=torch.float, device=self.device, requires_grad=False)
self.last_last_actions = torch.zeros(self.num_envs, self.num_actions,
dtype=torch.float, device=self.device, requires_grad=False)
self.last_dof_vel = torch.zeros_like(self.dof_vel)
self.last_root_vel = torch.zeros_like(self.root_states[:, 7:13])
self.commands = torch.zeros(self.num_envs, self.cfg.commands.num_commands, dtype=torch.float, device=self.device, requires_grad=False) # x vel, y vel, yaw vel, heading
self.commands_scale = torch.tensor([self.obs_scales.lin_vel,
self.obs_scales.lin_vel, self.obs_scales.ang_vel], device=self.device,
requires_grad=False,) # TODO change this
self.feet_air_time = torch.zeros(self.num_envs, self.feet_indices.shape[0],
dtype=torch.float, device=self.device, requires_grad=False)
self.last_contacts = torch.zeros(self.num_envs, len(self.feet_indices),
dtype=torch.bool, device=self.device, requires_grad=False)
self.base_lin_vel = quat_rotate_inverse(self.base_quat, self.root_states[:,
7:10])
self.base_ang_vel = quat_rotate_inverse(self.base_quat, self.root_states[:,
10:13])
self.projected_gravity = quat_rotate_inverse(self.base_quat,
self.gravity_vec)
if self.cfg.terrain.measure_heights:
self.height_points = self._init_height_points()
self.measured_heights = self._get_heights()
self.base_height_points = self._init_base_height_points()

# joint positions offsets and PD gains


self.default_dof_pos = torch.zeros(self.num_dof, dtype=torch.float,
device=self.device, requires_grad=False)
for i in range(self.num_dofs):
name = self.dof_names[i]
angle = self.cfg.init_state.default_joint_angles[name]
self.default_dof_pos[i] = angle
found = False
for dof_name in self.cfg.control.stiffness.keys():
if dof_name in name:
self.p_gains[i] = self.cfg.control.stiffness[dof_name]
self.d_gains[i] = self.cfg.control.damping[dof_name]
found = True
if not found:
self.p_gains[i] = 0.
self.d_gains[i] = 0.
if self.cfg.control.control_type in ["P", "V"]:
print(f"PD gains of joint {name} were not defined, setting them to zero")
self.default_dof_pos = self.default_dof_pos.unsqueeze(0)

#randomize kp, kd, motor strength


self.Kp_factors = torch.ones(self.num_envs, 1, dtype=torch.float,
device=self.device, requires_grad=False)
self.Kd_factors = torch.ones(self.num_envs, 1, dtype=torch.float,
device=self.device, requires_grad=False)
self.motor_strength_factors = torch.ones(self.num_envs, 1,
dtype=torch.float, device=self.device, requires_grad=False)
self.payload = torch.zeros(self.num_envs, 1, dtype=torch.float,
device=self.device, requires_grad=False)
self.com_displacement = torch.zeros(self.num_envs, 3, dtype=torch.float,
device=self.device, requires_grad=False)
self.disturbance = torch.zeros(self.num_envs, self.num_bodies, 3,
dtype=torch.float, device=self.device, requires_grad=False)

if self.cfg.domain_rand.randomize_kp:
self.Kp_factors = torch_rand_float(self.cfg.domain_rand.kp_range[0],
self.cfg.domain_rand.kp_range[1], (self.num_envs, 1), device=self.device)
if self.cfg.domain_rand.randomize_kd:
self.Kd_factors = torch_rand_float(self.cfg.domain_rand.kd_range[0],
self.cfg.domain_rand.kd_range[1], (self.num_envs, 1), device=self.device)
if self.cfg.domain_rand.randomize_motor_strength:
self.motor_strength_factors = torch_rand_float(self.cfg.domain_rand.motor_strength_range[0], self.cfg.domain_rand.motor_strength_range[1], (self.num_envs, 1), device=self.device)
if self.cfg.domain_rand.randomize_payload_mass:
self.payload = torch_rand_float(self.cfg.domain_rand.payload_mass_range[0], self.cfg.domain_rand.payload_mass_range[1], (self.num_envs, 1), device=self.device)
if self.cfg.domain_rand.randomize_com_displacement:
self.com_displacement = torch_rand_float(self.cfg.domain_rand.com_displacement_range[0], self.cfg.domain_rand.com_displacement_range[1], (self.num_envs, 3), device=self.device)

#store friction and restitution


self.friction_coeffs = torch.ones(self.num_envs, 1, dtype=torch.float,
device=self.device, requires_grad=False)
self.restitution_coeffs = torch.zeros(self.num_envs, 1, dtype=torch.float,
device=self.device, requires_grad=False)

def _prepare_reward_function(self):
""" Prepares a list of reward functions, which will be called to compute the total reward.
Looks for self._reward_<REWARD_NAME>, where <REWARD_NAME> are names of
all non zero reward scales in the cfg.
"""
# remove zero scales + multiply non-zero ones by dt
for key in list(self.reward_scales.keys()):
scale = self.reward_scales[key]
if scale==0:
self.reward_scales.pop(key)
else:
self.reward_scales[key] *= self.dt
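# Multiplying each scale by dt makes the configured values per-second rates:
# e.g. a scale of 1.0 with dt = 0.02 s contributes 0.02 per control step,
# i.e. 1.0 per simulated second regardless of the step frequency.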
# prepare list of functions
self.reward_functions = []
self.reward_names = []
for name, scale in self.reward_scales.items():
if name=="termination":
continue
self.reward_names.append(name)
name = '_reward_' + name
self.reward_functions.append(getattr(self, name))

# reward episode sums


self.episode_sums = {name: torch.zeros(self.num_envs, dtype=torch.float,
device=self.device, requires_grad=False)
for name in self.reward_scales.keys()}

def _create_ground_plane(self):
""" Adds a ground plane to the simulation, sets friction and restitution
based on the cfg.
"""
plane_params = gymapi.PlaneParams()
plane_params.normal = gymapi.Vec3(0.0, 0.0, 1.0)
plane_params.static_friction = self.cfg.terrain.static_friction
plane_params.dynamic_friction = self.cfg.terrain.dynamic_friction
plane_params.restitution = self.cfg.terrain.restitution
self.gym.add_ground(self.sim, plane_params)

def _create_heightfield(self):
""" Adds a heightfield terrain to the simulation, sets parameters based on
the cfg.
"""
hf_params = gymapi.HeightFieldParams()
hf_params.column_scale = self.terrain.cfg.horizontal_scale
hf_params.row_scale = self.terrain.cfg.horizontal_scale
hf_params.vertical_scale = self.terrain.cfg.vertical_scale
hf_params.nbRows = self.terrain.tot_cols
hf_params.nbColumns = self.terrain.tot_rows
hf_params.transform.p.x = -self.terrain.cfg.border_size
hf_params.transform.p.y = -self.terrain.cfg.border_size
hf_params.transform.p.z = 0.0
hf_params.static_friction = self.cfg.terrain.static_friction
hf_params.dynamic_friction = self.cfg.terrain.dynamic_friction
hf_params.restitution = self.cfg.terrain.restitution

self.gym.add_heightfield(self.sim, self.terrain.heightsamples, hf_params)


self.height_samples = torch.tensor(self.terrain.heightsamples).view(self.terrain.tot_rows, self.terrain.tot_cols).to(self.device)

def _create_trimesh(self):
""" Adds a triangle mesh terrain to the simulation, sets parameters based on the cfg.
"""
tm_params = gymapi.TriangleMeshParams()
tm_params.nb_vertices = self.terrain.vertices.shape[0]
tm_params.nb_triangles = self.terrain.triangles.shape[0]

tm_params.transform.p.x = -self.terrain.cfg.border_size
tm_params.transform.p.y = -self.terrain.cfg.border_size
tm_params.transform.p.z = 0.0
tm_params.static_friction = self.cfg.terrain.static_friction
tm_params.dynamic_friction = self.cfg.terrain.dynamic_friction
tm_params.restitution = self.cfg.terrain.restitution
self.gym.add_triangle_mesh(self.sim,
self.terrain.vertices.flatten(order='C'),
self.terrain.triangles.flatten(order='C'), tm_params)
self.height_samples = torch.tensor(self.terrain.heightsamples).view(self.terrain.tot_rows, self.terrain.tot_cols).to(self.device)

def _create_envs(self):
""" Creates environments:
1. loads the robot URDF/MJCF asset,
2. For each environment
2.1 creates the environment,
2.2 calls DOF and Rigid shape properties callbacks,
2.3 create actor with these properties and add them to the env
3. Store indices of different bodies of the robot
"""
asset_path = self.cfg.asset.file.format(LEGGED_GYM_ROOT_DIR=LEGGED_GYM_ROOT_DIR)
asset_root = os.path.dirname(asset_path)
asset_file = os.path.basename(asset_path)

asset_options = gymapi.AssetOptions()
asset_options.default_dof_drive_mode = self.cfg.asset.default_dof_drive_mode
asset_options.collapse_fixed_joints = self.cfg.asset.collapse_fixed_joints
asset_options.replace_cylinder_with_capsule = self.cfg.asset.replace_cylinder_with_capsule
asset_options.flip_visual_attachments = self.cfg.asset.flip_visual_attachments
asset_options.fix_base_link = self.cfg.asset.fix_base_link
asset_options.density = self.cfg.asset.density
asset_options.angular_damping = self.cfg.asset.angular_damping
asset_options.linear_damping = self.cfg.asset.linear_damping
asset_options.max_angular_velocity = self.cfg.asset.max_angular_velocity
asset_options.max_linear_velocity = self.cfg.asset.max_linear_velocity
asset_options.armature = self.cfg.asset.armature
asset_options.thickness = self.cfg.asset.thickness
asset_options.disable_gravity = self.cfg.asset.disable_gravity

robot_asset = self.gym.load_asset(self.sim, asset_root, asset_file, asset_options)
self.num_dof = self.gym.get_asset_dof_count(robot_asset)
self.num_bodies = self.gym.get_asset_rigid_body_count(robot_asset)
dof_props_asset = self.gym.get_asset_dof_properties(robot_asset)
rigid_shape_props_asset = self.gym.get_asset_rigid_shape_properties(robot_asset)

# save body names from the asset


body_names = self.gym.get_asset_rigid_body_names(robot_asset)
self.dof_names = self.gym.get_asset_dof_names(robot_asset)
self.num_bodies = len(body_names)
self.num_dofs = len(self.dof_names)
feet_names = [s for s in body_names if self.cfg.asset.foot_name in s]
penalized_contact_names = []
for name in self.cfg.asset.penalize_contacts_on:
penalized_contact_names.extend([s for s in body_names if name in s])
termination_contact_names = []
for name in self.cfg.asset.terminate_after_contacts_on:
termination_contact_names.extend([s for s in body_names if name in s])

self.default_rigid_body_mass = torch.zeros(self.num_bodies,
dtype=torch.float, device=self.device, requires_grad=False)

base_init_state_list = self.cfg.init_state.pos + self.cfg.init_state.rot + self.cfg.init_state.lin_vel + self.cfg.init_state.ang_vel
self.base_init_state = to_torch(base_init_state_list, device=self.device,
requires_grad=False)
start_pose = gymapi.Transform()
start_pose.p = gymapi.Vec3(*self.base_init_state[:3])

self._get_env_origins()
env_lower = gymapi.Vec3(0., 0., 0.)
env_upper = gymapi.Vec3(0., 0., 0.)
self.actor_handles = []
self.envs = []

self.payload = torch.zeros(self.num_envs, 1, dtype=torch.float, device=self.device, requires_grad=False)
self.com_displacement = torch.zeros(self.num_envs, 3, dtype=torch.float,
device=self.device, requires_grad=False)
if self.cfg.domain_rand.randomize_payload_mass:
self.payload = torch_rand_float(self.cfg.domain_rand.payload_mass_range[0], self.cfg.domain_rand.payload_mass_range[1], (self.num_envs, 1), device=self.device)
if self.cfg.domain_rand.randomize_com_displacement:
self.com_displacement = torch_rand_float(self.cfg.domain_rand.com_displacement_range[0], self.cfg.domain_rand.com_displacement_range[1], (self.num_envs, 3), device=self.device)

for i in range(self.num_envs):
# create env instance
env_handle = self.gym.create_env(self.sim, env_lower, env_upper,
int(np.sqrt(self.num_envs)))
pos = self.env_origins[i].clone()
pos[:2] += torch_rand_float(-1., 1., (2,1),
device=self.device).squeeze(1)
start_pose.p = gymapi.Vec3(*pos)

rigid_shape_props = self._process_rigid_shape_props(rigid_shape_props_asset, i)
self.gym.set_asset_rigid_shape_properties(robot_asset,
rigid_shape_props)
actor_handle = self.gym.create_actor(env_handle, robot_asset,
start_pose, self.cfg.asset.name, i, self.cfg.asset.self_collisions, 0)
dof_props = self._process_dof_props(dof_props_asset, i)
self.gym.set_actor_dof_properties(env_handle, actor_handle, dof_props)
body_props = self.gym.get_actor_rigid_body_properties(env_handle,
actor_handle)

if i == 0:
for j in range(len(body_props)):
self.default_rigid_body_mass[j] = body_props[j].mass

body_props = self._process_rigid_body_props(body_props, i)
self.gym.set_actor_rigid_body_properties(env_handle, actor_handle,
body_props, recomputeInertia=True)
self.envs.append(env_handle)
self.actor_handles.append(actor_handle)

self.feet_indices = torch.zeros(len(feet_names), dtype=torch.long, device=self.device, requires_grad=False)
for i in range(len(feet_names)):
self.feet_indices[i] = self.gym.find_actor_rigid_body_handle(self.envs[0], self.actor_handles[0], feet_names[i])

self.penalised_contact_indices = torch.zeros(len(penalized_contact_names), dtype=torch.long, device=self.device, requires_grad=False)
for i in range(len(penalized_contact_names)):
self.penalised_contact_indices[i] = self.gym.find_actor_rigid_body_handle(self.envs[0], self.actor_handles[0], penalized_contact_names[i])

self.termination_contact_indices = torch.zeros(len(termination_contact_names), dtype=torch.long, device=self.device, requires_grad=False)
for i in range(len(termination_contact_names)):
self.termination_contact_indices[i] = self.gym.find_actor_rigid_body_handle(self.envs[0], self.actor_handles[0], termination_contact_names[i])

def _get_env_origins(self):
""" Sets environment origins. On rough terrain the origins are defined by
the terrain platforms.
Otherwise create a grid.
"""
if self.cfg.terrain.mesh_type in ["heightfield", "trimesh"]:
self.custom_origins = True
self.env_origins = torch.zeros(self.num_envs, 3, device=self.device,
requires_grad=False)
# put robots at the origins defined by the terrain
max_init_level = self.cfg.terrain.max_init_terrain_level
if not self.cfg.terrain.curriculum: max_init_level = self.cfg.terrain.num_rows - 1
self.terrain_levels = torch.randint(0, max_init_level+1,
(self.num_envs,), device=self.device)
self.terrain_types = torch.div(torch.arange(self.num_envs,
device=self.device), (self.num_envs/self.cfg.terrain.num_cols),
rounding_mode='floor').to(torch.long)
self.max_terrain_level = self.cfg.terrain.num_rows
self.terrain_origins = torch.from_numpy(self.terrain.env_origins).to(self.device).to(torch.float)
self.env_origins[:] = self.terrain_origins[self.terrain_levels,
self.terrain_types]
else:
self.custom_origins = False
self.env_origins = torch.zeros(self.num_envs, 3, device=self.device,
requires_grad=False)
# create a grid of robots
num_cols = np.floor(np.sqrt(self.num_envs))
num_rows = np.ceil(self.num_envs / num_cols)
xx, yy = torch.meshgrid(torch.arange(num_rows), torch.arange(num_cols))
spacing = self.cfg.env.env_spacing
self.env_origins[:, 0] = spacing * xx.flatten()[:self.num_envs]
self.env_origins[:, 1] = spacing * yy.flatten()[:self.num_envs]
self.env_origins[:, 2] = 0.

def _parse_cfg(self, cfg):


self.dt = self.cfg.control.decimation * self.sim_params.dt
self.obs_scales = self.cfg.normalization.obs_scales
self.reward_scales = class_to_dict(self.cfg.rewards.scales)
self.command_ranges = class_to_dict(self.cfg.commands.ranges)
if self.cfg.terrain.mesh_type not in ['heightfield', 'trimesh']:
self.cfg.terrain.curriculum = False
self.max_episode_length_s = self.cfg.env.episode_length_s
self.max_episode_length = np.ceil(self.max_episode_length_s / self.dt)
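# For example, with decimation = 4 and a 0.005 s sim step, dt = 0.02 s
# (a 50 Hz policy), and episode_length_s = 20 s then gives
# max_episode_length = 1000 control steps (illustrative values; the
# actual numbers come from the cfg).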

self.cfg.domain_rand.push_interval = np.ceil(self.cfg.domain_rand.push_interval_s / self.dt)

def _draw_debug_vis(self):
""" Draws visualizations for debugging (slows down simulation a lot).
Default behaviour: draws height measurement points
"""
# draw height lines
if not self.terrain.cfg.measure_heights:
return
self.gym.clear_lines(self.viewer)
self.gym.refresh_rigid_body_state_tensor(self.sim)
sphere_geom = gymutil.WireframeSphereGeometry(0.02, 4, 4, None, color=(1,
1, 0))
for i in range(self.num_envs):
base_pos = (self.root_states[i, :3]).cpu().numpy()
heights = self.measured_heights[i].cpu().numpy()
height_points = quat_apply_yaw(self.base_quat[i].repeat(heights.shape[0]), self.height_points[i]).cpu().numpy()
for j in range(heights.shape[0]):
x = height_points[j, 0] + base_pos[0]
y = height_points[j, 1] + base_pos[1]
z = heights[j]
sphere_pose = gymapi.Transform(gymapi.Vec3(x, y, z), r=None)
gymutil.draw_lines(sphere_geom, self.gym, self.viewer,
self.envs[i], sphere_pose)

def _init_height_points(self):
""" Returns points at which the height measurements are sampled (in base frame)

Returns:
[torch.Tensor]: Tensor of shape (num_envs, self.num_height_points, 3)
"""
y = torch.tensor(self.cfg.terrain.measured_points_y, device=self.device,
requires_grad=False)
x = torch.tensor(self.cfg.terrain.measured_points_x, device=self.device,
requires_grad=False)
grid_x, grid_y = torch.meshgrid(x, y)

self.num_height_points = grid_x.numel()
points = torch.zeros(self.num_envs, self.num_height_points, 3,
device=self.device, requires_grad=False)
points[:, :, 0] = grid_x.flatten()
points[:, :, 1] = grid_y.flatten()
return points

def _init_base_height_points(self):
""" Returns points at which the height measurements are sampled (in base frame)

Returns:
[torch.Tensor]: Tensor of shape (num_envs, self.num_base_height_points,
3)
"""
y = torch.tensor([-0.2, -0.15, -0.1, -0.05, 0., 0.05, 0.1, 0.15, 0.2],
device=self.device, requires_grad=False)
x = torch.tensor([-0.15, -0.1, -0.05, 0., 0.05, 0.1, 0.15],
device=self.device, requires_grad=False)
grid_x, grid_y = torch.meshgrid(x, y)

self.num_base_height_points = grid_x.numel()
points = torch.zeros(self.num_envs, self.num_base_height_points, 3,
device=self.device, requires_grad=False)
points[:, :, 0] = grid_x.flatten()
points[:, :, 1] = grid_y.flatten()
return points

def _get_heights(self, env_ids=None):


""" Samples heights of the terrain at required points around each robot.
The points are offset by the base's position and rotated by the base's
yaw

Args:
env_ids (List[int], optional): Subset of environments for which to
return the heights. Defaults to None.

Raises:
NameError: [description]

Returns:
[type]: [description]
"""
if self.cfg.terrain.mesh_type == 'plane':
return torch.zeros(self.num_envs, self.num_height_points,
device=self.device, requires_grad=False)
elif self.cfg.terrain.mesh_type == 'none':
raise NameError("Can't measure height with terrain mesh type 'none'")

if env_ids:
points = quat_apply_yaw(self.base_quat[env_ids].repeat(1, self.num_height_points), self.height_points[env_ids]) + (self.root_states[env_ids, :3]).unsqueeze(1)
else:
points = quat_apply_yaw(self.base_quat.repeat(1, self.num_height_points), self.height_points) + (self.root_states[:, :3]).unsqueeze(1)

points += self.terrain.cfg.border_size
points = (points/self.terrain.cfg.horizontal_scale).long()
px = points[:, :, 0].view(-1)
py = points[:, :, 1].view(-1)
px = torch.clip(px, 0, self.height_samples.shape[0]-2)
py = torch.clip(py, 0, self.height_samples.shape[1]-2)

heights1 = self.height_samples[px, py]


heights2 = self.height_samples[px+1, py]
heights3 = self.height_samples[px, py+1]
heights = torch.min(heights1, heights2)
heights = torch.min(heights, heights3)
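# The height at each query point is the min over the cell and its +x/+y
# neighbours on the discretized height map, a conservative (lowest) estimate.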

return heights.view(self.num_envs, -1) * self.terrain.cfg.vertical_scale

def _get_base_heights(self, env_ids=None):


""" Samples heights of the terrain at required points around each robot.
The points are offset by the base's position and rotated by the base's
yaw

Args:
env_ids (List[int], optional): Subset of environments for which to
return the heights. Defaults to None.

Raises:
NameError: [description]

Returns:
[type]: [description]
"""
if self.cfg.terrain.mesh_type == 'plane':
return self.root_states[:, 2].clone()
elif self.cfg.terrain.mesh_type == 'none':
raise NameError("Can't measure height with terrain mesh type 'none'")
if env_ids:
points = quat_apply_yaw(self.base_quat[env_ids].repeat(1, self.num_base_height_points), self.base_height_points[env_ids]) + (self.root_states[env_ids, :3]).unsqueeze(1)
else:
points = quat_apply_yaw(self.base_quat.repeat(1, self.num_base_height_points), self.base_height_points) + (self.root_states[:, :3]).unsqueeze(1)

points += self.terrain.cfg.border_size
points = (points/self.terrain.cfg.horizontal_scale).long()
px = points[:, :, 0].view(-1)
py = points[:, :, 1].view(-1)
px = torch.clip(px, 0, self.height_samples.shape[0]-2)
py = torch.clip(py, 0, self.height_samples.shape[1]-2)

heights1 = self.height_samples[px, py]


heights2 = self.height_samples[px+1, py]
heights3 = self.height_samples[px, py+1]
heights = torch.min(heights1, heights2)
heights = torch.min(heights, heights3)
# heights = (heights1 + heights2 + heights3) / 3

base_height = heights.view(self.num_envs, -1) * self.terrain.cfg.vertical_scale
base_height = torch.mean(self.root_states[:, 2].unsqueeze(1) - base_height, dim=1)

return base_height

def _get_feet_heights(self, env_ids=None):


""" Samples heights of the terrain at required points around each robot.
The points are offset by the base's position and rotated by the base's
yaw

Args:
env_ids (List[int], optional): Subset of environments for which to
return the heights. Defaults to None.

Raises:
NameError: [description]

Returns:
[type]: [description]
"""
if self.cfg.terrain.mesh_type == 'plane':
return self.feet_pos[:, :, 2].clone()
elif self.cfg.terrain.mesh_type == 'none':
raise NameError("Can't measure height with terrain mesh type 'none'")

if env_ids:
points = self.feet_pos[env_ids].clone()
else:
points = self.feet_pos.clone()

points += self.terrain.cfg.border_size
points = (points/self.terrain.cfg.horizontal_scale).long()
px = points[:, :, 0].view(-1)
py = points[:, :, 1].view(-1)
px = torch.clip(px, 0, self.height_samples.shape[0]-2)
py = torch.clip(py, 0, self.height_samples.shape[1]-2)

heights1 = self.height_samples[px, py]


heights2 = self.height_samples[px+1, py]
heights3 = self.height_samples[px, py+1]
# heights = torch.min(heights1, heights2)
# heights = torch.min(heights, heights3)
heights = (heights1 + heights2 + heights3) / 3

heights = heights.view(self.num_envs, -1) * self.terrain.cfg.vertical_scale

feet_height = self.feet_pos[:, :, 2] - heights

return feet_height

#------------ reward functions----------------


def _reward_tracking_lin_vel(self):
# Tracking of linear velocity commands (xy axes)
lin_vel_error = torch.sum(torch.square(self.commands[:, :2] -
self.base_lin_vel[:, :2]), dim=1)
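# reward = exp(-||cmd_xy - v_xy||^2 / tracking_sigma): equals 1 for perfect
# tracking and decays smoothly with the squared velocity error.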
return torch.exp(-lin_vel_error/self.cfg.rewards.tracking_sigma)

def _reward_tracking_ang_vel(self):
# Tracking of angular velocity commands (yaw)
ang_vel_error = torch.square(self.commands[:, 2] - self.base_ang_vel[:, 2])
return torch.exp(-ang_vel_error/self.cfg.rewards.tracking_sigma)

def _reward_lin_vel_z(self):
# Penalize z axis base linear velocity
return torch.square(self.base_lin_vel[:, 2])

def _reward_ang_vel_xy(self):
# Penalize xy axes base angular velocity
return torch.sum(torch.square(self.base_ang_vel[:, :2]), dim=1)

def _reward_orientation(self):
# Penalize non flat base orientation
return torch.sum(torch.square(self.projected_gravity[:, :2]), dim=1)

def _reward_dof_acc(self):
# Penalize dof accelerations
return torch.sum(torch.square((self.last_dof_vel - self.dof_vel) /
self.dt), dim=1)

def _reward_joint_power(self):
# Penalize high power
return torch.sum(torch.abs(self.dof_vel) * torch.abs(self.torques), dim=1)

def _reward_base_height(self):
# Penalize base height away from target
base_height = self._get_base_heights()
return torch.square(base_height - self.cfg.rewards.base_height_target)

def _reward_foot_clearance(self):
cur_footpos_translated = self.feet_pos - self.root_states[:,
0:3].unsqueeze(1)
footpos_in_body_frame = torch.zeros(self.num_envs, len(self.feet_indices),
3, device=self.device)
cur_footvel_translated = self.feet_vel - self.root_states[:,
7:10].unsqueeze(1)
footvel_in_body_frame = torch.zeros(self.num_envs, len(self.feet_indices),
3, device=self.device)
for i in range(len(self.feet_indices)):
footpos_in_body_frame[:, i, :] = quat_rotate_inverse(self.base_quat,
cur_footpos_translated[:, i, :])
footvel_in_body_frame[:, i, :] = quat_rotate_inverse(self.base_quat,
cur_footvel_translated[:, i, :])

height_error = torch.square(footpos_in_body_frame[:, :, 2] -
self.cfg.rewards.clearance_height_target).view(self.num_envs, -1)
foot_lateral_vel = torch.sqrt(torch.sum(torch.square(footvel_in_body_frame[:, :, :2]), dim=2)).view(self.num_envs, -1)
return torch.sum(height_error * foot_lateral_vel, dim=1)

def _reward_action_rate(self):
# Penalize changes in actions
return torch.sum(torch.square(self.last_actions - self.actions), dim=1)

def _reward_smoothness(self):
# second order smoothness
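# Equivalent to ||a_t - 2*a_(t-1) + a_(t-2)||^2, a discrete second
# derivative of the action sequence (penalizes jerky action changes).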
return torch.sum(torch.square(self.actions - self.last_actions -
self.last_actions + self.last_last_actions), dim=1)

def _reward_torques(self):
# Penalize torques
return torch.sum(torch.square(self.torques), dim=1)

def _reward_dof_vel(self):
# Penalize dof velocities
return torch.sum(torch.square(self.dof_vel), dim=1)

def _reward_collision(self):
# Penalize collisions on selected bodies
return torch.sum(1.*(torch.norm(self.contact_forces[:,
self.penalised_contact_indices, :], dim=-1) > 0.1), dim=1)

def _reward_termination(self):
# Terminal reward / penalty
return self.reset_buf * ~self.time_out_buf

def _reward_dof_pos_limits(self):
# Penalize dof positions too close to the limit
out_of_limits = -(self.dof_pos - self.dof_pos_limits[:, 0]).clip(max=0.) # lower limit
out_of_limits += (self.dof_pos - self.dof_pos_limits[:, 1]).clip(min=0.)
return torch.sum(out_of_limits, dim=1)

def _reward_dof_vel_limits(self):
# Penalize dof velocities too close to the limit
# clip to max error = 1 rad/s per joint to avoid huge penalties
return torch.sum((torch.abs(self.dof_vel) -
self.dof_vel_limits*self.cfg.rewards.soft_dof_vel_limit).clip(min=0., max=1.),
dim=1)

def _reward_torque_limits(self):
# penalize torques too close to the limit
return torch.sum((torch.abs(self.torques) -
self.torque_limits*self.cfg.rewards.soft_torque_limit).clip(min=0.), dim=1)

def _reward_feet_air_time(self):
# Reward long steps
# Need to filter the contacts because the contact reporting of PhysX is unreliable on meshes
contact = self.contact_forces[:, self.feet_indices, 2] > 1.
contact_filt = torch.logical_or(contact, self.last_contacts)
self.last_contacts = contact
first_contact = (self.feet_air_time > 0.) * contact_filt
self.feet_air_time += self.dt
rew_airTime = torch.sum((self.feet_air_time - 0.5) * first_contact, dim=1)
# reward only on first contact with the ground
rew_airTime *= torch.norm(self.commands[:, :2], dim=1) > 0.1 # no reward for zero command
self.feet_air_time *= ~contact_filt
return rew_airTime

def _reward_stumble(self):
# Penalize feet hitting vertical surfaces
return torch.any(torch.norm(self.contact_forces[:, self.feet_indices, :2],
dim=2) >\
5 *torch.abs(self.contact_forces[:, self.feet_indices, 2]), dim=1)

def _reward_stand_still(self):
# Penalize motion at zero commands
return torch.sum(torch.abs(self.dof_pos - self.default_dof_pos), dim=1) * (torch.norm(self.commands[:, :2], dim=1) < 0.1)

def _reward_feet_contact_forces(self):
# penalize high contact forces
return torch.sum((torch.norm(self.contact_forces[:, self.feet_indices, :],
dim=-1) - self.cfg.rewards.max_contact_force).clip(min=0.), dim=1)
