2024-01-28 17:11:38 +08:00
|
|
|
import time
|
|
|
|
|
|
|
|
import lcm
|
|
|
|
import numpy as np
|
|
|
|
import torch
|
|
|
|
# import cv2
|
|
|
|
|
|
|
|
from go2_gym_deploy.lcm_types.pd_tau_targets_lcmt import pd_tau_targets_lcmt
|
|
|
|
|
|
|
|
lc = lcm.LCM("udpm://239.255.76.67:7667?ttl=255")
|
|
|
|
|
|
|
|
|
|
|
|
def class_to_dict(obj) -> dict:
|
|
|
|
if not hasattr(obj, "__dict__"):
|
|
|
|
return obj
|
|
|
|
result = {}
|
|
|
|
for key in dir(obj):
|
|
|
|
if key.startswith("_") or key == "terrain":
|
|
|
|
continue
|
|
|
|
element = []
|
|
|
|
val = getattr(obj, key)
|
|
|
|
if isinstance(val, list):
|
|
|
|
for item in val:
|
|
|
|
element.append(class_to_dict(item))
|
|
|
|
else:
|
|
|
|
element = class_to_dict(val)
|
|
|
|
result[key] = element
|
|
|
|
return result
|
|
|
|
|
|
|
|
|
|
|
|
class LCMAgent():
|
|
|
|
def __init__(self, cfg, se, command_profile):
|
|
|
|
if not isinstance(cfg, dict):
|
|
|
|
cfg = class_to_dict(cfg)
|
|
|
|
self.cfg = cfg
|
|
|
|
self.se = se
|
|
|
|
self.command_profile = command_profile
|
|
|
|
|
|
|
|
self.dt = self.cfg["control"]["decimation"] * self.cfg["sim"]["dt"]
|
|
|
|
self.timestep = 0
|
|
|
|
|
|
|
|
self.num_obs = self.cfg["env"]["num_observations"]
|
|
|
|
self.num_envs = 1
|
|
|
|
self.num_privileged_obs = self.cfg["env"]["num_privileged_obs"]
|
|
|
|
self.num_actions = self.cfg["env"]["num_actions"]
|
|
|
|
self.num_commands = self.cfg["commands"]["num_commands"]
|
|
|
|
self.device = 'cpu'
|
|
|
|
|
|
|
|
if "obs_scales" in self.cfg.keys():
|
|
|
|
self.obs_scales = self.cfg["obs_scales"]
|
|
|
|
else:
|
|
|
|
self.obs_scales = self.cfg["normalization"]["obs_scales"]
|
|
|
|
|
|
|
|
self.commands_scale = np.array(
|
|
|
|
[self.obs_scales["lin_vel"], self.obs_scales["lin_vel"],
|
|
|
|
self.obs_scales["ang_vel"], self.obs_scales["body_height_cmd"], 1, 1, 1, 1, 1,
|
|
|
|
self.obs_scales["footswing_height_cmd"], self.obs_scales["body_pitch_cmd"],
|
|
|
|
# 0, self.obs_scales["body_pitch_cmd"],
|
|
|
|
self.obs_scales["body_roll_cmd"], self.obs_scales["stance_width_cmd"],
|
|
|
|
self.obs_scales["stance_length_cmd"], self.obs_scales["aux_reward_cmd"], 1, 1, 1, 1, 1, 1
|
|
|
|
])[:self.num_commands]
|
|
|
|
|
|
|
|
|
|
|
|
joint_names = [
|
|
|
|
"FL_hip_joint", "FL_thigh_joint", "FL_calf_joint",
|
|
|
|
"FR_hip_joint", "FR_thigh_joint", "FR_calf_joint",
|
|
|
|
"RL_hip_joint", "RL_thigh_joint", "RL_calf_joint",
|
|
|
|
"RR_hip_joint", "RR_thigh_joint", "RR_calf_joint", ]
|
|
|
|
self.default_dof_pos = np.array([self.cfg["init_state"]["default_joint_angles"][name] for name in joint_names])
|
|
|
|
try:
|
|
|
|
self.default_dof_pos_scale = np.array([self.cfg["init_state"]["default_hip_scales"], self.cfg["init_state"]["default_thigh_scales"], self.cfg["init_state"]["default_calf_scales"],
|
|
|
|
self.cfg["init_state"]["default_hip_scales"], self.cfg["init_state"]["default_thigh_scales"], self.cfg["init_state"]["default_calf_scales"],
|
|
|
|
self.cfg["init_state"]["default_hip_scales"], self.cfg["init_state"]["default_thigh_scales"], self.cfg["init_state"]["default_calf_scales"],
|
|
|
|
self.cfg["init_state"]["default_hip_scales"], self.cfg["init_state"]["default_thigh_scales"], self.cfg["init_state"]["default_calf_scales"]])
|
|
|
|
except KeyError:
|
|
|
|
self.default_dof_pos_scale = np.ones(12)
|
|
|
|
self.default_dof_pos = self.default_dof_pos * self.default_dof_pos_scale
|
|
|
|
|
|
|
|
self.p_gains = np.zeros(12)
|
|
|
|
self.d_gains = np.zeros(12)
|
|
|
|
for i in range(12):
|
|
|
|
joint_name = joint_names[i]
|
|
|
|
found = False
|
|
|
|
for dof_name in self.cfg["control"]["stiffness"].keys():
|
|
|
|
if dof_name in joint_name:
|
|
|
|
self.p_gains[i] = self.cfg["control"]["stiffness"][dof_name]
|
|
|
|
self.d_gains[i] = self.cfg["control"]["damping"][dof_name]
|
|
|
|
found = True
|
|
|
|
if not found:
|
|
|
|
self.p_gains[i] = 0.
|
|
|
|
self.d_gains[i] = 0.
|
|
|
|
if self.cfg["control"]["control_type"] in ["P", "V"]:
|
|
|
|
print(f"PD gain of joint {joint_name} were not defined, setting them to zero")
|
|
|
|
|
|
|
|
print(f"p_gains: {self.p_gains}")
|
|
|
|
|
|
|
|
self.commands = np.zeros((1, self.num_commands))
|
|
|
|
self.actions = torch.zeros(12)
|
|
|
|
self.last_actions = torch.zeros(12)
|
|
|
|
self.gravity_vector = np.zeros(3)
|
|
|
|
self.dof_pos = np.zeros(12)
|
|
|
|
self.dof_vel = np.zeros(12)
|
|
|
|
self.body_linear_vel = np.zeros(3)
|
|
|
|
self.body_angular_vel = np.zeros(3)
|
|
|
|
self.joint_pos_target = np.zeros(12)
|
|
|
|
self.joint_vel_target = np.zeros(12)
|
|
|
|
self.torques = np.zeros(12)
|
|
|
|
self.contact_state = np.ones(4)
|
|
|
|
|
|
|
|
self.joint_idxs = self.se.joint_idxs
|
|
|
|
|
|
|
|
self.gait_indices = torch.zeros(self.num_envs, dtype=torch.float)
|
|
|
|
self.clock_inputs = torch.zeros(self.num_envs, 4, dtype=torch.float)
|
|
|
|
|
|
|
|
if "obs_scales" in self.cfg.keys():
|
|
|
|
self.obs_scales = self.cfg["obs_scales"]
|
|
|
|
else:
|
|
|
|
self.obs_scales = self.cfg["normalization"]["obs_scales"]
|
|
|
|
|
|
|
|
self.is_currently_probing = False
|
|
|
|
|
|
|
|
def set_probing(self, is_currently_probing):
|
|
|
|
self.is_currently_probing = is_currently_probing
|
|
|
|
|
|
|
|
def get_obs(self):
|
|
|
|
|
|
|
|
self.gravity_vector = self.se.get_gravity_vector()
|
|
|
|
cmds, reset_timer = self.command_profile.get_command(self.timestep * self.dt, probe=self.is_currently_probing)
|
|
|
|
self.commands[:, :] = cmds[:self.num_commands]
|
|
|
|
if reset_timer:
|
|
|
|
self.reset_gait_indices()
|
|
|
|
#else:
|
|
|
|
# self.commands[:, 0:3] = self.command_profile.get_command(self.timestep * self.dt)[0:3]
|
|
|
|
self.dof_pos = self.se.get_dof_pos()
|
|
|
|
self.dof_vel = self.se.get_dof_vel()
|
|
|
|
self.body_linear_vel = self.se.get_body_linear_vel()
|
|
|
|
self.body_angular_vel = self.se.get_body_angular_vel()
|
|
|
|
|
|
|
|
ob = np.concatenate((self.gravity_vector.reshape(1, -1),
|
|
|
|
self.commands * self.commands_scale,
|
|
|
|
(self.dof_pos - self.default_dof_pos).reshape(1, -1) * self.obs_scales["dof_pos"],
|
|
|
|
self.dof_vel.reshape(1, -1) * self.obs_scales["dof_vel"],
|
|
|
|
torch.clip(self.actions, -self.cfg["normalization"]["clip_actions"],
|
|
|
|
self.cfg["normalization"]["clip_actions"]).cpu().detach().numpy().reshape(1, -1)
|
|
|
|
), axis=1)
|
|
|
|
|
|
|
|
if self.cfg["env"]["observe_two_prev_actions"]:
|
|
|
|
ob = np.concatenate((ob,
|
|
|
|
self.last_actions.cpu().detach().numpy().reshape(1, -1)), axis=1)
|
|
|
|
|
|
|
|
if self.cfg["env"]["observe_clock_inputs"]:
|
|
|
|
ob = np.concatenate((ob,
|
|
|
|
self.clock_inputs), axis=1)
|
|
|
|
# print(self.clock_inputs)
|
|
|
|
|
|
|
|
if self.cfg["env"]["observe_vel"]:
|
|
|
|
ob = np.concatenate(
|
|
|
|
(self.body_linear_vel.reshape(1, -1) * self.obs_scales["lin_vel"],
|
|
|
|
self.body_angular_vel.reshape(1, -1) * self.obs_scales["ang_vel"],
|
|
|
|
ob), axis=1)
|
|
|
|
|
|
|
|
if self.cfg["env"]["observe_only_lin_vel"]:
|
|
|
|
ob = np.concatenate(
|
|
|
|
(self.body_linear_vel.reshape(1, -1) * self.obs_scales["lin_vel"],
|
|
|
|
ob), axis=1)
|
|
|
|
|
|
|
|
if self.cfg["env"]["observe_yaw"]:
|
|
|
|
heading = self.se.get_yaw()
|
|
|
|
ob = np.concatenate((ob, heading.reshape(1, -1)), axis=-1)
|
|
|
|
|
|
|
|
self.contact_state = self.se.get_contact_state()
|
|
|
|
if "observe_contact_states" in self.cfg["env"].keys() and self.cfg["env"]["observe_contact_states"]:
|
|
|
|
ob = np.concatenate((ob, self.contact_state.reshape(1, -1)), axis=-1)
|
|
|
|
|
|
|
|
if "terrain" in self.cfg.keys() and self.cfg["terrain"]["measure_heights"]:
|
|
|
|
robot_height = 0.25
|
|
|
|
self.measured_heights = np.zeros(
|
|
|
|
(len(self.cfg["terrain"]["measured_points_x"]), len(self.cfg["terrain"]["measured_points_y"]))).reshape(
|
|
|
|
1, -1)
|
|
|
|
heights = np.clip(robot_height - 0.5 - self.measured_heights, -1, 1.) * self.obs_scales["height_measurements"]
|
|
|
|
ob = np.concatenate((ob, heights), axis=1)
|
|
|
|
|
|
|
|
|
|
|
|
return torch.tensor(ob, device=self.device).float()
|
|
|
|
|
|
|
|
def get_privileged_observations(self):
|
|
|
|
return None
|
|
|
|
|
|
|
|
def publish_action(self, action, hard_reset=False):
|
|
|
|
|
|
|
|
command_for_robot = pd_tau_targets_lcmt()
|
|
|
|
self.joint_pos_target = \
|
|
|
|
(action[0, :12].detach().cpu().numpy() * self.cfg["control"]["action_scale"]).flatten()
|
|
|
|
self.joint_pos_target[[0, 3, 6, 9]] *= self.cfg["control"]["hip_scale_reduction"]
|
|
|
|
# self.joint_pos_target[[0, 3, 6, 9]] *= -1
|
|
|
|
self.joint_pos_target = self.joint_pos_target
|
|
|
|
self.joint_pos_target += self.default_dof_pos
|
|
|
|
joint_pos_target = self.joint_pos_target[self.joint_idxs]
|
|
|
|
self.joint_vel_target = np.zeros(12)
|
|
|
|
# print(f'cjp {self.joint_pos_target}')
|
|
|
|
|
|
|
|
command_for_robot.q_des = joint_pos_target
|
|
|
|
command_for_robot.qd_des = self.joint_vel_target
|
|
|
|
command_for_robot.kp = self.p_gains
|
|
|
|
command_for_robot.kd = self.d_gains
|
|
|
|
command_for_robot.tau_ff = np.zeros(12)
|
|
|
|
command_for_robot.se_contactState = np.zeros(4)
|
|
|
|
command_for_robot.timestamp_us = int(time.time() * 10 ** 6)
|
|
|
|
command_for_robot.id = 0
|
|
|
|
|
|
|
|
if hard_reset:
|
|
|
|
command_for_robot.id = -1
|
|
|
|
|
|
|
|
|
|
|
|
self.torques = (self.joint_pos_target - self.dof_pos) * self.p_gains + (self.joint_vel_target - self.dof_vel) * self.d_gains
|
|
|
|
# 由lcm将神经网络输出的action传入c++ sdk
|
|
|
|
lc.publish("pd_plustau_targets", command_for_robot.encode())
|
|
|
|
|
|
|
|
def reset(self):
|
|
|
|
self.actions = torch.zeros(12)
|
|
|
|
self.time = time.time()
|
|
|
|
self.timestep = 0
|
|
|
|
return self.get_obs()
|
|
|
|
|
|
|
|
def reset_gait_indices(self):
|
|
|
|
self.gait_indices = torch.zeros(self.num_envs, dtype=torch.float)
|
|
|
|
|
|
|
|
def step(self, actions, hard_reset=False):
|
|
|
|
clip_actions = self.cfg["normalization"]["clip_actions"]
|
|
|
|
self.last_actions = self.actions[:]
|
|
|
|
self.actions = torch.clip(actions[0:1, :], -clip_actions, clip_actions)
|
|
|
|
self.publish_action(self.actions, hard_reset=hard_reset)
|
|
|
|
time.sleep(max(self.dt - (time.time() - self.time), 0))
|
2024-03-16 15:09:49 +08:00
|
|
|
if self.timestep % 100 == 0: print(f'frq: {1 / (time.time() - self.time)} Hz')
|
2024-01-28 17:11:38 +08:00
|
|
|
self.time = time.time()
|
|
|
|
obs = self.get_obs()
|
|
|
|
|
|
|
|
# clock accounting
|
|
|
|
frequencies = self.commands[:, 4]
|
|
|
|
phases = self.commands[:, 5]
|
|
|
|
offsets = self.commands[:, 6]
|
|
|
|
if self.num_commands == 8:
|
|
|
|
bounds = 0
|
|
|
|
durations = self.commands[:, 7]
|
|
|
|
else:
|
|
|
|
bounds = self.commands[:, 7]
|
|
|
|
durations = self.commands[:, 8]
|
|
|
|
self.gait_indices = torch.remainder(self.gait_indices + self.dt * frequencies, 1.0)
|
|
|
|
|
|
|
|
if "pacing_offset" in self.cfg["commands"] and self.cfg["commands"]["pacing_offset"]:
|
|
|
|
self.foot_indices = [self.gait_indices + phases + offsets + bounds,
|
|
|
|
self.gait_indices + bounds,
|
|
|
|
self.gait_indices + offsets,
|
|
|
|
self.gait_indices + phases]
|
|
|
|
else:
|
|
|
|
self.foot_indices = [self.gait_indices + phases + offsets + bounds,
|
|
|
|
self.gait_indices + offsets,
|
|
|
|
self.gait_indices + bounds,
|
|
|
|
self.gait_indices + phases]
|
|
|
|
self.clock_inputs[:, 0] = torch.sin(2 * np.pi * self.foot_indices[0])
|
|
|
|
self.clock_inputs[:, 1] = torch.sin(2 * np.pi * self.foot_indices[1])
|
|
|
|
self.clock_inputs[:, 2] = torch.sin(2 * np.pi * self.foot_indices[2])
|
|
|
|
self.clock_inputs[:, 3] = torch.sin(2 * np.pi * self.foot_indices[3])
|
|
|
|
|
|
|
|
# 注释掉了下面camera相关代码
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# images = {'front': self.se.get_camera_front(),
|
|
|
|
# 'bottom': self.se.get_camera_bottom(),
|
|
|
|
# 'rear': self.se.get_camera_rear(),
|
|
|
|
# 'left': self.se.get_camera_left(),
|
|
|
|
# 'right': self.se.get_camera_right()
|
|
|
|
# }
|
|
|
|
# downscale_factor = 2
|
|
|
|
# temporal_downscale = 3
|
|
|
|
|
|
|
|
# for k, v in images.items():
|
|
|
|
# if images[k] is not None:
|
|
|
|
# images[k] = cv2.resize(images[k], dsize=(images[k].shape[0]//downscale_factor, images[k].shape[1]//downscale_factor), interpolation=cv2.INTER_CUBIC)
|
|
|
|
# if self.timestep % temporal_downscale != 0:
|
|
|
|
# images[k] = None
|
|
|
|
#print(self.commands)
|
|
|
|
|
|
|
|
infos = {"joint_pos": self.dof_pos[np.newaxis, :],
|
|
|
|
"joint_vel": self.dof_vel[np.newaxis, :],
|
|
|
|
"joint_pos_target": self.joint_pos_target[np.newaxis, :],
|
|
|
|
"joint_vel_target": self.joint_vel_target[np.newaxis, :],
|
|
|
|
"body_linear_vel": self.body_linear_vel[np.newaxis, :],
|
|
|
|
"body_angular_vel": self.body_angular_vel[np.newaxis, :],
|
|
|
|
"contact_state": self.contact_state[np.newaxis, :],
|
|
|
|
"clock_inputs": self.clock_inputs[np.newaxis, :],
|
|
|
|
"body_linear_vel_cmd": self.commands[:, 0:2],
|
|
|
|
"body_angular_vel_cmd": self.commands[:, 2:],
|
|
|
|
"privileged_obs": None,
|
|
|
|
# -------------------------------------------
|
|
|
|
# "camera_image_front": images['front'],
|
|
|
|
# "camera_image_bottom": images['bottom'],
|
|
|
|
# "camera_image_rear": images['rear'],
|
|
|
|
# "camera_image_left": images['left'],
|
|
|
|
# "camera_image_right": images['right'],
|
|
|
|
}
|
|
|
|
|
|
|
|
self.timestep += 1
|
|
|
|
return obs, None, None, infos
|