feat: 1. Fix the lower/upper action-clipping bound order bug

2. ComputeTorques now returns the original (unclamped) value 3. Change the RobotState IMU fields to std::vector<T> 4. Update the RunModel, ComputeObservation, and Forward functions 5. Update the a1 .pt model
2024-05-27 17:36:41 +08:00 · 2024-05-27 17:36:41 +08:00 · 03cccc15db
parent 109ded0f12
commit 03cccc15db
7 changed files with 53 additions and 63 deletions
--- a/src/rl_sar/config.yaml
+++ b/src/rl_sar/config.yaml
@ -1,5 +1,5 @@
 a1:
-  model_name: "model_0522.pt"
+  model_name: "model_0526.pt"
  num_observations: 45
  clip_obs: 100.0
  clip_actions_lower: [-100, -100, -100, 
@ -34,7 +34,7 @@ a1:
  ang_vel_scale: 0.25
  dof_pos_scale: 1.0
  dof_vel_scale: 0.05
-  commands_scale: [2.0, 2.0, 0.5]
+  commands_scale: [2.0, 2.0, 1.0]
  torque_limits: [33.5, 33.5, 33.5, 
                  33.5, 33.5, 33.5, 
                  33.5, 33.5, 33.5, 
@ -52,10 +52,10 @@ gr1t1:
  model_name: "model_4000_jit.pt"
  num_observations: 39
  clip_obs: 100.0
  clip_actions_upper: [1.1391, 1.0491, 1.0491, 2.2691, 0.8691,
                       0.4391, 1.0491, 1.0491, 2.2691, 0.8691]
  clip_actions_lower: [-0.4391, -1.0491, -2.0991, -0.4391, -1.3991,
                       -1.1391, -1.0491, -2.0991, -0.4391, -1.3991]
  clip_actions_upper: [1.1391, 1.0491, 1.0491, 2.2691, 0.8691,
                       0.4391, 1.0491, 1.0491, 2.2691, 0.8691]
  rl_kp: [57.0, 43.0, 114.0, 114.0, 15.3, 
          57.0, 43.0, 114.0, 114.0, 15.3]
  rl_kd: [5.7, 4.3, 11.4, 11.4, 1.5, 
--- a/src/rl_sar/include/rl_real_a1.hpp
+++ b/src/rl_sar/include/rl_real_a1.hpp
@ -58,7 +58,6 @@ private:
    std::vector<double> mapped_joint_velocities;
    int command_mapping[12] = {3, 4, 5, 0, 1, 2, 9, 10, 11, 6, 7, 8};
    int state_mapping[12] = {3, 4, 5, 0, 1, 2, 9, 10, 11, 6, 7, 8};
    int hip_scale_reduction_indices[4] = {0, 3, 6, 9};
 };
 #endif
--- a/src/rl_sar/library/rl_sdk/rl_sdk.cpp
+++ b/src/rl_sar/library/rl_sdk/rl_sdk.cpp
@ -36,8 +36,6 @@ torch::Tensor RL::Forward()
 }
 */
 void RL::InitObservations()
 {
    this->obs.lin_vel = torch::tensor({{0.0, 0.0, 0.0}});
@ -68,8 +66,7 @@ torch::Tensor RL::ComputeTorques(torch::Tensor actions)
 {
    torch::Tensor actions_scaled = actions * this->params.action_scale;
    torch::Tensor output_torques = this->params.rl_kp * (actions_scaled + this->params.default_dof_pos - this->obs.dof_pos) - this->params.rl_kd * this->obs.dof_vel;
-    torch::Tensor clamped = torch::clamp(output_torques, -(this->params.torque_limits), this->params.torque_limits);
+    return output_torques;
    return clamped;
 }
 torch::Tensor RL::ComputePosition(torch::Tensor actions)
--- a/src/rl_sar/library/rl_sdk/rl_sdk.hpp
+++ b/src/rl_sar/library/rl_sdk/rl_sdk.hpp
@ -27,9 +27,9 @@ struct RobotState
 {
    struct IMU
    {
-        T quaternion[4] = {1.0, 0.0, 0.0, 0.0}; // w, x, y, z
+        std::vector<T> quaternion = {1.0, 0.0, 0.0, 0.0}; // w, x, y, z
-        T gyroscope[3] = {0.0, 0.0, 0.0};
+        std::vector<T> gyroscope = {0.0, 0.0, 0.0};
-        T accelerometer[3] = {0.0, 0.0, 0.0};
+        std::vector<T> accelerometer = {0.0, 0.0, 0.0};
    } imu;
    struct MotorState
--- a/src/rl_sar/models/a1/model_0526.pt
+++ b/src/rl_sar/models/a1/model_0526.pt
--- a/src/rl_sar/src/rl_real_a1.cpp
+++ b/src/rl_sar/src/rl_real_a1.cpp
@ -85,17 +85,14 @@ void RL_Real::GetState(RobotState<double> *state)
        keyboard.keyboard_state = STATE_POS_GETDOWN;
    }
-    for(int i = 0; i < 4; ++i)
+    state->imu.quaternion[3] = unitree_low_state.imu.quaternion[0]; // w
-    {
+    state->imu.quaternion[0] = unitree_low_state.imu.quaternion[1]; // x
-        state->imu.quaternion[i] = unitree_low_state.imu.quaternion[i];
+    state->imu.quaternion[1] = unitree_low_state.imu.quaternion[2]; // y
-    }
+    state->imu.quaternion[2] = unitree_low_state.imu.quaternion[3]; // z
    for(int i = 0; i < 3; ++i)
    {
        state->imu.gyroscope[i] = unitree_low_state.imu.gyroscope[i];
    }
    // state->imu.accelerometer
    for(int i = 0; i < params.num_of_dofs; ++i)
    {
        state->motor_state.q[i] = unitree_low_state.motorState[state_mapping[i]].q;
@ -116,8 +113,8 @@ void RL_Real::SetCommand(const RobotCommand<double> *command)
        unitree_low_command.motorCmd[i].tau = command->motor_command.tau[command_mapping[i]];
    }
-    unitree_safe.PowerProtect(unitree_low_command, unitree_low_state, 8);
+    unitree_safe.PowerProtect(unitree_low_command, unitree_low_state, 6);
-    // safe.PositionProtect(unitree_low_command, unitree_low_state);
+    // unitree_safe.PositionProtect(unitree_low_command, unitree_low_state);
    unitree_udp.SetSend(unitree_low_command);
 }
@ -134,34 +131,27 @@ void RL_Real::RunModel()
 {
    if(running_state == STATE_RL_RUNNING)
    {
-        this->obs.ang_vel = torch::tensor({{unitree_low_state.imu.gyroscope[0], unitree_low_state.imu.gyroscope[1], unitree_low_state.imu.gyroscope[2]}});
+        this->obs.ang_vel = torch::tensor(robot_state.imu.gyroscope).unsqueeze(0);
        this->obs.commands = torch::tensor({{unitree_joy.ly, -unitree_joy.rx, -unitree_joy.lx}});
-        this->obs.base_quat = torch::tensor({{unitree_low_state.imu.quaternion[1], unitree_low_state.imu.quaternion[2], unitree_low_state.imu.quaternion[3], unitree_low_state.imu.quaternion[0]}});
+        this->obs.base_quat = torch::tensor(robot_state.imu.quaternion).unsqueeze(0);
-        this->obs.dof_pos = torch::tensor({{unitree_low_state.motorState[3].q, unitree_low_state.motorState[4].q, unitree_low_state.motorState[5].q,
+        this->obs.dof_pos = torch::tensor(robot_state.motor_state.q).narrow(0, 0, params.num_of_dofs).unsqueeze(0);
-                                            unitree_low_state.motorState[0].q, unitree_low_state.motorState[1].q, unitree_low_state.motorState[2].q,
+        this->obs.dof_vel = torch::tensor(robot_state.motor_state.dq).narrow(0, 0, params.num_of_dofs).unsqueeze(0);
                                            unitree_low_state.motorState[9].q, unitree_low_state.motorState[10].q, unitree_low_state.motorState[11].q,
                                            unitree_low_state.motorState[6].q, unitree_low_state.motorState[7].q, unitree_low_state.motorState[8].q}});
        this->obs.dof_vel = torch::tensor({{unitree_low_state.motorState[3].dq, unitree_low_state.motorState[4].dq, unitree_low_state.motorState[5].dq,
                                            unitree_low_state.motorState[0].dq, unitree_low_state.motorState[1].dq, unitree_low_state.motorState[2].dq,
                                            unitree_low_state.motorState[9].dq, unitree_low_state.motorState[10].dq, unitree_low_state.motorState[11].dq,
                                            unitree_low_state.motorState[6].dq, unitree_low_state.motorState[7].dq, unitree_low_state.motorState[8].dq}});
        torch::Tensor clamped_actions = this->Forward();
-        for (int i : hip_scale_reduction_indices)
+        for (int i : this->params.hip_scale_reduction_indices)
        {
            clamped_actions[0][i] *= this->params.hip_scale_reduction;
        }
        this->obs.actions = clamped_actions;
-        output_torques = this->ComputeTorques(clamped_actions);
+        // torch::Tensor origin_output_torques = this->ComputeTorques(this->obs.actions);
-        output_dof_pos = this->ComputePosition(clamped_actions);
+        // output_torques = torch::clamp(origin_output_torques, -(this->params.torque_limits), this->params.torque_limits);
        output_dof_pos = this->ComputePosition(this->obs.actions);
 #ifdef CSV_LOGGER
-        torch::Tensor tau_est = torch::tensor({{unitree_low_state.motorState[3].tauEst, unitree_low_state.motorState[4].tauEst, unitree_low_state.motorState[5].tauEst,
+        torch::Tensor tau_est = torch::tensor(robot_state.motor_state.tauEst).unsqueeze(0);
                                                unitree_low_state.motorState[0].tauEst, unitree_low_state.motorState[1].tauEst, unitree_low_state.motorState[2].tauEst,
                                                unitree_low_state.motorState[9].tauEst, unitree_low_state.motorState[10].tauEst, unitree_low_state.motorState[11].tauEst,
                                                unitree_low_state.motorState[6].tauEst, unitree_low_state.motorState[7].tauEst, unitree_low_state.motorState[8].tauEst}});
        CSVLogger(output_torques, tau_est, this->obs.dof_pos, output_dof_pos, this->obs.dof_vel);
 #endif
    }
@ -177,22 +167,24 @@ torch::Tensor RL_Real::ComputeObservation()
                                    this->obs.dof_vel * this->params.dof_vel_scale,
                                    this->obs.actions
                                    },1);
-    obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs);
+    torch::Tensor clamped_obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs);
-    return obs;
+    return clamped_obs;
 }
 torch::Tensor RL_Real::Forward()
 {
-    torch::Tensor obs = this->ComputeObservation();
+    torch::autograd::GradMode::set_enabled(false);
-    history_obs_buf.insert(obs);
+    torch::Tensor clamped_obs = this->ComputeObservation();
    history_obs_buf.insert(clamped_obs);
    history_obs = history_obs_buf.get_obs_vec({0, 1, 2, 3, 4, 5});
-    torch::Tensor action = this->model.forward({history_obs}).toTensor();
+    torch::Tensor actions = this->model.forward({history_obs}).toTensor();
-    torch::Tensor clamped = torch::clamp(action, this->params.clip_actions_upper, this->params.clip_actions_lower);
+    torch::Tensor clamped_actions = torch::clamp(actions, this->params.clip_actions_lower, this->params.clip_actions_upper);
-    return clamped;
+    return clamped_actions;
 }
 void RL_Real::Plot()
--- a/src/rl_sar/src/rl_sim.cpp
+++ b/src/rl_sar/src/rl_sim.cpp
@ -95,10 +95,10 @@ RL_Sim::~RL_Sim()
 void RL_Sim::GetState(RobotState<double> *state)
 {
-    state->imu.quaternion[0] = pose.orientation.w;
+    state->imu.quaternion[3] = pose.orientation.w;
-    state->imu.quaternion[1] = pose.orientation.x;
+    state->imu.quaternion[0] = pose.orientation.x;
-    state->imu.quaternion[2] = pose.orientation.y;
+    state->imu.quaternion[1] = pose.orientation.y;
-    state->imu.quaternion[3] = pose.orientation.z;
+    state->imu.quaternion[2] = pose.orientation.z;
    state->imu.gyroscope[0] = vel.angular.x;
    state->imu.gyroscope[1] = vel.angular.y;
@ -133,8 +133,8 @@ void RL_Sim::SetCommand(const RobotCommand<double> *command)
 void RL_Sim::RobotControl()
 {
-    std::cout << "running_state " << keyboard.keyboard_state
+    std::cout << "running_state:" << keyboard.keyboard_state
-              << " x" << keyboard.x << " y" << keyboard.y << " yaw" << keyboard.yaw
+              << " x:" << keyboard.x << " y:" << keyboard.y << " yaw:" << keyboard.yaw
              << "      \r";
    motiontime++;
@ -182,12 +182,12 @@ void RL_Sim::RunModel()
    if(running_state == STATE_RL_RUNNING)
    {
        // this->obs.lin_vel = torch::tensor({{vel.linear.x, vel.linear.y, vel.linear.z}});
-        this->obs.ang_vel = torch::tensor({{vel.angular.x, vel.angular.y, vel.angular.z}});
+        this->obs.ang_vel = torch::tensor(robot_state.imu.gyroscope).unsqueeze(0);
        // this->obs.commands = torch::tensor({{cmd_vel.linear.x, cmd_vel.linear.y, cmd_vel.angular.z}});
        this->obs.commands = torch::tensor({{keyboard.x, keyboard.y, keyboard.yaw}});
-        this->obs.base_quat = torch::tensor({{pose.orientation.x, pose.orientation.y, pose.orientation.z, pose.orientation.w}});
+        this->obs.base_quat = torch::tensor(robot_state.imu.quaternion).unsqueeze(0);
-        this->obs.dof_pos = torch::tensor(mapped_joint_positions).unsqueeze(0);
+        this->obs.dof_pos = torch::tensor(robot_state.motor_state.q).narrow(0, 0, params.num_of_dofs).unsqueeze(0);
-        this->obs.dof_vel = torch::tensor(mapped_joint_velocities).unsqueeze(0);
+        this->obs.dof_vel = torch::tensor(robot_state.motor_state.dq).narrow(0, 0, params.num_of_dofs).unsqueeze(0);
        torch::Tensor clamped_actions = this->Forward();
@ -198,8 +198,9 @@ void RL_Sim::RunModel()
        this->obs.actions = clamped_actions;
-        // output_torques = this->ComputeTorques(clamped_actions);
+        // torch::Tensor origin_output_torques = this->ComputeTorques(this->obs.actions);
-        output_dof_pos = this->ComputePosition(clamped_actions);
+        // output_torques = torch::clamp(origin_output_torques, -(this->params.torque_limits), this->params.torque_limits);
        output_dof_pos = this->ComputePosition(this->obs.actions);
 #ifdef CSV_LOGGER
        torch::Tensor tau_est = torch::tensor(mapped_joint_efforts).unsqueeze(0);
@ -211,34 +212,35 @@ void RL_Sim::RunModel()
 torch::Tensor RL_Sim::ComputeObservation()
 {
    torch::Tensor obs = torch::cat({// this->obs.lin_vel * this->params.lin_vel_scale,
-                                    this->obs.ang_vel * this->params.ang_vel_scale,
+                                    this->QuatRotateInverse(this->obs.base_quat, this->obs.ang_vel) * this->params.ang_vel_scale,
                                    // this->obs.ang_vel * this->params.ang_vel_scale, // TODO
                                    this->QuatRotateInverse(this->obs.base_quat, this->obs.gravity_vec),
                                    this->obs.commands * this->params.commands_scale,
                                    (this->obs.dof_pos - this->params.default_dof_pos) * this->params.dof_pos_scale,
                                    this->obs.dof_vel * this->params.dof_vel_scale,
                                    this->obs.actions
                                    },1);
-    obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs);
+    torch::Tensor clamped_obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs);
-    return obs;
+    return clamped_obs;
 }
 torch::Tensor RL_Sim::Forward()
 {
    torch::autograd::GradMode::set_enabled(false);
-    torch::Tensor obs = this->ComputeObservation();
+    torch::Tensor clamped_obs = this->ComputeObservation();
    torch::Tensor actions;
    if(use_history)
    {
-        history_obs_buf.insert(obs);
+        history_obs_buf.insert(clamped_obs);
        history_obs = history_obs_buf.get_obs_vec({0, 1, 2, 3, 4, 5});
        actions = this->model.forward({history_obs}).toTensor();
    }
    else
    {
-        actions = this->model.forward({obs}).toTensor();
+        actions = this->model.forward({clamped_obs}).toTensor();
    }  
    torch::Tensor clamped_actions = torch::clamp(actions, this->params.clip_actions_lower, this->params.clip_actions_upper);