From 4868c7d065d904fbe9c4767f31c27905abf6dfbb Mon Sep 17 00:00:00 2001 From: fan-ziqi Date: Fri, 16 Aug 2024 11:44:00 +0800 Subject: [PATCH] feat: add obs list in config.yaml and move ComputeObservation to rl_sdk --- README.md | 14 ++--- README_CN.md | 14 ++--- src/rl_sar/include/rl_real_a1.hpp | 1 - src/rl_sar/include/rl_sim.hpp | 1 - src/rl_sar/library/rl_sdk/rl_sdk.cpp | 59 ++++++++++++++------ src/rl_sar/library/rl_sdk/rl_sdk.hpp | 3 +- src/rl_sar/models/a1_isaacgym/config.yaml | 1 + src/rl_sar/models/a1_isaacsim/config.yaml | 1 + src/rl_sar/models/gr1t1_isaacgym/config.yaml | 1 + src/rl_sar/models/gr1t1_isaacsim/config.yaml | 1 + src/rl_sar/models/gr1t2_isaacgym/config.yaml | 1 + src/rl_sar/models/gr1t2_isaacsim/config.yaml | 1 + src/rl_sar/scripts/rl_sdk.py | 24 ++++++++ src/rl_sar/scripts/rl_sim.py | 16 +----- src/rl_sar/src/rl_real_a1.cpp | 15 ----- src/rl_sar/src/rl_sim.cpp | 18 +----- 16 files changed, 85 insertions(+), 86 deletions(-) diff --git a/README.md b/README.md index 45c4da2..7c7bb97 100644 --- a/README.md +++ b/README.md @@ -57,14 +57,7 @@ sudo ldconfig ## Compilation -Customize the following two functions in your code to adapt to different models: - -```cpp -torch::Tensor forward() override; -torch::Tensor compute_observation() override; -``` - -Then compile in the root directory +Compile in the root directory of the project ```bash cd .. @@ -142,8 +135,9 @@ In the following text, `` represents the name of the robot 1. Create a model package named `_description` in the `rl_sar/src/robots` directory. Place the robot's URDF file in the `rl_sar/src/robots/_description/urdf` directory and name it `.urdf`. Additionally, create a joint configuration file with the namespace `_gazebo` in the `rl_sar/src/robots/_description/config` directory. 2. Place the trained RL model files in the `rl_sar/src/rl_sar/models/` directory. 3. In the `rl_sar/src/rl_sar/models/` directory, create a `config.yaml` file, and modify its parameters based on the `rl_sar/src/rl_sar/models/a1_isaacgym/config.yaml` file. -4. If you need to run simulations, modify the launch files as needed by referring to those in the `rl_sar/src/rl_sar/launch` directory. -5. If you need to run on the physical robot, modify the file `rl_sar/src/rl_sar/src/rl_real_a1.cpp` as needed. +4. Modify the `forward()` function in the code as needed to adapt to different models. +5. If you need to run simulations, modify the launch files as needed by referring to those in the `rl_sar/src/rl_sar/launch` directory. +6. If you need to run on the physical robot, modify the file `rl_sar/src/rl_sar/src/rl_real_a1.cpp` as needed. ## Reference diff --git a/README_CN.md b/README_CN.md index 4a7f1e6..5d92c70 100644 --- a/README_CN.md +++ b/README_CN.md @@ -57,14 +57,7 @@ sudo ldconfig ## 编译 -自定义代码中的以下两个函数,以适配不同的模型: - -```cpp -torch::Tensor forward() override; -torch::Tensor compute_observation() override; -``` - -然后到根目录编译 +在项目根目录编译 ```bash cd .. @@ -143,8 +136,9 @@ rosrun rl_sar rl_real_a1 1. 在`rl_sar/src/robots`路径下创建名为`_description`的模型包,将模型的urdf放到`rl_sar/src/robots/_description/urdf`路径下并命名为`.urdf`,并在`rl_sar/src/robots/_description/config`路径下创建命名空间为`_gazebo`的关节配置文件 2. 将训练好的RL模型文件放到`rl_sar/src/rl_sar/models/`路径下 3. 在`rl_sar/src/rl_sar/models/`中新建config.yaml文件,参考`rl_sar/src/rl_sar/models/a1_isaacgym/config.yaml`文件修改其中参数 -4. 若需要运行仿真,则参考`rl_sar/src/rl_sar/launch`路径下的launch文件自行修改 -5. 若需要运行实物,则参考`rl_sar/src/rl_sar/src/rl_real_a1.cpp`文件自行修改 +4. 按需修改代码中的`forward()`函数,以适配不同的模型 +5. 若需要运行仿真,则参考`rl_sar/src/rl_sar/launch`路径下的launch文件自行修改 +6. 若需要运行实物,则参考`rl_sar/src/rl_sar/src/rl_real_a1.cpp`文件自行修改 ## 参考 diff --git a/src/rl_sar/include/rl_real_a1.hpp b/src/rl_sar/include/rl_real_a1.hpp index c330b21..f60218e 100644 --- a/src/rl_sar/include/rl_real_a1.hpp +++ b/src/rl_sar/include/rl_real_a1.hpp @@ -19,7 +19,6 @@ class RL_Real : public RL private: // rl functions torch::Tensor Forward() override; - torch::Tensor ComputeObservation() override; void GetState(RobotState *state) override; void SetCommand(const RobotCommand *command) override; void RunModel(); diff --git a/src/rl_sar/include/rl_sim.hpp b/src/rl_sar/include/rl_sim.hpp index 2477b88..da0c6f3 100644 --- a/src/rl_sar/include/rl_sim.hpp +++ b/src/rl_sar/include/rl_sim.hpp @@ -24,7 +24,6 @@ class RL_Sim : public RL private: // rl functions torch::Tensor Forward() override; - torch::Tensor ComputeObservation() override; void GetState(RobotState *state) override; void SetCommand(const RobotCommand *command) override; void RunModel(); diff --git a/src/rl_sar/library/rl_sdk/rl_sdk.cpp b/src/rl_sar/library/rl_sdk/rl_sdk.cpp index 30ad610..78a9bd8 100644 --- a/src/rl_sar/library/rl_sdk/rl_sdk.cpp +++ b/src/rl_sar/library/rl_sdk/rl_sdk.cpp @@ -1,21 +1,5 @@ #include "rl_sdk.hpp" -/* You may need to override this ComputeObservation() function -torch::Tensor RL_XXX::ComputeObservation() -{ - torch::Tensor obs = torch::cat({ - this->QuatRotateInverse(this->obs.base_quat, this->obs.ang_vel, this->params.framework) * this->params.ang_vel_scale, - this->QuatRotateInverse(this->obs.base_quat, this->obs.gravity_vec, this->params.framework), - this->obs.commands * this->params.commands_scale, - (this->obs.dof_pos - this->params.default_dof_pos) * this->params.dof_pos_scale, - this->obs.dof_vel * this->params.dof_vel_scale, - this->obs.actions - },1); - torch::Tensor clamped_obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs); - return clamped_obs; -} -*/ - /* You may need to override this Forward() function torch::Tensor RL_XXX::Forward() { @@ -27,6 +11,48 @@ torch::Tensor RL_XXX::Forward() } */ +torch::Tensor RL::ComputeObservation() +{ + std::vector obs_list; + + for(const std::string& observation : this->params.observations) + { + if(observation == "lin_vel") + { + obs_list.push_back(this->obs.lin_vel * this->params.lin_vel_scale); + } + else if(observation == "ang_vel") + { + // obs_list.push_back(this->obs.ang_vel * this->params.ang_vel_scale); // TODO is QuatRotateInverse necessery? + obs_list.push_back(this->QuatRotateInverse(this->obs.base_quat, this->obs.ang_vel, this->params.framework) * this->params.ang_vel_scale); + } + else if(observation == "gravity_vec") + { + obs_list.push_back(this->QuatRotateInverse(this->obs.base_quat, this->obs.gravity_vec, this->params.framework)); + } + else if(observation == "commands") + { + obs_list.push_back(this->obs.commands * this->params.commands_scale); + } + else if(observation == "dof_pos") + { + obs_list.push_back((this->obs.dof_pos - this->params.default_dof_pos) * this->params.dof_pos_scale); + } + else if(observation == "dof_vel") + { + obs_list.push_back(this->obs.dof_vel * this->params.dof_vel_scale); + } + else if(observation == "actions") + { + obs_list.push_back(this->obs.actions); + } + } + + torch::Tensor obs = torch::cat(obs_list, 1); + torch::Tensor clamped_obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs); + return clamped_obs; +} + void RL::InitObservations() { this->obs.lin_vel = torch::tensor({{0.0, 0.0, 0.0}}); @@ -369,6 +395,7 @@ void RL::ReadYaml(std::string robot_name) this->params.dt = config["dt"].as(); this->params.decimation = config["decimation"].as(); this->params.num_observations = config["num_observations"].as(); + this->params.observations = ReadVectorFromYaml(config["observations"]); this->params.clip_obs = config["clip_obs"].as(); this->params.clip_actions_upper = torch::tensor(ReadVectorFromYaml(config["clip_actions_upper"], this->params.framework, rows, cols)).view({1, -1}); this->params.clip_actions_lower = torch::tensor(ReadVectorFromYaml(config["clip_actions_lower"], this->params.framework, rows, cols)).view({1, -1}); diff --git a/src/rl_sar/library/rl_sdk/rl_sdk.hpp b/src/rl_sar/library/rl_sdk/rl_sdk.hpp index e861eb2..703770b 100644 --- a/src/rl_sar/library/rl_sdk/rl_sdk.hpp +++ b/src/rl_sar/library/rl_sdk/rl_sdk.hpp @@ -74,6 +74,7 @@ struct ModelParams double dt; int decimation; int num_observations; + std::vector observations; double damping; double stiffness; double action_scale; @@ -128,7 +129,7 @@ class RL // rl functions virtual torch::Tensor Forward() = 0; - virtual torch::Tensor ComputeObservation() = 0; + torch::Tensor ComputeObservation(); virtual void GetState(RobotState *state) = 0; virtual void SetCommand(const RobotCommand *command) = 0; void StateController(const RobotState *state, RobotCommand *command); diff --git a/src/rl_sar/models/a1_isaacgym/config.yaml b/src/rl_sar/models/a1_isaacgym/config.yaml index 0f11b42..1462540 100644 --- a/src/rl_sar/models/a1_isaacgym/config.yaml +++ b/src/rl_sar/models/a1_isaacgym/config.yaml @@ -7,6 +7,7 @@ a1_isaacgym: dt: 0.005 decimation: 4 num_observations: 45 + observations: ["ang_vel", "gravity_vec", "commands", "dof_pos", "dof_vel", "actions"] clip_obs: 100.0 clip_actions_lower: [-100, -100, -100, -100, -100, -100, diff --git a/src/rl_sar/models/a1_isaacsim/config.yaml b/src/rl_sar/models/a1_isaacsim/config.yaml index 2c5f3d8..845bbdd 100644 --- a/src/rl_sar/models/a1_isaacsim/config.yaml +++ b/src/rl_sar/models/a1_isaacsim/config.yaml @@ -7,6 +7,7 @@ a1_isaacsim: dt: 0.005 decimation: 4 num_observations: 45 + observations: ["ang_vel", "gravity_vec", "commands", "dof_pos", "dof_vel", "actions"] clip_obs: 100.0 clip_actions_lower: [-100, -100, -100, -100, -100, -100, diff --git a/src/rl_sar/models/gr1t1_isaacgym/config.yaml b/src/rl_sar/models/gr1t1_isaacgym/config.yaml index 7062f4d..c6a7a65 100644 --- a/src/rl_sar/models/gr1t1_isaacgym/config.yaml +++ b/src/rl_sar/models/gr1t1_isaacgym/config.yaml @@ -7,6 +7,7 @@ gr1t1_isaacgym: dt: 0.001 decimation: 20 num_observations: 39 + observations: ["ang_vel", "gravity_vec", "commands", "dof_pos", "dof_vel", "actions"] clip_obs: 100.0 clip_actions_lower: [-0.4391, -1.0491, -2.0991, -0.4391, -1.3991, -1.1391, -1.0491, -2.0991, -0.4391, -1.3991] diff --git a/src/rl_sar/models/gr1t1_isaacsim/config.yaml b/src/rl_sar/models/gr1t1_isaacsim/config.yaml index 8dc3319..f8b54a5 100644 --- a/src/rl_sar/models/gr1t1_isaacsim/config.yaml +++ b/src/rl_sar/models/gr1t1_isaacsim/config.yaml @@ -7,6 +7,7 @@ gr1t1_isaacsim: dt: 0.001 decimation: 20 num_observations: 39 + observations: ["ang_vel", "gravity_vec", "commands", "dof_pos", "dof_vel", "actions"] clip_obs: 100.0 clip_actions_lower: [-0.4391, -1.0491, -2.0991, -0.4391, -1.3991, -1.1391, -1.0491, -2.0991, -0.4391, -1.3991] diff --git a/src/rl_sar/models/gr1t2_isaacgym/config.yaml b/src/rl_sar/models/gr1t2_isaacgym/config.yaml index 87bbd25..9b25700 100644 --- a/src/rl_sar/models/gr1t2_isaacgym/config.yaml +++ b/src/rl_sar/models/gr1t2_isaacgym/config.yaml @@ -7,6 +7,7 @@ gr1t2_isaacgym: dt: 0.001 decimation: 20 num_observations: 39 + observations: ["ang_vel", "gravity_vec", "commands", "dof_pos", "dof_vel", "actions"] clip_obs: 100.0 clip_actions_lower: [-0.4391, -1.0491, -2.0991, -0.4391, -1.3991, -1.1391, -1.0491, -2.0991, -0.4391, -1.3991] diff --git a/src/rl_sar/models/gr1t2_isaacsim/config.yaml b/src/rl_sar/models/gr1t2_isaacsim/config.yaml index d09a118..c8abfab 100644 --- a/src/rl_sar/models/gr1t2_isaacsim/config.yaml +++ b/src/rl_sar/models/gr1t2_isaacsim/config.yaml @@ -7,6 +7,7 @@ gr1t2_isaacsim: dt: 0.001 decimation: 20 num_observations: 39 + observations: ["ang_vel", "gravity_vec", "commands", "dof_pos", "dof_vel", "actions"] clip_obs: 100.0 clip_actions_lower: [-0.4391, -1.0491, -2.0991, -0.4391, -1.3991, -1.1391, -1.0491, -2.0991, -0.4391, -1.3991] diff --git a/src/rl_sar/scripts/rl_sdk.py b/src/rl_sar/scripts/rl_sdk.py index 5cdbc4b..69556b5 100644 --- a/src/rl_sar/scripts/rl_sdk.py +++ b/src/rl_sar/scripts/rl_sdk.py @@ -68,6 +68,7 @@ def __init__(self): self.dt = None self.decimation = None self.num_observations = None + self.observations = None self.damping = None self.stiffness = None self.action_scale = None @@ -134,6 +135,28 @@ def __init__(self): self.output_torques = torch.zeros(1, 32) self.output_dof_pos = torch.zeros(1, 32) + def ComputeObservation(self): + obs_list = [] + for observation in self.params.observations: + if observation == "lin_vel": + obs_list.append(self.obs.lin_vel * self.params.lin_vel_scale) + elif observation == "ang_vel": + # obs_list.append(self.obs.ang_vel * self.params.ang_vel_scale) # TODO is QuatRotateInverse necessery? + obs_list.append(self.QuatRotateInverse(self.obs.base_quat, self.obs.ang_vel, self.params.framework) * self.params.ang_vel_scale) + elif observation == "gravity_vec": + obs_list.append(self.QuatRotateInverse(self.obs.base_quat, self.obs.gravity_vec, self.params.framework)) + elif observation == "commands": + obs_list.append(self.obs.commands * self.params.commands_scale) + elif observation == "dof_pos": + obs_list.append((self.obs.dof_pos - self.params.default_dof_pos) * self.params.dof_pos_scale) + elif observation == "dof_vel": + obs_list.append(self.obs.dof_vel * self.params.dof_vel_scale) + elif observation == "actions": + obs_list.append(self.obs.actions) + obs = torch.cat(obs_list, dim=-1) + clamped_obs = torch.clamp(obs, -self.params.clip_obs, self.params.clip_obs) + return clamped_obs + def InitObservations(self): self.obs.lin_vel = torch.zeros(1, 3, dtype=torch.float) self.obs.ang_vel = torch.zeros(1, 3, dtype=torch.float) @@ -359,6 +382,7 @@ def ReadYaml(self, robot_name): self.params.dt = config["dt"] self.params.decimation = config["decimation"] self.params.num_observations = config["num_observations"] + self.params.observations = config["observations"] self.params.clip_obs = config["clip_obs"] self.params.action_scale = config["action_scale"] self.params.hip_scale_reduction = config["hip_scale_reduction"] diff --git a/src/rl_sar/scripts/rl_sim.py b/src/rl_sar/scripts/rl_sim.py index b7fd821..f9fde79 100644 --- a/src/rl_sar/scripts/rl_sim.py +++ b/src/rl_sar/scripts/rl_sim.py @@ -173,7 +173,7 @@ def JointStatesCallback(self, msg): def RunModel(self): if self.running_state == STATE.STATE_RL_RUNNING and self.simulation_running: - # self.obs.lin_vel = torch.tensor([[self.vel.linear.x, self.vel.linear.y, self.vel.linear.z]]) + self.obs.lin_vel = torch.tensor([[self.vel.linear.x, self.vel.linear.y, self.vel.linear.z]]) self.obs.ang_vel = torch.tensor(self.robot_state.imu.gyroscope).unsqueeze(0) # self.obs.commands = torch.tensor([[self.cmd_vel.linear.x, self.cmd_vel.linear.y, self.cmd_vel.angular.z]]) self.obs.commands = torch.tensor([[self.control.x, self.control.y, self.control.yaw]]) @@ -199,20 +199,6 @@ def RunModel(self): tau_est = torch.tensor(self.mapped_joint_efforts).unsqueeze(0) self.CSVLogger(self.output_torques, tau_est, self.obs.dof_pos, self.output_dof_pos, self.obs.dof_vel) - def ComputeObservation(self): - obs = torch.cat([ - # self.obs.lin_vel * self.params.lin_vel_scale, - # self.obs.ang_vel * self.params.ang_vel_scale, # TODO is QuatRotateInverse necessery? - self.QuatRotateInverse(self.obs.base_quat, self.obs.ang_vel, self.params.framework) * self.params.ang_vel_scale, - self.QuatRotateInverse(self.obs.base_quat, self.obs.gravity_vec, self.params.framework), - self.obs.commands * self.params.commands_scale, - (self.obs.dof_pos - self.params.default_dof_pos) * self.params.dof_pos_scale, - self.obs.dof_vel * self.params.dof_vel_scale, - self.obs.actions - ], dim = -1) - clamped_obs = torch.clamp(obs, -self.params.clip_obs, self.params.clip_obs) - return clamped_obs - def Forward(self): torch.set_grad_enabled(False) clamped_obs = self.ComputeObservation() diff --git a/src/rl_sar/src/rl_real_a1.cpp b/src/rl_sar/src/rl_real_a1.cpp index 479ef4e..4a9f98f 100644 --- a/src/rl_sar/src/rl_real_a1.cpp +++ b/src/rl_sar/src/rl_real_a1.cpp @@ -170,21 +170,6 @@ void RL_Real::RunModel() } } -torch::Tensor RL_Real::ComputeObservation() -{ - torch::Tensor obs = torch::cat({ - // this->QuatRotateInverse(this->obs.base_quat, this->obs.lin_vel) * this->params.lin_vel_scale, - this->QuatRotateInverse(this->obs.base_quat, this->obs.ang_vel, this->params.framework) * this->params.ang_vel_scale, - this->QuatRotateInverse(this->obs.base_quat, this->obs.gravity_vec, this->params.framework), - this->obs.commands * this->params.commands_scale, - (this->obs.dof_pos - this->params.default_dof_pos) * this->params.dof_pos_scale, - this->obs.dof_vel * this->params.dof_vel_scale, - this->obs.actions - },1); - torch::Tensor clamped_obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs); - return clamped_obs; -} - torch::Tensor RL_Real::Forward() { torch::autograd::GradMode::set_enabled(false); diff --git a/src/rl_sar/src/rl_sim.cpp b/src/rl_sar/src/rl_sim.cpp index 2bfee62..fd3ea09 100644 --- a/src/rl_sar/src/rl_sim.cpp +++ b/src/rl_sar/src/rl_sim.cpp @@ -212,7 +212,7 @@ void RL_Sim::RunModel() { if(this->running_state == STATE_RL_RUNNING && simulation_running) { - // this->obs.lin_vel = torch::tensor({{this->vel.linear.x, this->vel.linear.y, this->vel.linear.z}}); + this->obs.lin_vel = torch::tensor({{this->vel.linear.x, this->vel.linear.y, this->vel.linear.z}}); this->obs.ang_vel = torch::tensor(this->robot_state.imu.gyroscope).unsqueeze(0); // this->obs.commands = torch::tensor({{this->cmd_vel.linear.x, this->cmd_vel.linear.y, this->cmd_vel.angular.z}}); this->obs.commands = torch::tensor({{this->control.x, this->control.y, this->control.yaw}}); @@ -243,22 +243,6 @@ void RL_Sim::RunModel() } } -torch::Tensor RL_Sim::ComputeObservation() -{ - torch::Tensor obs = torch::cat({ - // this->obs.lin_vel * this->params.lin_vel_scale, - // this->obs.ang_vel * this->params.ang_vel_scale, // TODO is QuatRotateInverse necessery? - this->QuatRotateInverse(this->obs.base_quat, this->obs.ang_vel, this->params.framework) * this->params.ang_vel_scale, - this->QuatRotateInverse(this->obs.base_quat, this->obs.gravity_vec, this->params.framework), - this->obs.commands * this->params.commands_scale, - (this->obs.dof_pos - this->params.default_dof_pos) * this->params.dof_pos_scale, - this->obs.dof_vel * this->params.dof_vel_scale, - this->obs.actions - },1); - torch::Tensor clamped_obs = torch::clamp(obs, -this->params.clip_obs, this->params.clip_obs); - return clamped_obs; -} - torch::Tensor RL_Sim::Forward() { torch::autograd::GradMode::set_enabled(false);