Skip to content

Commit ecc4943

Browse files
committed
important update
1 parent 1038a70 commit ecc4943

File tree

150 files changed

+28870
-1231
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

150 files changed

+28870
-1231
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -131,7 +131,7 @@ python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-Kinova-Play-v0--num_e
131131
python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-Franka-Play-v0 --num_envs 16
132132
```
133133
```bash
134-
python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-Franka-Play-v0 --num_envs 16
134+
python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-UR10-Play-v0 --num_envs 16
135135
```
136136
5.2 Dextrous Hand
137137
```bash

isaacLab/manipulation/tasks/Dextrous_hand/inhand/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause

isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause

isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/__init__.py

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,11 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause
55

66
import gymnasium as gym
77

8-
from . import agents, allegro_env_cfg
8+
from . import agents
99

1010
##
1111
# Register Gym environments.
@@ -20,8 +20,8 @@
2020
entry_point="isaaclab.envs:ManagerBasedRLEnv",
2121
disable_env_checker=True,
2222
kwargs={
23-
"env_cfg_entry_point": allegro_env_cfg.AllegroCubeEnvCfg,
24-
"rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubePPORunnerCfg,
23+
"env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeEnvCfg",
24+
"rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubePPORunnerCfg",
2525
"rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
2626
"skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
2727
},
@@ -32,8 +32,8 @@
3232
entry_point="isaaclab.envs:ManagerBasedRLEnv",
3333
disable_env_checker=True,
3434
kwargs={
35-
"env_cfg_entry_point": allegro_env_cfg.AllegroCubeEnvCfg_PLAY,
36-
"rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubePPORunnerCfg,
35+
"env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeEnvCfg_PLAY",
36+
"rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubePPORunnerCfg",
3737
"rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
3838
"skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
3939
},
@@ -48,8 +48,8 @@
4848
entry_point="isaaclab.envs:ManagerBasedRLEnv",
4949
disable_env_checker=True,
5050
kwargs={
51-
"env_cfg_entry_point": allegro_env_cfg.AllegroCubeNoVelObsEnvCfg,
52-
"rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubeNoVelObsPPORunnerCfg,
51+
"env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeNoVelObsEnvCfg",
52+
"rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubeNoVelObsPPORunnerCfg",
5353
"rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
5454
"skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
5555
},
@@ -60,8 +60,8 @@
6060
entry_point="isaaclab.envs:ManagerBasedRLEnv",
6161
disable_env_checker=True,
6262
kwargs={
63-
"env_cfg_entry_point": allegro_env_cfg.AllegroCubeNoVelObsEnvCfg_PLAY,
64-
"rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubeNoVelObsPPORunnerCfg,
63+
"env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeNoVelObsEnvCfg_PLAY",
64+
"rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubeNoVelObsPPORunnerCfg",
6565
"rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
6666
"skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
6767
},
Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,4 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause
5-
6-
from . import rsl_rl_cfg # noqa: F401, F403

isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/rsl_rl_cfg.py renamed to isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/rsl_rl_ppo_cfg.py

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,11 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause
55

66
from isaaclab.utils import configclass
77

8-
from isaaclab_rl.rsl_rl import (
9-
RslRlOnPolicyRunnerCfg,
10-
RslRlPpoActorCriticCfg,
11-
RslRlPpoAlgorithmCfg,
12-
)
8+
from isaaclab_rl.rsl_rl import RslRlOnPolicyRunnerCfg, RslRlPpoActorCriticCfg, RslRlPpoAlgorithmCfg
139

1410

1511
@configclass
Lines changed: 38 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -1,46 +1,57 @@
11
seed: 42
22

3+
34
# Models are instantiated using skrl's model instantiator utility
45
# https://skrl.readthedocs.io/en/latest/api/utils/model_instantiators.html
56
models:
67
separate: False
7-
policy: # see skrl.utils.model_instantiators.torch.gaussian_model for parameter details
8+
policy: # see gaussian_model parameters
9+
class: GaussianMixin
810
clip_actions: False
911
clip_log_std: True
10-
initial_log_std: 0
1112
min_log_std: -20.0
1213
max_log_std: 2.0
13-
input_shape: "Shape.STATES"
14-
hiddens: [512, 256, 128]
15-
hidden_activation: ["elu", "elu"]
16-
output_shape: "Shape.ACTIONS"
17-
output_activation: ""
18-
output_scale: 1.0
19-
value: # see skrl.utils.model_instantiators.torch.deterministic_model for parameter details
14+
initial_log_std: 0.0
15+
network:
16+
- name: net
17+
input: STATES
18+
layers: [512, 256, 128]
19+
activations: elu
20+
output: ACTIONS
21+
value: # see deterministic_model parameters
22+
class: DeterministicMixin
2023
clip_actions: False
21-
input_shape: "Shape.STATES"
22-
hiddens: [512, 256, 128]
23-
hidden_activation: ["elu", "elu"]
24-
output_shape: "Shape.ONE"
25-
output_activation: ""
26-
output_scale: 1.0
24+
network:
25+
- name: net
26+
input: STATES
27+
layers: [512, 256, 128]
28+
activations: elu
29+
output: ONE
30+
31+
32+
# Rollout memory
33+
# https://skrl.readthedocs.io/en/latest/api/memories/random.html
34+
memory:
35+
class: RandomMemory
36+
memory_size: -1 # automatically determined (same as agent:rollouts)
2737

2838

2939
# PPO agent configuration (field names are from PPO_DEFAULT_CONFIG)
3040
# https://skrl.readthedocs.io/en/latest/api/agents/ppo.html
3141
agent:
42+
class: PPO
3243
rollouts: 24
3344
learning_epochs: 5
34-
mini_batches: 4
45+
mini_batches: 12
3546
discount_factor: 0.998
3647
lambda: 0.95
37-
learning_rate: 1.e-3
38-
learning_rate_scheduler: "KLAdaptiveLR"
48+
learning_rate: 5.0e-04
49+
learning_rate_scheduler: KLAdaptiveLR
3950
learning_rate_scheduler_kwargs:
40-
kl_threshold: 0.01
41-
state_preprocessor: "RunningStandardScaler"
51+
kl_threshold: 0.016
52+
state_preprocessor: RunningStandardScaler
4253
state_preprocessor_kwargs: null
43-
value_preprocessor: "RunningStandardScaler"
54+
value_preprocessor: RunningStandardScaler
4455
value_preprocessor_kwargs: null
4556
random_timesteps: 0
4657
learning_starts: 0
@@ -50,18 +61,20 @@ agent:
5061
clip_predicted_values: True
5162
entropy_loss_scale: 0.002
5263
value_loss_scale: 2.0
53-
kl_threshold: 0
64+
kl_threshold: 0.0
5465
rewards_shaper_scale: 0.1
66+
time_limit_bootstrap: False
5567
# logging and checkpoint
5668
experiment:
5769
directory: "allegro_cube"
5870
experiment_name: ""
59-
write_interval: 600
60-
checkpoint_interval: 6000
71+
write_interval: auto
72+
checkpoint_interval: auto
6173

6274

6375
# Sequential trainer
6476
# https://skrl.readthedocs.io/en/latest/api/trainers/sequential.html
6577
trainer:
78+
class: SequentialTrainer
6679
timesteps: 120000
67-
environment_info: "log"
80+
environment_info: log

isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/allegro_env_cfg.py

Lines changed: 2 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,14 +1,11 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause
55

66
from isaaclab.utils import configclass
77

8-
#import isaacLab.manipulation.tasks.Robot_arm.reach.mdp as mdp
9-
import isaacLab.manipulation.tasks.Dextrous_hand.inhand.mdp as mdp
10-
import isaacLab.manipulation.tasks.Dextrous_hand.inhand.inhand_env_cfg as inhand_env_cfg
11-
#import isaaclab_tasks.manager_based.manipulation.inhand.inhand_env_cfg as inhand_env_cfg
8+
import isaaclab_tasks.manager_based.manipulation.inhand.inhand_env_cfg as inhand_env_cfg
129

1310
##
1411
# Pre-defined configs

isaacLab/manipulation/tasks/Dextrous_hand/inhand/inhand_env_cfg.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause
@@ -23,7 +23,7 @@
2323
from isaaclab.utils.assets import ISAAC_NUCLEUS_DIR
2424
from isaaclab.utils.noise import AdditiveGaussianNoiseCfg as Gnoise
2525

26-
import isaacLab.manipulation.tasks.Dextrous_hand.inhand.mdp as mdp
26+
import isaaclab_tasks.manager_based.manipulation.inhand.mdp as mdp
2727

2828
##
2929
# Scene definition
@@ -341,5 +341,6 @@ def __post_init__(self):
341341
self.episode_length_s = 20.0
342342
# simulation settings
343343
self.sim.dt = 1.0 / 120.0
344+
self.sim.render_interval = self.decimation
344345
# change viewer settings
345346
self.viewer.eye = (2.0, 2.0, 2.0)

isaacLab/manipulation/tasks/Dextrous_hand/inhand/mdp/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
1+
# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
22
# All rights reserved.
33
#
44
# SPDX-License-Identifier: BSD-3-Clause

0 commit comments

Comments
 (0)