NathanWu7
diff --git a/‎README.md‎
Lines changed: 1 addition & 1 deletion b/‎README.md‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/__init__.py‎
Lines changed: 1 addition & 1 deletion b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/__init__.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/__init__.py‎
Lines changed: 1 addition & 1 deletion b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/__init__.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/__init__.py‎
Lines changed: 10 additions & 10 deletions b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/__init__.py‎
Lines changed: 10 additions & 10 deletions
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/__init__.py‎
Lines changed: 1 addition & 3 deletions b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/__init__.py‎
Lines changed: 1 addition & 3 deletions
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/rsl_rl_cfg.py‎ renamed to ‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/rsl_rl_ppo_cfg.py‎
Lines changed: 2 additions & 6 deletions b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/rsl_rl_cfg.py‎ renamed to ‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/rsl_rl_ppo_cfg.py‎
Lines changed: 2 additions & 6 deletions
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/skrl_ppo_cfg.yaml‎
Lines changed: 38 additions & 25 deletions b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/agents/skrl_ppo_cfg.yaml‎
Lines changed: 38 additions & 25 deletions
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/allegro_env_cfg.py‎
Lines changed: 2 additions & 5 deletions b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/config/allegro_hand/allegro_env_cfg.py‎
Lines changed: 2 additions & 5 deletions
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/inhand_env_cfg.py‎
Lines changed: 3 additions & 2 deletions b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/inhand_env_cfg.py‎
Lines changed: 3 additions & 2 deletions
diff --git a/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/mdp/__init__.py‎
Lines changed: 1 addition & 1 deletion b/‎isaacLab/manipulation/tasks/Dextrous_hand/inhand/mdp/__init__.py‎
Lines changed: 1 addition & 1 deletion
@@ -131,7 +131,7 @@ python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-Kinova-Play-v0--num_e
 python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-Franka-Play-v0 --num_envs 16
 ```
 ```bash
-python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-Franka-Play-v0 --num_envs 16
+python3 scripts/rsl_rl/play.py --task Template-Isaac-Reach-UR10-Play-v0 --num_envs 16
 ```
 5.2 Dextrous Hand
 ```bash
 
@@ -1,4 +1,4 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
@@ -1,4 +1,4 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
@@ -1,11 +1,11 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
 import gymnasium as gym
 
-from . import agents, allegro_env_cfg
+from . import agents
 
 ##
 # Register Gym environments.
@@ -20,8 +20,8 @@
     entry_point="isaaclab.envs:ManagerBasedRLEnv",
     disable_env_checker=True,
     kwargs={
-        "env_cfg_entry_point": allegro_env_cfg.AllegroCubeEnvCfg,
-        "rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubePPORunnerCfg,
+        "env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeEnvCfg",
+        "rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubePPORunnerCfg",
         "rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
         "skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
     },
@@ -32,8 +32,8 @@
     entry_point="isaaclab.envs:ManagerBasedRLEnv",
     disable_env_checker=True,
     kwargs={
-        "env_cfg_entry_point": allegro_env_cfg.AllegroCubeEnvCfg_PLAY,
-        "rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubePPORunnerCfg,
+        "env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeEnvCfg_PLAY",
+        "rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubePPORunnerCfg",
         "rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
         "skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
     },
@@ -48,8 +48,8 @@
     entry_point="isaaclab.envs:ManagerBasedRLEnv",
     disable_env_checker=True,
     kwargs={
-        "env_cfg_entry_point": allegro_env_cfg.AllegroCubeNoVelObsEnvCfg,
-        "rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubeNoVelObsPPORunnerCfg,
+        "env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeNoVelObsEnvCfg",
+        "rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubeNoVelObsPPORunnerCfg",
         "rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
         "skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
     },
@@ -60,8 +60,8 @@
     entry_point="isaaclab.envs:ManagerBasedRLEnv",
     disable_env_checker=True,
     kwargs={
-        "env_cfg_entry_point": allegro_env_cfg.AllegroCubeNoVelObsEnvCfg_PLAY,
-        "rsl_rl_cfg_entry_point": agents.rsl_rl_cfg.AllegroCubeNoVelObsPPORunnerCfg,
+        "env_cfg_entry_point": f"{__name__}.allegro_env_cfg:AllegroCubeNoVelObsEnvCfg_PLAY",
+        "rsl_rl_cfg_entry_point": f"{agents.__name__}.rsl_rl_ppo_cfg:AllegroCubeNoVelObsPPORunnerCfg",
         "rl_games_cfg_entry_point": f"{agents.__name__}:rl_games_ppo_cfg.yaml",
         "skrl_cfg_entry_point": f"{agents.__name__}:skrl_ppo_cfg.yaml",
     },
 
@@ -1,6 +1,4 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
-
-from . import rsl_rl_cfg  # noqa: F401, F403
@@ -1,15 +1,11 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
 from isaaclab.utils import configclass
 
-from isaaclab_rl.rsl_rl import (
-    RslRlOnPolicyRunnerCfg,
-    RslRlPpoActorCriticCfg,
-    RslRlPpoAlgorithmCfg,
-)
+from isaaclab_rl.rsl_rl import RslRlOnPolicyRunnerCfg, RslRlPpoActorCriticCfg, RslRlPpoAlgorithmCfg
 
 
 @configclass
 
@@ -1,46 +1,57 @@
 seed: 42
 
+
 # Models are instantiated using skrl's model instantiator utility
 # https://skrl.readthedocs.io/en/latest/api/utils/model_instantiators.html
 models:
   separate: False
-  policy:  # see skrl.utils.model_instantiators.torch.gaussian_model for parameter details
+  policy:  # see gaussian_model parameters
+    class: GaussianMixin
     clip_actions: False
     clip_log_std: True
-    initial_log_std: 0
     min_log_std: -20.0
     max_log_std: 2.0
-    input_shape: "Shape.STATES"
-    hiddens: [512, 256, 128]
-    hidden_activation: ["elu", "elu"]
-    output_shape: "Shape.ACTIONS"
-    output_activation: ""
-    output_scale: 1.0
-  value:  # see skrl.utils.model_instantiators.torch.deterministic_model for parameter details
+    initial_log_std: 0.0
+    network:
+      - name: net
+        input: STATES
+        layers: [512, 256, 128]
+        activations: elu
+    output: ACTIONS
+  value:  # see deterministic_model parameters
+    class: DeterministicMixin
     clip_actions: False
-    input_shape: "Shape.STATES"
-    hiddens: [512, 256, 128]
-    hidden_activation: ["elu", "elu"]
-    output_shape: "Shape.ONE"
-    output_activation: ""
-    output_scale: 1.0
+    network:
+      - name: net
+        input: STATES
+        layers: [512, 256, 128]
+        activations: elu
+    output: ONE
+
+
+# Rollout memory
+# https://skrl.readthedocs.io/en/latest/api/memories/random.html
+memory:
+  class: RandomMemory
+  memory_size: -1  # automatically determined (same as agent:rollouts)
 
 
 # PPO agent configuration (field names are from PPO_DEFAULT_CONFIG)
 # https://skrl.readthedocs.io/en/latest/api/agents/ppo.html
 agent:
+  class: PPO
   rollouts: 24
   learning_epochs: 5
-  mini_batches: 4
+  mini_batches: 12
   discount_factor: 0.998
   lambda: 0.95
-  learning_rate: 1.e-3
-  learning_rate_scheduler: "KLAdaptiveLR"
+  learning_rate: 5.0e-04
+  learning_rate_scheduler: KLAdaptiveLR
   learning_rate_scheduler_kwargs:
-    kl_threshold: 0.01
-  state_preprocessor: "RunningStandardScaler"
+    kl_threshold: 0.016
+  state_preprocessor: RunningStandardScaler
   state_preprocessor_kwargs: null
-  value_preprocessor: "RunningStandardScaler"
+  value_preprocessor: RunningStandardScaler
   value_preprocessor_kwargs: null
   random_timesteps: 0
   learning_starts: 0
@@ -50,18 +61,20 @@ agent:
   clip_predicted_values: True
   entropy_loss_scale: 0.002
   value_loss_scale: 2.0
-  kl_threshold: 0
+  kl_threshold: 0.0
   rewards_shaper_scale: 0.1
+  time_limit_bootstrap: False
   # logging and checkpoint
   experiment:
     directory: "allegro_cube"
     experiment_name: ""
-    write_interval: 600
-    checkpoint_interval: 6000
+    write_interval: auto
+    checkpoint_interval: auto
 
 
 # Sequential trainer
 # https://skrl.readthedocs.io/en/latest/api/trainers/sequential.html
 trainer:
+  class: SequentialTrainer
   timesteps: 120000
-  environment_info: "log"
+  environment_info: log
@@ -1,14 +1,11 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
 
 from isaaclab.utils import configclass
 
-#import isaacLab.manipulation.tasks.Robot_arm.reach.mdp as mdp
-import isaacLab.manipulation.tasks.Dextrous_hand.inhand.mdp as mdp
-import isaacLab.manipulation.tasks.Dextrous_hand.inhand.inhand_env_cfg as inhand_env_cfg
-#import isaaclab_tasks.manager_based.manipulation.inhand.inhand_env_cfg as inhand_env_cfg
+import isaaclab_tasks.manager_based.manipulation.inhand.inhand_env_cfg as inhand_env_cfg
 
 ##
 # Pre-defined configs
 
@@ -1,4 +1,4 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
@@ -23,7 +23,7 @@
 from isaaclab.utils.assets import ISAAC_NUCLEUS_DIR
 from isaaclab.utils.noise import AdditiveGaussianNoiseCfg as Gnoise
 
-import isaacLab.manipulation.tasks.Dextrous_hand.inhand.mdp as mdp
+import isaaclab_tasks.manager_based.manipulation.inhand.mdp as mdp
 
 ##
 # Scene definition
@@ -341,5 +341,6 @@ def __post_init__(self):
         self.episode_length_s = 20.0
         # simulation settings
         self.sim.dt = 1.0 / 120.0
+        self.sim.render_interval = self.decimation
         # change viewer settings
         self.viewer.eye = (2.0, 2.0, 2.0)
@@ -1,4 +1,4 @@
-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.
+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.
 # All rights reserved.
 #
 # SPDX-License-Identifier: BSD-3-Clause
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,4 @@`
`1`		`-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.`
	`1`	`+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.`
`2`	`2`	`# All rights reserved.`
`3`	`3`	`#`
`4`	`4`	`# SPDX-License-Identifier: BSD-3-Clause`
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,4 @@`
`1`		`-# Copyright (c) 2022-2024, The Isaac Lab Project Developers.`
	`1`	`+# Copyright (c) 2022-2025, The Isaac Lab Project Developers.`
`2`	`2`	`# All rights reserved.`
`3`	`3`	`#`
`4`	`4`	`# SPDX-License-Identifier: BSD-3-Clause`
`5`		`-`
`6`		`-from . import rsl_rl_cfg # noqa: F401, F403`