Changes from all commits
42 commits
076a27a
Update pick_place configs and tasks
HanchuZhou Dec 3, 2025
81db6d7
Fix bug that success rate is more than 100% in evaluate_lift.py; Fixe…
HanchuZhou Dec 6, 2025
17a74b3
add contributor
HanchuZhou Dec 6, 2025
c0699a8
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Dec 6, 2025
e0ceed6
Fixing success rate bug; Enable more flexible evaluation that user ca…
HanchuZhou Dec 11, 2025
58db815
Merge branch 'develop' of https://github.com/HanchuZhou/RoboVerse int…
HanchuZhou Dec 11, 2025
066596d
Make training script individual; Add gripper downward reward
HanchuZhou Dec 11, 2025
c13ef64
Update pick_place configs and tasks
HanchuZhou Dec 3, 2025
3196e18
Fix bug that success rate is more than 100% in evaluate_lift.py; Fixe…
HanchuZhou Dec 6, 2025
d67aab3
Fixing success rate bug; Enable more flexible evaluation that user ca…
HanchuZhou Dec 11, 2025
3ad659f
Make training script individual; Add gripper downward reward
HanchuZhou Dec 11, 2025
0355e60
Resolved merge conflicts by keeping local versions
Anchor1021 Dec 12, 2025
7e6fed2
"Refactor approach_grasp tasks, yaml, and track tasks yaml"
Anchor1021 Dec 12, 2025
849ce1d
"Refactor pick_place grasp logic and add object configs"
Anchor1021 Dec 12, 2025
6b49480
Refactor pick_place grasp logic and add object configs
Anchor1021 Dec 12, 2025
cb5635a
Adjust Spoon, two spoon class in one file, two spoon yaml.
Anchor1021 Dec 14, 2025
671aff4
Apply pre-commit fixes and add new pick_place_spoon2 config
Anchor1021 Dec 14, 2025
6f3913e
Local devcontainer config (ignored from push)
Anchor1021 Dec 14, 2025
e89acb4
Fix duplicated sim key in pick_place_spoon2.yaml
Anchor1021 Dec 14, 2025
5ced66f
Trigger CI
Anchor1021 Dec 14, 2025
dd932c5
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Dec 14, 2025
e96b4a2
update the position of banana and screw driver
HanchuZhou Dec 14, 2025
c2d2160
Merge branch 'develop' of https://github.com/HanchuZhou/RoboVerse int…
HanchuZhou Dec 14, 2025
92912be
add approach_grasp.py
HanchuZhou Dec 15, 2025
3066002
Merge branch 'RoboVerseOrg:develop' into develop
HanchuZhou Dec 15, 2025
f2853f4
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Dec 15, 2025
4fbe0b0
Roll back readme
HanchuZhou Dec 15, 2025
bbd2ba5
roll back
HanchuZhou Dec 15, 2025
342a44b
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Dec 15, 2025
7612ce4
roll back collect demo
HanchuZhou Dec 15, 2025
d8c9b24
roll back collect demo
HanchuZhou Dec 15, 2025
c0a8831
Revise devcontainer.json for development setup
HanchuZhou Dec 15, 2025
ae75807
Remove devcontainer.json from .gitignore
HanchuZhou Dec 15, 2025
2bd96c6
Merge upstream develop into fork develop
Anchor1021 Dec 16, 2025
3a5f9ec
hardcode approach_grasp; roll back rl/fast_td3/train and base.pyto pr…
Anchor1021 Dec 16, 2025
1d74b67
Apply pre-commit formatting and lint fixes
Anchor1021 Dec 16, 2025
a9b421e
In evaluate_lift.py, record the state that N frames after grasping; A…
HanchuZhou Dec 18, 2025
037e7dc
Change evaluate_lift.py, make sure the gripper holds the object; Add …
HanchuZhou Dec 18, 2025
8f1d867
Merge branch 'develop' of https://github.com/HanchuZhou/RoboVerse int…
HanchuZhou Dec 18, 2025
2beb889
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Dec 18, 2025
6a0cf99
Add several new tasks
HanchuZhou Dec 19, 2025
3fceee9
add single banana tasks
HanchuZhou Jan 14, 2026
6 changes: 5 additions & 1 deletion metasim/sim/isaacgym/isaacgym.py
Original file line number Diff line number Diff line change
@@ -774,7 +774,11 @@ def _get_states(self, env_ids: list[int] | None = None) -> list[DictEnvState]:

# Apply GS background rendering if enabled
# TODO: Render with batch parallelization for efficiency
if self.scenario.gs_scene.with_gs_background and self.gs_background is not None:
if (
self.scenario.gs_scene is not None
and self.scenario.gs_scene.with_gs_background
and self.gs_background is not None
):
assert ROBO_SPLATTER_AVAILABLE, "RoboSplatter is not available. GS background rendering will be disabled."
camera_states = self._apply_gs_background_rendering(camera_states, env_ids)

89 changes: 89 additions & 0 deletions roboverse_learn/rl/fast_td3/configs/pick_place_banana2.yaml
@@ -0,0 +1,89 @@
# Base Configuration for FastTD3 Training - Banana 2
# Default configuration with IsaacGym simulator and Franka robot

# -------------------------------------------------------------------------------
# Environment
# -------------------------------------------------------------------------------
sim: "isaacgym"
robots: ["franka"]
task: "pick_place.approach_grasp_simple_banana2"
decimation: 4
train_or_eval: "train"
headless: true

# -------------------------------------------------------------------------------
# Seeds & Device
# -------------------------------------------------------------------------------
seed: 1
cuda: true
torch_deterministic: true
device_rank: 0

# -------------------------------------------------------------------------------
# Rollout & Timesteps
# -------------------------------------------------------------------------------
num_envs: 400
num_eval_envs: 400
total_timesteps: 2000000
learning_starts: 10
num_steps: 1

# -------------------------------------------------------------------------------
# Replay, Batching, Discounting
# -------------------------------------------------------------------------------
buffer_size: 20480
batch_size: 32768
gamma: 0.99
tau: 0.1

# -------------------------------------------------------------------------------
# Update Schedule
# -------------------------------------------------------------------------------
policy_frequency: 2
num_updates: 5

# -------------------------------------------------------------------------------
# Optimizer & Network
# -------------------------------------------------------------------------------
critic_learning_rate: 0.0003
actor_learning_rate: 0.0003
weight_decay: 0.1
critic_hidden_dim: 512
actor_hidden_dim: 256
init_scale: 0.01
num_atoms: 101

# -------------------------------------------------------------------------------
# Value Distribution & Exploration
# -------------------------------------------------------------------------------
v_min: 0
v_max: 600.0
policy_noise: 0.001
std_min: 0.001
std_max: 0.4
noise_clip: 0.5

# -------------------------------------------------------------------------------
# Algorithm Flags
# -------------------------------------------------------------------------------
use_cdq: true
compile: true
obs_normalization: true
max_grad_norm: 0.0
amp: true
amp_dtype: "fp16"
disable_bootstrap: false
measure_burnin: 3

# -------------------------------------------------------------------------------
# Logging & Checkpointing
# -------------------------------------------------------------------------------
wandb_project: "get_started_fttd3"
exp_name: "get_started_fttd3_banana2"
use_wandb: false
checkpoint_path: null
run_name: "pick_place.approach_grasp_simple_banana2" # Unique run name
model_dir: "models/banana2" # Separate directory for banana checkpoints
eval_interval: 5000
save_interval: 5000
video_width: 1024
video_height: 1024
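These new configs are plain YAML, so a training script can consume them with `yaml.safe_load`. The loader below is only an illustrative sketch, not the repo's actual entry point; it inlines a few representative keys from `pick_place_banana2.yaml` and assumes PyYAML is installed:

```python
import yaml

# Representative keys from pick_place_banana2.yaml, inlined so the
# sketch is self-contained.
CONFIG_TEXT = """
sim: "isaacgym"
robots: ["franka"]
task: "pick_place.approach_grasp_simple_banana2"
num_envs: 400
total_timesteps: 2000000
headless: True
"""

cfg = yaml.safe_load(CONFIG_TEXT)

# YAML 1.1 parses the unquoted scalar True as a boolean, so downstream
# code can branch on it directly rather than comparing strings.
assert cfg["headless"] is True

print(cfg["task"])      # pick_place.approach_grasp_simple_banana2
print(cfg["num_envs"])  # 400
```

Note that `buffer_size: 20480` is smaller than `batch_size: 32768` here; in FastTD3-style trainers the buffer is typically sized per environment, so the effective capacity is `buffer_size * num_envs`.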
89 changes: 89 additions & 0 deletions roboverse_learn/rl/fast_td3/configs/pick_place_banana3.yaml
@@ -0,0 +1,89 @@
# Base Configuration for FastTD3 Training - Banana 3
# Default configuration with IsaacGym simulator and Franka robot

# -------------------------------------------------------------------------------
# Environment
# -------------------------------------------------------------------------------
sim: "isaacgym"
robots: ["franka"]
task: "pick_place.approach_grasp_simple_banana3"
decimation: 4
train_or_eval: "train"
headless: true

# -------------------------------------------------------------------------------
# Seeds & Device
# -------------------------------------------------------------------------------
seed: 1
cuda: true
torch_deterministic: true
device_rank: 0

# -------------------------------------------------------------------------------
# Rollout & Timesteps
# -------------------------------------------------------------------------------
num_envs: 400
num_eval_envs: 400
total_timesteps: 2000000
learning_starts: 10
num_steps: 1

# -------------------------------------------------------------------------------
# Replay, Batching, Discounting
# -------------------------------------------------------------------------------
buffer_size: 20480
batch_size: 32768
gamma: 0.99
tau: 0.1

# -------------------------------------------------------------------------------
# Update Schedule
# -------------------------------------------------------------------------------
policy_frequency: 2
num_updates: 5

# -------------------------------------------------------------------------------
# Optimizer & Network
# -------------------------------------------------------------------------------
critic_learning_rate: 0.0003
actor_learning_rate: 0.0003
weight_decay: 0.1
critic_hidden_dim: 512
actor_hidden_dim: 256
init_scale: 0.01
num_atoms: 101

# -------------------------------------------------------------------------------
# Value Distribution & Exploration
# -------------------------------------------------------------------------------
v_min: 0
v_max: 600.0
policy_noise: 0.001
std_min: 0.001
std_max: 0.4
noise_clip: 0.5

# -------------------------------------------------------------------------------
# Algorithm Flags
# -------------------------------------------------------------------------------
use_cdq: true
compile: true
obs_normalization: true
max_grad_norm: 0.0
amp: true
amp_dtype: "fp16"
disable_bootstrap: false
measure_burnin: 3

# -------------------------------------------------------------------------------
# Logging & Checkpointing
# -------------------------------------------------------------------------------
wandb_project: "get_started_fttd3"
exp_name: "get_started_fttd3_banana3"
use_wandb: false
checkpoint_path: null
run_name: "pick_place.approach_grasp_simple_banana3" # Unique run name
model_dir: "models/banana3" # Separate directory for banana checkpoints
eval_interval: 5000
save_interval: 5000
video_width: 1024
video_height: 1024
89 changes: 89 additions & 0 deletions roboverse_learn/rl/fast_td3/configs/pick_place_banana4.yaml
@@ -0,0 +1,89 @@
# Base Configuration for FastTD3 Training - Banana 4
# Default configuration with IsaacGym simulator and Franka robot

# -------------------------------------------------------------------------------
# Environment
# -------------------------------------------------------------------------------
sim: "isaacgym"
robots: ["franka"]
task: "pick_place.approach_grasp_simple_banana4"
decimation: 4
train_or_eval: "train"
headless: true

# -------------------------------------------------------------------------------
# Seeds & Device
# -------------------------------------------------------------------------------
seed: 1
cuda: true
torch_deterministic: true
device_rank: 0

# -------------------------------------------------------------------------------
# Rollout & Timesteps
# -------------------------------------------------------------------------------
num_envs: 400
num_eval_envs: 400
total_timesteps: 2000000
learning_starts: 10
num_steps: 1

# -------------------------------------------------------------------------------
# Replay, Batching, Discounting
# -------------------------------------------------------------------------------
buffer_size: 20480
batch_size: 32768
gamma: 0.99
tau: 0.1

# -------------------------------------------------------------------------------
# Update Schedule
# -------------------------------------------------------------------------------
policy_frequency: 2
num_updates: 5

# -------------------------------------------------------------------------------
# Optimizer & Network
# -------------------------------------------------------------------------------
critic_learning_rate: 0.0003
actor_learning_rate: 0.0003
weight_decay: 0.1
critic_hidden_dim: 512
actor_hidden_dim: 256
init_scale: 0.01
num_atoms: 101

# -------------------------------------------------------------------------------
# Value Distribution & Exploration
# -------------------------------------------------------------------------------
v_min: 0
v_max: 600.0
policy_noise: 0.001
std_min: 0.001
std_max: 0.4
noise_clip: 0.5

# -------------------------------------------------------------------------------
# Algorithm Flags
# -------------------------------------------------------------------------------
use_cdq: true
compile: true
obs_normalization: true
max_grad_norm: 0.0
amp: true
amp_dtype: "fp16"
disable_bootstrap: false
measure_burnin: 3

# -------------------------------------------------------------------------------
# Logging & Checkpointing
# -------------------------------------------------------------------------------
wandb_project: "get_started_fttd3"
exp_name: "get_started_fttd3_banana4"
use_wandb: false
checkpoint_path: null
run_name: "pick_place.approach_grasp_simple_banana4" # Unique run name
model_dir: "models/banana4" # Separate directory for banana checkpoints
eval_interval: 5000
save_interval: 5000
video_width: 1024
video_height: 1024
89 changes: 89 additions & 0 deletions roboverse_learn/rl/fast_td3/configs/pick_place_banana5.yaml
@@ -0,0 +1,89 @@
# Base Configuration for FastTD3 Training - Banana 5
# Default configuration with IsaacGym simulator and Franka robot

# -------------------------------------------------------------------------------
# Environment
# -------------------------------------------------------------------------------
sim: "isaacgym"
robots: ["franka"]
task: "pick_place.approach_grasp_simple_banana5"
decimation: 4
train_or_eval: "train"
headless: true

# -------------------------------------------------------------------------------
# Seeds & Device
# -------------------------------------------------------------------------------
seed: 1
cuda: true
torch_deterministic: true
device_rank: 0

# -------------------------------------------------------------------------------
# Rollout & Timesteps
# -------------------------------------------------------------------------------
num_envs: 400
num_eval_envs: 400
total_timesteps: 2000000
learning_starts: 10
num_steps: 1

# -------------------------------------------------------------------------------
# Replay, Batching, Discounting
# -------------------------------------------------------------------------------
buffer_size: 20480
batch_size: 32768
gamma: 0.99
tau: 0.1

# -------------------------------------------------------------------------------
# Update Schedule
# -------------------------------------------------------------------------------
policy_frequency: 2
num_updates: 5

# -------------------------------------------------------------------------------
# Optimizer & Network
# -------------------------------------------------------------------------------
critic_learning_rate: 0.0003
actor_learning_rate: 0.0003
weight_decay: 0.1
critic_hidden_dim: 512
actor_hidden_dim: 256
init_scale: 0.01
num_atoms: 101

# -------------------------------------------------------------------------------
# Value Distribution & Exploration
# -------------------------------------------------------------------------------
v_min: 0
v_max: 600.0
policy_noise: 0.001
std_min: 0.001
std_max: 0.4
noise_clip: 0.5

# -------------------------------------------------------------------------------
# Algorithm Flags
# -------------------------------------------------------------------------------
use_cdq: true
compile: true
obs_normalization: true
max_grad_norm: 0.0
amp: true
amp_dtype: "fp16"
disable_bootstrap: false
measure_burnin: 3

# -------------------------------------------------------------------------------
# Logging & Checkpointing
# -------------------------------------------------------------------------------
wandb_project: "get_started_fttd3"
exp_name: "get_started_fttd3_banana5"
use_wandb: false
checkpoint_path: null
run_name: "pick_place.approach_grasp_simple_banana5" # Unique run name
model_dir: "models/banana5" # Separate directory for banana checkpoints
eval_interval: 5000
save_interval: 5000
video_width: 1024
video_height: 1024