Adds command generator to manage different command types (#68)

# Description This PR introduces the concept of command generators that can be used for goal-conditioned environments. The idea is that these classes can be used for task specification and the same environment can be configured for different task logics (position-based locomotion vs velocity based control). Currently, the included command generators are specific to locomotion (SE(2) control). They have their own visualization schemes (arrows, boxes etc.) that can be useful for debugging. ## Type of change - New feature (non-breaking change which adds functionality) - This change requires a documentation update ## Checklist - [x] I have run the [`pre-commit` checks](https://pre-commit.com/) with `./orbit.sh --format` - [x] I have made corresponding changes to the documentation - [x] My changes generate no new warnings - [ ] I have added tests that prove my fix is effective or that my feature works - [x] I have updated the changelog and the corresponding version in the extension's `config/extension.toml` file

Adds command generator to manage different command types (#68)
# Description This PR introduces the concept of command generators that can be used for goal-conditioned environments. The idea is that these classes can be used for task specification and the same environment can be configured for different task logics (position-based locomotion vs velocity based control). Currently, the included command generators are specific to locomotion (SE(2) control). They have their own visualization schemes (arrows, boxes etc.) that can be useful for debugging. ## Type of change - New feature (non-breaking change which adds functionality) - This change requires a documentation update ## Checklist - [x] I have run the [`pre-commit` checks](https://pre-commit.com/) with `./orbit.sh --format` - [x] I have made corresponding changes to the documentation - [x] My changes generate no new warnings - [ ] I have added tests that prove my fix is effective or that my feature works - [x] I have updated the changelog and the corresponding version in the extension's `config/extension.toml` file
4e727991 · Mayank Mittal · GitHub · f4bb9875 · 4e727991 · 4e727991
Unverified Commit 4e727991 authored Jul 21, 2023 by Mayank Mittal Committed by GitHub Jul 21, 2023
10 changed files
--- a/docs/source/api/index.rst
+++ b/docs/source/api/index.rst
@@ -18,6 +18,7 @@ omni.isaac.orbit extension
   orbit.robots
   orbit.sensors
   orbit.terrains
+   orbit.command_generators
   orbit.utils
   orbit.utils.assets
   orbit.utils.kit

--- a/docs/source/api/orbit.command_generators.rst
+++ b/docs/source/api/orbit.command_generators.rst
+omni.isaac.orbit.command_generators
+====================================
+.. automodule:: omni.isaac.orbit.command_generators
+   :members:
+   :show-inheritance:
--- a/source/extensions/omni.isaac.orbit/config/extension.toml
+++ b/source/extensions/omni.isaac.orbit/config/extension.toml
 [package]
 # Note: Semantic Versioning is used: https://semver.org/
-version = "0.6.1"
+version = "0.6.2"
 # Description
 title = "ORBIT framework for Robot Learning"

--- a/source/extensions/omni.isaac.orbit/docs/CHANGELOG.rst
+++ b/source/extensions/omni.isaac.orbit/docs/CHANGELOG.rst
 Changelog
 ---------
+0.6.2 (2023-07-21)
+~~~~~~~~~~~~~~~~~~
+Added
+^^^^^
+* Added the :mod:`omni.isaac.orbit.command_generators` to generate different commands based on the desired task.
+  It allows the user to generate commands for different tasks in the same environment without having to write
+  custom code for each task.
 0.6.1 (2023-07-16)
 ~~~~~~~~~~~~~~~~~~

--- a/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/__init__.py
+++ b/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/__init__.py
+# Copyright (c) 2022, NVIDIA CORPORATION & AFFILIATES, ETH Zurich, and University of Toronto
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+"""
+This submodule provides command generators for goal-conditioned tasks.
+The command generators are used to generate commands for the agent to execute. The command generators act
+as utility classes to make it convenient to switch between different command generation strategies within
+the same environment. For instance, in an environment consisting of a quadrupedal robot, the command to it
+could be a velocity command or position command. By keeping the command generation logic separate from the
+environment, it is easy to switch between different command generation strategies.
+The command generators are implemented as classes that inherit from the :class:`CommandGeneratorBase` class.
+Each command generator class should also have a corresponding configuration class that inherits from the
+:class:`CommandGeneratorBaseCfg` class.
+"""
+from .command_generator_base import CommandGeneratorBase
+from .command_generator_cfg import (
+    CommandGeneratorBaseCfg,
+    NormalVelocityCommandGeneratorCfg,
+    TerrainBasedPositionCommandGeneratorCfg,
+    UniformVelocityCommandGeneratorCfg,
+)
+from .position_command_generator import TerrainBasedPositionCommandGenerator
+from .velocity_command_generator import NormalVelocityCommandGenerator, UniformVelocityCommandGenerator
+__all__ = [
+    "CommandGeneratorBase",
+    "CommandGeneratorBaseCfg",
+    # velocity command generators
+    "UniformVelocityCommandGenerator",
+    "UniformVelocityCommandGeneratorCfg",
+    "NormalVelocityCommandGenerator",
+    "NormalVelocityCommandGeneratorCfg",
+    # position command generators
+    "TerrainBasedPositionCommandGenerator",
+    "TerrainBasedPositionCommandGeneratorCfg",
+]
--- a/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/command_generator_base.py
+++ b/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/command_generator_base.py
+# Copyright (c) 2022, NVIDIA CORPORATION & AFFILIATES, ETH Zurich, and University of Toronto
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+"""Base class for command generators.
+This class defines an interface for command generators that can be used for goal-conditioned
+tasks. Each command generator class should inherit from this class and implement the abstract
+methods.
+"""
+import torch
+from abc import ABC, abstractmethod
+from typing import Dict, Optional, Sequence
+from .command_generator_cfg import CommandGeneratorBaseCfg
+class CommandGeneratorBase(ABC):
+    """The base class for implementing a command generator.
+    A command generator is used to generate commands for goal-conditioned tasks. For example,
+    in the case of a goal-conditioned navigation task, the command generator can be used to
+    generate a target position for the robot to navigate to.
+    The command generator implements a resampling mechanism that allows the command to be
+    resampled at a fixed frequency. The resampling frequency can be specified in the
+    configuration object. Additionally, it is possible to assign a visualization function
+    to the command generator that can be used to visualize the command in the simulator.
+    """
+    def __init__(self, cfg: CommandGeneratorBaseCfg, env: object):
+        """Initialize the command generator class.
+        Args:
+            cfg (CommandGeneratorBaseCfg): The configuration parameters for the command generator.
+            env (object): The environment object.
+        """
+        # store the inputs
+        self.cfg = cfg
+        # extract the environment parameters
+        self.dt = env.dt
+        self.num_envs = env.num_envs
+        self.device = env.device
+        # create buffers to store the command
+        # -- metrics that can be used for logging
+        self.metrics = dict()
+        # -- time left before resampling
+        self.time_left = torch.zeros(self.num_envs, device=self.device)
+        # -- counter for the number of times the command has been resampled within the current episode
+        self.command_counter = torch.zeros(self.num_envs, device=self.device, dtype=torch.long)
+    """
+    Properties
+    """
+    @property
+    @abstractmethod
+    def command(self) -> torch.Tensor:
+        """The command tensor. Shape is (num_envs, command_dim)."""
+        raise NotImplementedError
+    """
+    Operations.
+    """
+    def reset(self, env_ids: Optional[Sequence[int]] = None):
+        """Reset the command generator.
+        This function resets the command counter and resamples the command. It should be called
+        at the beginning of each episode.
+        Args:
+            env_ids (Optional[Sequence[int]], optional): The list of environment IDs to reset. Defaults to None.
+        """
+        # resolve the environment IDs
+        if env_ids is None:
+            env_ids = ...
+        # set the command counter to zero
+        self.command_counter[env_ids] = 0
+        # resample the command
+        self._resample(env_ids)
+    def compute(self):
+        """Compute the command."""
+        # update the metrics based on current state
+        self._update_metrics()
+        # reduce the time left before resampling
+        self.time_left -= self.dt
+        # resample the command if necessary
+        resample_env_ids = (self.time_left <= 0.0).nonzero().flatten()
+        if len(resample_env_ids) > 0:
+            self._resample(resample_env_ids)
+        # update the command
+        self._update_command()
+    def log_info(self, env_ids: Sequence[int]) -> Dict[str, float]:
+        """Log information such as metrics.
+        Args:
+            env_ids (Sequence[int]): The list of environment IDs to log the information for.
+        Returns:
+            Dict[str, float]: A dictionary containing the information to log under the "Metrics/{name}" key.
+        """
+        extras = {}
+        for metric_name, metric_value in self.metrics.items():
+            # compute the mean metric value
+            extras[f"Metrics/{metric_name}"] = torch.mean(metric_value[env_ids]).item()
+            # reset the metric value
+            metric_value[env_ids] = 0.0
+        return extras
+    def debug_vis(self):
+        """Visualize the command in the simulator.
+        This is an optional function that can be used to visualize the command in the simulator.
+        """
+        if self.cfg.debug_vis:
+            pass
+    """
+    Helper functions.
+    """
+    def _resample(self, env_ids: Sequence[int]):
+        """Resample the command.
+        This function resamples the command and time for which the command is applied for the
+        specified environment indices.
+        Args:
+            env_ids (Sequence[int]): The list of environment IDs to resample.
+        """
+        # resample the time left before resampling
+        self.time_left[env_ids] = self.time_left[env_ids].uniform_(*self.cfg.resampling_time_range)
+        # increment the command counter
+        self.command_counter[env_ids] += 1
+        # resample the command
+        self._resample_command(env_ids)
+    """
+    Implementation specific functions.
+    """
+    @abstractmethod
+    def _resample_command(self, env_ids: Sequence[int]):
+        """Resample the command for the specified environments."""
+        raise NotImplementedError
+    @abstractmethod
+    def _update_command(self):
+        """Update the command based on the current state."""
+        raise NotImplementedError
+    @abstractmethod
+    def _update_metrics(self):
+        """Update the metrics based on the current state."""
+        raise NotImplementedError
--- a/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/command_generator_cfg.py
+++ b/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/command_generator_cfg.py
+# Copyright (c) 2022, NVIDIA CORPORATION & AFFILIATES, ETH Zurich, and University of Toronto
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+from dataclasses import MISSING
+from typing import ClassVar, Tuple
+from omni.isaac.orbit.utils import configclass
+"""
+Base command generator.
+"""
+@configclass
+class CommandGeneratorBaseCfg:
+    """Configuration for the base command generator."""
+    class_name: ClassVar[str] = MISSING
+    """Name of the command generator class."""
+    resampling_time_range: Tuple[float, float] = MISSING
+    """Time before commands are changed [s]."""
+    debug_vis: bool = False
+    """Whether to visualize debug information. Defaults to False."""
+"""
+Locomotion-specific command generators.
+"""
+@configclass
+class UniformVelocityCommandGeneratorCfg(CommandGeneratorBaseCfg):
+    """Configuration for the uniform velocity command generator."""
+    class_name = "UniformVelocityCommandGenerator"
+    robot_attr: str = MISSING
+    """Name of the robot attribute from the environment."""
+    heading_command: bool = MISSING
+    """Whether to use heading command or angular velocity command.
+    If True, the angular velocity command is computed from the heading error, where the
+    target heading is sampled uniformly from provided range. Otherwise, the angular velocity
+    command is sampled uniformly from provided range.
+    """
+    rel_standing_envs: float = MISSING
+    """Probability threshold for environments where the robots that are standing still."""
+    rel_heading_envs: float = MISSING
+    """Probability threshold for environments where the robots follow the heading-based angular velocity command
+    (the others follow the sampled angular velocity command)."""
+    @configclass
+    class Ranges:
+        """Uniform distribution ranges for the velocity commands."""
+        lin_vel_x: Tuple[float, float] = MISSING  # min max [m/s]
+        lin_vel_y: Tuple[float, float] = MISSING  # min max [m/s]
+        ang_vel_z: Tuple[float, float] = MISSING  # min max [rad/s]
+        heading: Tuple[float, float] = MISSING  # [rad]
+    ranges: Ranges = MISSING
+    """Distribution ranges for the velocity commands."""
+@configclass
+class NormalVelocityCommandGeneratorCfg(UniformVelocityCommandGeneratorCfg):
+    """Configuration for the normal velocity command generator."""
+    class_name = "NormalVelocityCommandGenerator"
+    heading_command: bool = False  # --> we don't use heading command for normal velocity command.
+    @configclass
+    class Ranges:
+        """Normal distribution ranges for the velocity commands."""
+        mean_vel: Tuple[float, float, float] = MISSING
+        """Mean velocity for the normal distribution.
+        The tuple contains the mean linear-x, linear-y, and angular-z velocity.
+        """
+        std_vel: Tuple[float, float, float] = MISSING
+        """Standard deviation for the normal distribution.
+        The tuple contains the standard deviation linear-x, linear-y, and angular-z velocity.
+        """
+        zero_prob: Tuple[float, float, float] = MISSING
+        """Probability of zero velocity for the normal distribution.
+        The tuple contains the probability of zero linear-x, linear-y, and angular-z velocity.
+        """
+    ranges: Ranges = MISSING
+    """Distribution ranges for the velocity commands."""
+@configclass
+class TerrainBasedPositionCommandGeneratorCfg(CommandGeneratorBaseCfg):
+    """Configuration for the terrain-based position command generator."""
+    class_name = "TerrainBasedPositionCommandGenerator"
+    robot_attr: str = MISSING
+    """Name of the robot attribute from the environment."""
+    rel_standing_envs: float = MISSING
+    """Probability threshold for environments where the robots that are standing still."""
+    simple_heading: bool = MISSING
+    """Whether to use simple heading or not.
+    If True, the heading is in the direction of the target position.
+    """
+    @configclass
+    class Ranges:
+        """Uniform distribution ranges for the velocity commands."""
+        heading: Tuple[float, float] = MISSING
+        """Heading range for the position commands (in rad).
+        Used only if :attr:`simple_heading` is False.
+        """
+    ranges: Ranges = MISSING
+    """Distribution ranges for the position commands."""
--- a/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/position_command_generator.py
+++ b/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/position_command_generator.py
+# Copyright (c) 2022, NVIDIA CORPORATION & AFFILIATES, ETH Zurich, and University of Toronto
+# All rights reserved.
+#
+# SPDX-License-Identifier: BSD-3-Clause
+"""Sub-module containing command generators for the position-based locomotion task."""
+import torch
+from typing import Sequence
+from omni.isaac.orbit.markers import VisualizationMarkers
+from omni.isaac.orbit.markers.config import CUBOID_MARKER_CFG
+from omni.isaac.orbit.robots.robot_base import RobotBase
+from omni.isaac.orbit.terrains import TerrainImporter
+from omni.isaac.orbit.utils.math import quat_rotate_inverse, wrap_to_pi, yaw_quat
+from .command_generator_base import CommandGeneratorBase
+from .command_generator_cfg import TerrainBasedPositionCommandGeneratorCfg
+class TerrainBasedPositionCommandGenerator(CommandGeneratorBase):
+    """Command generator that generates position commands based on the terrain.
+    The position commands are sampled from the terrain mesh and the heading commands are either set
+    to point towards the target or are sampled uniformly.
+    """
+    cfg: TerrainBasedPositionCommandGeneratorCfg
+    """Configuration for the command generator."""
+    def __init__(self, cfg: TerrainBasedPositionCommandGeneratorCfg, env: object):
+        """Initialize the command generator class.
+        Args:
+            cfg (TerrainBasedPositionCommandGeneratorCfg): The configuration parameters for the command generator.
+            env (object): The environment object.
+        """
+        super().__init__(cfg, env)
+        # -- robot
+        # TODO: Should we make this configurable like this?
+        self.robot: RobotBase = getattr(env, cfg.robot_attr)
+        # -- terrain
+        self.terrain: TerrainImporter = env.terrain
+        # -- commands: (x, y, z, heading)
+        self.pos_command_w = torch.zeros(self.num_envs, 3, device=self.device)
+        self.heading_command_w = torch.zeros(self.num_envs, device=self.device)
+        self.pos_command_b = torch.zeros_like(self.pos_command_w)
+        self.heading_command_b = torch.zeros_like(self.heading_command_w)
+        # -- metrics
+        self.metrics["error_pos"] = torch.zeros(self.num_envs, device=self.device)
+        self.metrics["error_heading"] = torch.zeros(self.num_envs, device=self.device)
+        # -- debug vis
+        self._box_goal_marker = None
+    def __str__(self) -> str:
+        msg = "TerrainBasedPositionCommandGenerator:\n"
+        msg += f"\tCommand dimension: {tuple(self.command.shape[1:])}\n"
+        msg += f"\tResampling time range: {self.cfg.resampling_time_range}\n"
+        msg += f"\tStanding probability: {self.cfg.rel_standing_envs}"
+        return msg
+    """
+    Properties
+    """
+    @property
+    def command(self) -> torch.Tensor:
+        """The desired base position in base frame. Shape is (num_envs, 3)."""
+        return self.pos_command_b
+    """
+    Operations.
+    """
+    def debug_vis(self):
+        if self.cfg.debug_vis:
+            # create the box marker if necessary
+            if self._box_goal_marker is None:
+                marker_cfg = CUBOID_MARKER_CFG
+                marker_cfg.markers["cuboid"].color = (1.0, 0.0, 0.0)
+                marker_cfg.markers["cuboid"].scale = (0.1, 0.1, 0.1)
+                self._box_goal_marker = VisualizationMarkers("/Visuals/base_position_goal", marker_cfg)
+            # update the box marker
+            self._box_goal_marker.visualize(self.pos_command_w)
+    """
+    Implementation specific functions.
+    """
+    def _resample_command(self, env_ids: Sequence[int]):
+        # sample new position targets from the terrain
+        # TODO: need to add that here directly
+        self.pos_command_w[env_ids] = self.terrain.sample_new_targets(env_ids)
+        # offset the position command by the current root position
+        self.pos_command_w[env_ids, 2] += self.robot.get_default_root_states(clone=False)[env_ids, 2]
+        if self.cfg.simple_heading:
+            # set heading command to point towards target
+            target_vec = self.pos_command_w[env_ids] - self.robot.data.root_pos_w[env_ids]
+            target_direction = torch.atan2(target_vec[:, 1], target_vec[:, 0])
+            flipped_heading = wrap_to_pi(target_direction + torch.pi)
+            self.heading_command_w[env_ids] = torch.where(
+                wrap_to_pi(target_direction - self.robot.data.heading_w[env_ids]).abs()
+                < wrap_to_pi(flipped_heading - self.robot.data.heading_w[env_ids]).abs(),
+                target_direction,
+                flipped_heading,
+            )
+        else:
+            # random heading command
+            r = torch.empty(len(env_ids), device=self.device)
+            self.heading_command_w[env_ids] = r.uniform_(*self.cfg.ranges.heading)
+    def _update_command(self):
+        """Retargets the position command to the current root position and heading."""
+        target_vec = self.pos_command_w - self.robot.root_pos_w[:, :3]
+        self.pos_command_b[:] = quat_rotate_inverse(yaw_quat(self.robot.root_quat_w), target_vec)
+        self.heading_command_b[:] = wrap_to_pi(self.heading_command_w - self.robot.heading_w)
+    def _update_metrics(self):
+        # logs data
+        self.metrics["error_pos"] = torch.norm(self.pos_command_w - self.robot.root_pos_w[:, :3], dim=1)
+        self.metrics["error_heading"] = torch.abs(wrap_to_pi(self.heading_command_w - self.robot.heading_w))
--- a/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/velocity_command_generator.py
+++ b/source/extensions/omni.isaac.orbit/omni/isaac/orbit/command_generators/velocity_command_generator.py
--- a/source/extensions/omni.isaac.orbit/omni/isaac/orbit/markers/config/__init__.py
+++ b/source/extensions/omni.isaac.orbit/omni/isaac/orbit/markers/config/__init__.py
@@ -62,3 +62,23 @@ CONTACT_SENSOR_MARKER_CFG = VisualizationMarkersCfg(
    },
 )
 """Configuration for the contact sensor marker."""
+ARROW_X_MARKER_CFG = VisualizationMarkersCfg(
+    markers={
+        "arrow": VisualizationMarkersCfg.FileMarkerCfg(
+            usd_path=f"{ISAAC_NUCLEUS_DIR}/Props/UIElements/arrow_x.usd",
+            scale=[1.0, 0.1, 0.1],
+        )
+    }
+)
+"""Configuration for the arrow marker (along x-direction)."""
+CUBOID_MARKER_CFG = VisualizationMarkersCfg(
+    markers={
+        "cuboid": VisualizationMarkersCfg.MarkerCfg(
+            prim_type="Cube",
+        )
+    }
+)
+"""Configuration for the cuboid marker."""