src/lerobot/processor/delta_action_processor.py

# !/usr/bin/env python

# Copyright 2025 The HuggingFace Inc. team. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from dataclasses import dataclass, field

from torch import Tensor

from lerobot.configs.types import FeatureType, PolicyFeature
from lerobot.processor.pipeline import ActionProcessor, ProcessorStepRegistry


@ProcessorStepRegistry.register("map_delta_action_to_robot_action")
@dataclass
class MapDeltaActionToRobotAction(ActionProcessor):
    """
    Map delta actions from teleoperators (gamepad, keyboard) to robot target actions
    for use with inverse kinematics processors.

    Expected input ACTION keys:
    {
        "action.delta_x": float,
        "action.delta_y": float,
        "action.delta_z": float,
        "action.gripper": float (optional),
    }

    Output ACTION keys:
    {
        "action.enabled": bool,
        "action.target_x": float,
        "action.target_y": float,
        "action.target_z": float,
        "action.target_wx": float,
        "action.target_wy": float,
        "action.target_wz": float,
        "action.gripper": float,
    }
    """

    # Scale factors for delta movements
    position_scale: float = 1.0
    rotation_scale: float = 0.0  # No rotation deltas for gamepad/keyboard
    gripper_deadzone: float = 0.1  # Threshold for gripper activation
    _prev_enabled: bool = field(default=False, init=False, repr=False)

    def action(self, action: dict | Tensor | None) -> dict:
        if action is None:
            return {}

        # NOTE (maractingi): Action can be a dict from the teleop_devices or a tensor from the policy
        # TODO (maractingi): changing this target_xyz naming convention from the teleop_devices
        if isinstance(action, dict):
            delta_x = action.pop("action.delta_x", 0.0)
            delta_y = action.pop("action.delta_y", 0.0)
            delta_z = action.pop("action.delta_z", 0.0)
            gripper = action.pop("action.gripper", 1.0)  # Default to "stay" (1.0)
        else:
            delta_x = action[0].item()
            delta_y = action[1].item()
            delta_z = action[2].item()
            gripper = action[3].item()

        # Determine if the teleoperator is actively providing input
        # Consider enabled if any significant movement delta is detected
        position_magnitude = abs(delta_x) + abs(delta_y) + abs(delta_z)
        enabled = position_magnitude > 1e-6  # Small threshold to avoid noise

        # Scale the deltas appropriately
        scaled_delta_x = float(delta_x) * self.position_scale
        scaled_delta_y = float(delta_y) * self.position_scale
        scaled_delta_z = float(delta_z) * self.position_scale

        # For gamepad/keyboard, we don't have rotation input, so set to 0
        # These could be extended in the future for more sophisticated teleoperators
        target_wx = 0.0
        target_wy = 0.0
        target_wz = 0.0

        # Update action with robot target format
        action = {
            "action.enabled": enabled,
            "action.target_x": scaled_delta_x,
            "action.target_y": scaled_delta_y,
            "action.target_z": scaled_delta_z,
            "action.target_wx": target_wx,
            "action.target_wy": target_wy,
            "action.target_wz": target_wz,
            "action.gripper": float(gripper),
        }

        self._prev_enabled = enabled
        return action

    def transform_features(self, features: dict[str, PolicyFeature]) -> dict[str, PolicyFeature]:
        """Transform features to match output format."""
        # Update features to reflect the new action format
        features.update(
            {
                "action.enabled": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
                "action.target_x": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
                "action.target_y": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
                "action.target_z": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
                "action.target_wx": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
                "action.target_wy": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
                "action.target_wz": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
                "action.gripper": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),
            }
        )
        return features

    def reset(self):
        self._prev_enabled = False
Refactor`gym_manipulator.py` using the universal pipeline (#1650) * Migrate gym_manipulator to use the pipeline Added get_teleop_events function to capture relevant events from teleop devices unrelated to actions * Added the capability to record a dataset * Added the replay functionality with the pipeline * Refactored `actor.py` to use the pipeline * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * RL works at this commit - fixed actor.py and bugs in gym_manipulator * change folder structure to reduce the size of gym_manip * Refactored hilserl config * Remove dataset and mode from HilSerlEnvConfig to a GymManipulatorConfig to reduce verbose of configs during training * format docs * removed get_teleop_events from abc * Refactor environment configuration and processing pipeline for GymHIL support. Removed device attribute from HILSerlRobotEnvConfig, added DummyTeleopDevice for simulation, and updated processor creation to accommodate GymHIL environments. * Improved typing for HILRobotEnv config and GymManipulator config * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * Migrated `gym_manipulator` to use a more modular structure similar to phone teleop * Refactor gripper handling and transition processing in HIL and robot kinematic processors - Updated gripper position handling to use a consistent key format across processors - Improved the EEReferenceAndDelta class to handle reference joint positions. - Added support for discrete gripper actions in the GripperVelocityToJoint processor. - Refactored the gym manipulator to improve modularity and clarity in processing steps. * Added delta_action_processor mapping wrapper * Added missing file delta_action_processor and improved imports in `gym_manipulator` * nit * Added missing file joint_observation_processor * Enhance processing architecture with new teleoperation processors - Introduced `AddTeleopActionAsComplimentaryData` and `AddTeleopEventsAsInfo` for integrating teleoperator actions and events into transitions. - Added `Torch2NumpyActionProcessor` and `Numpy2TorchActionProcessor` for seamless conversion between PyTorch tensors and NumPy arrays. - Updated `__init__.py` to include new processors in module exports, improving modularity and clarity in the processing pipeline. - GymHIL is now fully supported with HIL using the pipeline * Refactor configuration structure for gym_hil integration - Renamed sections for better readability, such as changing "Gym Wrappers Configuration" to "Processor Configuration." - Enhanced documentation with clear examples for dataset collection and policy evaluation configurations. * Enhance reset configuration and teleoperation event handling - Added `terminate_on_success` parameter to `ResetConfig` and `InterventionActionProcessor` for controlling episode termination behavior upon success detection. - Updated documentation to clarify the impact of `terminate_on_success` on data collection for reward classifier training. - Refactored teleoperation event handling to use `TeleopEvents` constants for improved readability and maintainability across various modules. * fix(keyboard teleop), delta action keys * Added transform features and feature contract * Added transform features for image crop * Enum for TeleopEvents * Update tranform_features delta action proc --------- Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com> 2025-08-11 11:07:55 +02:00			`# !/usr/bin/env python`

			`# Copyright 2025 The HuggingFace Inc. team. All rights reserved.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`

			`from dataclasses import dataclass, field`

			`from torch import Tensor`

			`from lerobot.configs.types import FeatureType, PolicyFeature`
			`from lerobot.processor.pipeline import ActionProcessor, ProcessorStepRegistry`


			`@ProcessorStepRegistry.register("map_delta_action_to_robot_action")`
			`@dataclass`
			`class MapDeltaActionToRobotAction(ActionProcessor):`
			`"""`
			`Map delta actions from teleoperators (gamepad, keyboard) to robot target actions`
			`for use with inverse kinematics processors.`

			`Expected input ACTION keys:`
			`{`
			`"action.delta_x": float,`
			`"action.delta_y": float,`
			`"action.delta_z": float,`
			`"action.gripper": float (optional),`
			`}`

			`Output ACTION keys:`
			`{`
			`"action.enabled": bool,`
			`"action.target_x": float,`
			`"action.target_y": float,`
			`"action.target_z": float,`
			`"action.target_wx": float,`
			`"action.target_wy": float,`
			`"action.target_wz": float,`
			`"action.gripper": float,`
			`}`
			`"""`

			`# Scale factors for delta movements`
			`position_scale: float = 1.0`
			`rotation_scale: float = 0.0 # No rotation deltas for gamepad/keyboard`
			`gripper_deadzone: float = 0.1 # Threshold for gripper activation`
			`_prev_enabled: bool = field(default=False, init=False, repr=False)`

			`def action(self, action: dict \| Tensor \| None) -> dict:`
			`if action is None:`
			`return {}`

			`# NOTE (maractingi): Action can be a dict from the teleop_devices or a tensor from the policy`
			`# TODO (maractingi): changing this target_xyz naming convention from the teleop_devices`
			`if isinstance(action, dict):`
			`delta_x = action.pop("action.delta_x", 0.0)`
			`delta_y = action.pop("action.delta_y", 0.0)`
			`delta_z = action.pop("action.delta_z", 0.0)`
			`gripper = action.pop("action.gripper", 1.0) # Default to "stay" (1.0)`
			`else:`
			`delta_x = action[0].item()`
			`delta_y = action[1].item()`
			`delta_z = action[2].item()`
			`gripper = action[3].item()`

			`# Determine if the teleoperator is actively providing input`
			`# Consider enabled if any significant movement delta is detected`
			`position_magnitude = abs(delta_x) + abs(delta_y) + abs(delta_z)`
			`enabled = position_magnitude > 1e-6 # Small threshold to avoid noise`

			`# Scale the deltas appropriately`
			`scaled_delta_x = float(delta_x) * self.position_scale`
			`scaled_delta_y = float(delta_y) * self.position_scale`
			`scaled_delta_z = float(delta_z) * self.position_scale`

			`# For gamepad/keyboard, we don't have rotation input, so set to 0`
			`# These could be extended in the future for more sophisticated teleoperators`
			`target_wx = 0.0`
			`target_wy = 0.0`
			`target_wz = 0.0`

			`# Update action with robot target format`
			`action = {`
			`"action.enabled": enabled,`
			`"action.target_x": scaled_delta_x,`
			`"action.target_y": scaled_delta_y,`
			`"action.target_z": scaled_delta_z,`
			`"action.target_wx": target_wx,`
			`"action.target_wy": target_wy,`
			`"action.target_wz": target_wz,`
			`"action.gripper": float(gripper),`
			`}`

			`self._prev_enabled = enabled`
			`return action`

			`def transform_features(self, features: dict[str, PolicyFeature]) -> dict[str, PolicyFeature]:`
			`"""Transform features to match output format."""`
			`# Update features to reflect the new action format`
			`features.update(`
			`{`
			`"action.enabled": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`"action.target_x": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`"action.target_y": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`"action.target_z": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`"action.target_wx": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`"action.target_wy": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`"action.target_wz": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`"action.gripper": PolicyFeature(type=FeatureType.ACTION, shape=(1,)),`
			`}`
			`)`
			`return features`

			`def reset(self):`
			`self._prev_enabled = False`