mirror of
https://github.com/huggingface/lerobot.git
synced 2026-06-02 20:01:25 +00:00
* [Port codebase pipeline] General fixes for RL and scripts (#1748) * Refactor dataset configuration in documentation and codebase - Updated dataset configuration keys from `dataset_root` to `root` and `num_episodes` to `num_episodes_to_record` for consistency. - Adjusted replay episode handling by renaming `episode` to `replay_episode`. - Enhanced documentation - added specific processor to transform from policy actions to delta actions * Added Robot action to tensor processor Added new processor script for dealing with gym specific action processing * removed RobotAction2Tensor processor; imrpoved choosing observations in actor * nit in delta action * added missing reset functions to kinematics * Adapt teleoperate and replay to pipeline similar to record * refactor(processors): move to inheritance (#1750) * fix(teleoperator): improvements phone implementation (#1752) * fix(teleoperator): protect shared state in phone implementation * refactor(teleop): separate classes in phone * fix: solve breaking changes (#1753) * refactor(policies): multiple improvements (#1754) * refactor(processor): simpler logic in device processor (#1755) * refactor(processor): euclidean distance in delta action processor (#1757) * refactor(processor): improvements to joint observations processor migration (#1758) * refactor(processor): improvements to tokenizer migration (#1759) * refactor(processor): improvements to tokenizer migration * fix(tests): tokenizer tests regression from #1750 * fix(processors): fix float comparison and config in hil processors (#1760) * chore(teleop): remove unnecessary callbacks in KeyboardEndEffectorTeleop (#1761) * refactor(processor): improvements normalize pipeline migration (#1756) * refactor(processor): several improvements normalize processor step * refactor(processor): more improvements normalize processor * refactor(processor): more changes to normalizer * refactor(processor): take a different approach to DRY * refactor(processor): final design * 
chore(record): revert comment and continue deleted (#1764) * refactor(examples): pipeline phone examples (#1769) * refactor(examples): phone teleop + teleop script * refactor(examples): phone replay + replay * chore(examples): rename phone example files & folders * feat(processor): fix improvements to the pipeline porting (#1796) * refactor(processor): enhance tensor device handling in normalization process (#1795) * refactor(tests): remove unsupported device detection test for complementary data (#1797) * chore(tests): update ToBatchProcessor test (#1798) * refactor(tests): remove in-place mutation tests for actions and complementary data in batch processor * test(tests): add tests for action and task processing in batch processor * add names for android and ios phone (#1799) * use _tensor_stats in normalize processor (#1800) * fix(normalize_processor): correct device reference for tensor epsilon handling (#1801) * add point 5 add missing feature contracts (#1806) * Fix PR comments 1452 (#1807) * use key to determine image * Address rest of PR comments * use PolicyFeatures in transform_features --------- Co-authored-by: Pepijn <138571049+pkooij@users.noreply.github.com> --------- Co-authored-by: Michel Aractingi <michel.aractingi@huggingface.co> Co-authored-by: Adil Zouitine <adilzouitinegm@gmail.com> Co-authored-by: Pepijn <138571049+pkooij@users.noreply.github.com>
136 lines
5.1 KiB
Python
136 lines
5.1 KiB
Python
# !/usr/bin/env python
|
|
|
|
# Copyright 2025 The HuggingFace Inc. team. All rights reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
from dataclasses import dataclass
|
|
|
|
from torch import Tensor
|
|
|
|
from lerobot.configs.types import FeatureType, PolicyFeature
|
|
from lerobot.processor.pipeline import ActionProcessor, ProcessorStepRegistry
|
|
|
|
|
|
@ProcessorStepRegistry.register("map_tensor_to_delta_action_dict")
@dataclass
class MapTensorToDeltaActionDict(ActionProcessor):
    """
    Turn a flat action tensor into a delta action dictionary.

    The first three entries of the tensor are exposed as "action.delta_x",
    "action.delta_y" and "action.delta_z". When the tensor holds more than three
    entries, the fourth one is exposed as "action.gripper".
    """

    def action(self, action: Tensor) -> dict:
        """
        Build the delta action dictionary for `action`.

        Args:
            action: Action tensor. An input that is already a dictionary is handed
                back untouched.

        Returns:
            A dictionary whose values are the elements indexed out of the tensor
            (they are not converted to Python scalars).
        """
        # Already in dictionary form: nothing to map.
        if isinstance(action, dict):
            return action

        # For inputs with more than one dimension, `squeeze(0)` drops the leading
        # dimension (only when that dimension has size 1).
        flat = action.squeeze(0) if action.dim() > 1 else action

        # TODO (maractingi): add rotation
        position_keys = ("action.delta_x", "action.delta_y", "action.delta_z")
        delta_action = {key: flat[index] for index, key in enumerate(position_keys)}

        # The gripper command is optional and sits right after the position deltas.
        if flat.shape[0] > 3:
            delta_action["action.gripper"] = flat[3]
        return delta_action
|
|
|
|
|
|
@ProcessorStepRegistry.register("map_delta_action_to_robot_action")
@dataclass
class MapDeltaActionToRobotAction(ActionProcessor):
    """
    Map delta actions from teleoperators (gamepad, keyboard) to robot target actions
    for use with inverse kinematics processors.

    Expected input ACTION keys:
    {
        "action.delta_x": float,
        "action.delta_y": float,
        "action.delta_z": float,
        "action.gripper": float (optional),
    }

    Output ACTION keys:
    {
        "action.enabled": bool,
        "action.target_x": float,
        "action.target_y": float,
        "action.target_z": float,
        "action.target_wx": float,
        "action.target_wy": float,
        "action.target_wz": float,
        "action.gripper": float,
    }

    Missing delta keys default to 0.0 and a missing gripper defaults to 1.0. Input keys
    other than the ones listed above are not carried over to the output.
    """

    # Scale factors for delta movements
    position_scale: float = 1.0
    rotation_scale: float = 0.0  # No rotation deltas for gamepad/keyboard (not read by this step)
    noise_threshold: float = 1e-3  # 1 mm threshold to filter out noise

    def action(self, action: dict) -> dict:
        """
        Convert a delta action dictionary into a robot target action dictionary.

        Args:
            action: Dictionary holding the delta keys described in the class docstring.
                It is only read; the caller's dictionary is left unmodified.

        Returns:
            A new dictionary with the output keys described in the class docstring.
        """
        # NOTE (maractingi): Action can be a dict from the teleop_devices or a tensor from the policy
        # TODO (maractingi): changing this target_xyz naming convention from the teleop_devices
        # Read with `get` rather than `pop`: the result is a brand-new dictionary, so
        # stripping keys from the caller's dictionary would only be a hidden side effect.
        delta_x = action.get("action.delta_x", 0.0)
        delta_y = action.get("action.delta_y", 0.0)
        delta_z = action.get("action.delta_z", 0.0)
        gripper = action.get("action.gripper", 1.0)  # Default to "stay" (1.0)

        # Determine if the teleoperator is actively providing input: the step is
        # considered enabled when the Euclidean norm of the (unscaled) position delta
        # exceeds the noise threshold.
        position_magnitude = (delta_x**2 + delta_y**2 + delta_z**2) ** 0.5
        enabled = position_magnitude > self.noise_threshold

        # For gamepad/keyboard, we don't have rotation input, so the rotation targets are 0.
        # These could be extended in the future for more sophisticated teleoperators.
        return {
            "action.enabled": enabled,
            "action.target_x": delta_x * self.position_scale,
            "action.target_y": delta_y * self.position_scale,
            "action.target_z": delta_z * self.position_scale,
            "action.target_wx": 0.0,
            "action.target_wy": 0.0,
            "action.target_wz": 0.0,
            "action.gripper": float(gripper),
        }

    def transform_features(self, features: dict[str, PolicyFeature]) -> dict[str, PolicyFeature]:
        """
        Transform features to match output format.

        Registers one ACTION feature of shape (1,) for every output key. `features` is
        updated in place and the same object is returned; existing entries are not removed.
        """
        output_keys = (
            "action.enabled",
            "action.target_x",
            "action.target_y",
            "action.target_z",
            "action.target_wx",
            "action.target_wy",
            "action.target_wz",
            "action.gripper",
        )
        # Each key gets its own PolicyFeature instance.
        features.update({key: PolicyFeature(type=FeatureType.ACTION, shape=(1,)) for key in output_keys})
        return features
|