[pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
2026-06-02 03:41:25 +00:00 · 2025-07-02 15:31:15 +00:00
parent f6c7287ae7
commit 769f531603
9 changed files with 485 additions and 475 deletions
--- a/src/lerobot/processor/observation_processor.py
+++ b/src/lerobot/processor/observation_processor.py
@@ -15,35 +15,36 @@
 # limitations under the License.
 from __future__ import annotations

-from typing import Any
 from dataclasses import dataclass, field
+from typing import Any
+
+import einops
 import numpy as np
 import torch
-import einops
 from torch import Tensor

-from lerobot.processor.pipeline import EnvTransition, PipelineStep, TransitionIndex
+from lerobot.processor.pipeline import EnvTransition, TransitionIndex


@dataclass
 class ImageProcessor:
    """Process image observations from environment format to policy format.
-    
+
    Converts images from:
    - Channel-last (H, W, C) to channel-first (C, H, W)
    - uint8 [0, 255] to float32 [0, 1]
    - Adds batch dimension if needed
    - Handles both single images and dictionaries of images
    """
-    
+
    def __call__(self, transition: EnvTransition) -> EnvTransition:
        observation = transition[TransitionIndex.OBSERVATION]
-        
+
        if observation is None:
            return transition
-            
+
        processed_obs = {}
-        
+
        # Handle pixels key
        if "pixels" in observation:
            if isinstance(observation["pixels"], dict):
@@ -54,12 +55,12 @@ class ImageProcessor:
            for imgkey, img in imgs.items():
                processed_img = self._process_single_image(img)
                processed_obs[imgkey] = processed_img
-        
+
        # Copy other observations unchanged
        for key, value in observation.items():
            if key != "pixels":
                processed_obs[key] = value
-        
+
        # Return new transition with processed observation
        return (
            processed_obs,
@@ -70,44 +71,44 @@ class ImageProcessor:
            transition[TransitionIndex.INFO],
            transition[TransitionIndex.COMPLEMENTARY_DATA],
        )
-    
+
    def _process_single_image(self, img: np.ndarray) -> Tensor:
        """Process a single image array."""
        # Convert to tensor
        img_tensor = torch.from_numpy(img)
-        
+
        # Add batch dimension if needed
        if img_tensor.ndim == 3:
            img_tensor = img_tensor.unsqueeze(0)
-        
+
        # Validate image format
        _, h, w, c = img_tensor.shape
        if not (c < h and c < w):
            raise ValueError(f"Expected channel-last images, but got shape {img_tensor.shape}")
-        
+
        if img_tensor.dtype != torch.uint8:
            raise ValueError(f"Expected torch.uint8 images, but got {img_tensor.dtype}")
-        
+
        # Convert to channel-first format
        img_tensor = einops.rearrange(img_tensor, "b h w c -> b c h w").contiguous()
-        
+
        # Convert to float32 and normalize to [0, 1]
        img_tensor = img_tensor.type(torch.float32) / 255.0
-        
+
        return img_tensor
-    
+
    def get_config(self) -> dict[str, Any]:
        """Return configuration for serialization."""
        return {}
-    
+
    def state_dict(self) -> dict[str, torch.Tensor]:
        """Return state dictionary (empty for this processor)."""
        return {}
-    
+
    def load_state_dict(self, state: dict[str, torch.Tensor]) -> None:
        """Load state dictionary (no-op for this processor)."""
        pass
-    
+
    def reset(self) -> None:
        """Reset processor state (no-op for this processor)."""
        pass
@@ -116,22 +117,22 @@ class ImageProcessor:
@dataclass
 class StateProcessor:
    """Process state observations from environment format to policy format.
-    
+
    Handles:
    - environment_state -> observation.environment_state
    - agent_pos -> observation.state
    - Converts numpy arrays to tensors
    - Adds batch dimension if needed
    """
-    
+
    def __call__(self, transition: EnvTransition) -> EnvTransition:
        observation = transition[TransitionIndex.OBSERVATION]
-        
+
        if observation is None:
            return transition
-            
+
        processed_obs = dict(observation)  # Copy existing observations
-        
+
        # Process environment_state
        if "environment_state" in observation:
            env_state = torch.from_numpy(observation["environment_state"]).float()
@@ -140,16 +141,16 @@ class StateProcessor:
            processed_obs["observation.environment_state"] = env_state
            # Remove original key
            del processed_obs["environment_state"]
-        
+
        # Process agent_pos
        if "agent_pos" in observation:
            agent_pos = torch.from_numpy(observation["agent_pos"]).float()
            if agent_pos.dim() == 1:
                agent_pos = agent_pos.unsqueeze(0)
            processed_obs["observation.state"] = agent_pos
-            # Remove original key  
+            # Remove original key
            del processed_obs["agent_pos"]
-        
+
        # Return new transition with processed observation
        return (
            processed_obs,
@@ -160,19 +161,19 @@ class StateProcessor:
            transition[TransitionIndex.INFO],
            transition[TransitionIndex.COMPLEMENTARY_DATA],
        )
-    
+
    def get_config(self) -> dict[str, Any]:
        """Return configuration for serialization."""
        return {}
-    
+
    def state_dict(self) -> dict[str, torch.Tensor]:
        """Return state dictionary (empty for this processor)."""
        return {}
-    
+
    def load_state_dict(self, state: dict[str, torch.Tensor]) -> None:
        """Load state dictionary (no-op for this processor)."""
        pass
-    
+
    def reset(self) -> None:
        """Reset processor state (no-op for this processor)."""
        pass
@@ -181,43 +182,47 @@ class StateProcessor:
@dataclass
 class ObservationProcessor:
    """Complete observation processor that combines image and state processing.
-    
+
    This processor replicates the functionality of the original preprocess_observation
    function but in a modular, composable way that fits into the pipeline architecture.
    """
-    
+
    image_processor: ImageProcessor = field(default_factory=ImageProcessor)
    state_processor: StateProcessor = field(default_factory=StateProcessor)
-    
+
    def __call__(self, transition: EnvTransition) -> EnvTransition:
        # First process images
        transition = self.image_processor(transition)
        # Then process state
        transition = self.state_processor(transition)
        return transition
-    
+
    def get_config(self) -> dict[str, Any]:
        """Return configuration for serialization."""
        return {
            "image_processor": self.image_processor.get_config(),
            "state_processor": self.state_processor.get_config(),
        }
-    
+
    def state_dict(self) -> dict[str, torch.Tensor]:
        """Return state dictionary."""
        state = {}
        state.update({f"image_processor.{k}": v for k, v in self.image_processor.state_dict().items()})
        state.update({f"state_processor.{k}": v for k, v in self.state_processor.state_dict().items()})
        return state
-    
+
    def load_state_dict(self, state: dict[str, torch.Tensor]) -> None:
        """Load state dictionary."""
-        image_state = {k.replace("image_processor.", ""): v for k, v in state.items() if k.startswith("image_processor.")}
-        state_state = {k.replace("state_processor.", ""): v for k, v in state.items() if k.startswith("state_processor.")}
-        
+        image_state = {
+            k.replace("image_processor.", ""): v for k, v in state.items() if k.startswith("image_processor.")
+        }
+        state_state = {
+            k.replace("state_processor.", ""): v for k, v in state.items() if k.startswith("state_processor.")
+        }
+
        self.image_processor.load_state_dict(image_state)
        self.state_processor.load_state_dict(state_state)
-    
+
    def reset(self) -> None:
        """Reset processor state."""
        self.image_processor.reset()