src/lerobot/processor/render_messages_processor.py

#!/usr/bin/env python

# Copyright 2026 The HuggingFace Inc. team. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from __future__ import annotations

from dataclasses import dataclass
from typing import Any

from lerobot.configs import PipelineFeatureType, PolicyFeature
from lerobot.configs.recipe import TrainingRecipe
from lerobot.datasets.language import LANGUAGE_EVENTS, LANGUAGE_PERSISTENT
from lerobot.datasets.language_render import render_sample
from lerobot.types import EnvTransition, TransitionKey

from .pipeline import ProcessorStep, ProcessorStepRegistry


@dataclass
@ProcessorStepRegistry.register(name="render_messages_processor")
class RenderMessagesStep(ProcessorStep):
    """Processor step that renders raw language columns into chat messages.

    The step pulls the ``LANGUAGE_PERSISTENT`` and ``LANGUAGE_EVENTS`` entries
    out of the transition's complementary data and passes them to
    ``render_sample`` along with ``recipe``, the sample timestamp, the sample
    index and the task. The raw entries are then dropped from the complementary
    data and the rendered output (``messages`` / ``message_streams`` /
    ``target_message_indices``) is merged in instead.
    """

    # Recipe handed to ``render_sample`` for every transition.
    recipe: TrainingRecipe
    # Forwarded untouched to ``render_sample``; may be ``None``.
    dataset_ctx: Any | None = None

    def __call__(self, transition: EnvTransition) -> EnvTransition | None:
        """Render the language data carried by a single transition.

        Args:
            transition: Transition whose complementary data may hold the raw
                language columns.

        Returns:
            The incoming transition object, unmodified, when it carries neither
            persistent nor event language rows. ``None`` when ``render_sample``
            returns ``None``, which signals that the sample should be dropped.
            Otherwise a copy of the transition (``transition.copy()``) whose
            complementary data has the raw columns replaced by the rendered
            output.

        Raises:
            KeyError: If language rows are present but the complementary data
                has no ``"timestamp"`` entry (or it is ``None``).
        """
        extras = transition.get(TransitionKey.COMPLEMENTARY_DATA) or {}
        persistent_rows = extras.get(LANGUAGE_PERSISTENT) or []
        event_rows = extras.get(LANGUAGE_EVENTS) or []

        # Nothing to render: hand the very same transition back.
        if not (persistent_rows or event_rows):
            return transition

        raw_timestamp = extras.get("timestamp")
        if raw_timestamp is None:
            raise KeyError("RenderMessagesStep requires sample timestamp in complementary data.")

        # A missing "index" entry falls back to sample index 0.
        raw_index = extras.get("index", 0)
        output = render_sample(
            recipe=self.recipe,
            persistent=persistent_rows,
            events=event_rows,
            t=_scalar(raw_timestamp),
            sample_idx=int(_scalar(raw_index)),
            task=extras.get("task"),
            dataset_ctx=self.dataset_ctx,
        )
        if output is None:
            return None

        # Work on a copy so the caller's complementary data is left intact,
        # strip the raw language columns and merge the rendered keys in.
        merged_extras = dict(extras)
        for raw_key in (LANGUAGE_PERSISTENT, LANGUAGE_EVENTS):
            merged_extras.pop(raw_key, None)
        merged_extras.update(output)

        result = transition.copy()
        result[TransitionKey.COMPLEMENTARY_DATA] = merged_extras
        return result

    def transform_features(
        self, features: dict[PipelineFeatureType, dict[str, PolicyFeature]]
    ) -> dict[PipelineFeatureType, dict[str, PolicyFeature]]:
        """Return ``features`` as-is; this step only rewrites complementary data."""
        return features


def _scalar(value: Any) -> float | int:
    """Unwrap a tensor/array/single-element list into a Python scalar."""
    if hasattr(value, "item"):
        return value.item()
    if isinstance(value, list) and len(value) == 1:
        return _scalar(value[0])
    return value
Add extensive language support 2026-04-27 10:56:32 +02:00			`#!/usr/bin/env python`

			`# Copyright 2026 The HuggingFace Inc. team. All rights reserved.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`

			`from __future__ import annotations`

			`from dataclasses import dataclass`
			`from typing import Any`

			`from lerobot.configs import PipelineFeatureType, PolicyFeature`
			`from lerobot.configs.recipe import TrainingRecipe`
			`from lerobot.datasets.language import LANGUAGE_EVENTS, LANGUAGE_PERSISTENT`
			`from lerobot.datasets.language_render import render_sample`
			`from lerobot.types import EnvTransition, TransitionKey`

			`from .pipeline import ProcessorStep, ProcessorStepRegistry`


			`@dataclass`
			`@ProcessorStepRegistry.register(name="render_messages_processor")`
			`class RenderMessagesStep(ProcessorStep):`
Address review: split persistent/event schemas, drop event timestamps - recipe.py: derive _VALID_ROLES/_VALID_STREAMS from MessageRole/MessageStream Literals - dataset_metadata.py: keep CODEBASE_VERSION at v3.0 - language.py: remove RESERVED_STYLES; split arrow/feature schemas into persistent (with timestamp) and event (without timestamp); add docstrings - language_render.py: events use frame-row timestamp implicitly; no per-event timestamp filtering or sorting - converters.py: drop unused subtask_key passthrough - add docstrings to new public APIs (recipe, render_messages_processor, collate) - update tests for split schemas; revert uv.lock Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com> 2026-04-27 13:38:23 +02:00			`"""Processor step that turns raw language columns into rendered chat messages.`

			Reads ``language_persistent`` and ``language_events`` from the transition's
			complementary data, renders them through ``recipe`` at the sample timestamp,
			and replaces the raw columns with the resulting ``messages`` /
			``message_streams`` / ``target_message_indices`` keys.
			`"""`

Add extensive language support 2026-04-27 10:56:32 +02:00			`recipe: TrainingRecipe`
			`dataset_ctx: Any \| None = None`

			`def __call__(self, transition: EnvTransition) -> EnvTransition \| None:`
Address review: split persistent/event schemas, drop event timestamps - recipe.py: derive _VALID_ROLES/_VALID_STREAMS from MessageRole/MessageStream Literals - dataset_metadata.py: keep CODEBASE_VERSION at v3.0 - language.py: remove RESERVED_STYLES; split arrow/feature schemas into persistent (with timestamp) and event (without timestamp); add docstrings - language_render.py: events use frame-row timestamp implicitly; no per-event timestamp filtering or sorting - converters.py: drop unused subtask_key passthrough - add docstrings to new public APIs (recipe, render_messages_processor, collate) - update tests for split schemas; revert uv.lock Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com> 2026-04-27 13:38:23 +02:00			"""Render messages for a single transition; return ``None`` to drop it."""
Add extensive language support 2026-04-27 10:56:32 +02:00			`complementary_data = transition.get(TransitionKey.COMPLEMENTARY_DATA) or {}`
			`persistent = complementary_data.get(LANGUAGE_PERSISTENT) or []`
			`events = complementary_data.get(LANGUAGE_EVENTS) or []`

			`if not persistent and not events:`
			`return transition`

			`timestamp = complementary_data.get("timestamp")`
			`if timestamp is None:`
			`raise KeyError("RenderMessagesStep requires sample timestamp in complementary data.")`

			`sample_idx = complementary_data.get("index", 0)`
			`rendered = render_sample(`
			`recipe=self.recipe,`
			`persistent=persistent,`
			`events=events,`
			`t=_scalar(timestamp),`
			`sample_idx=int(_scalar(sample_idx)),`
			`task=complementary_data.get("task"),`
			`dataset_ctx=self.dataset_ctx,`
			`)`
			`if rendered is None:`
			`return None`

			`new_transition = transition.copy()`
			`new_complementary_data = dict(complementary_data)`
			`new_complementary_data.pop(LANGUAGE_PERSISTENT, None)`
			`new_complementary_data.pop(LANGUAGE_EVENTS, None)`
			`new_complementary_data.update(rendered)`
			`new_transition[TransitionKey.COMPLEMENTARY_DATA] = new_complementary_data`
			`return new_transition`

			`def transform_features(`
			`self, features: dict[PipelineFeatureType, dict[str, PolicyFeature]]`
			`) -> dict[PipelineFeatureType, dict[str, PolicyFeature]]:`
Add docstrings to all new helpers; revert uv.lock Covers private helpers in recipe.py, language.py, language_render.py, and render_messages_processor.py. Also reverts uv.lock to main (it was re-generated by `uv run` during local checks). Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com> 2026-04-27 14:15:03 +02:00			`"""Pass features through unchanged; rendering only touches complementary data."""`
Add extensive language support 2026-04-27 10:56:32 +02:00			`return features`


			`def _scalar(value: Any) -> float \| int:`
Add docstrings to all new helpers; revert uv.lock Covers private helpers in recipe.py, language.py, language_render.py, and render_messages_processor.py. Also reverts uv.lock to main (it was re-generated by `uv run` during local checks). Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com> 2026-04-27 14:15:03 +02:00			`"""Unwrap a tensor/array/single-element list into a Python scalar."""`
Add extensive language support 2026-04-27 10:56:32 +02:00			`if hasattr(value, "item"):`
			`return value.item()`
			`if isinstance(value, list) and len(value) == 1:`
			`return _scalar(value[0])`
			`return value`