lerobot/common/transforms.py

from typing import Sequence

import torch
from tensordict import TensorDictBase
from tensordict.nn import dispatch
from tensordict.utils import NestedKey
from torchrl.envs.transforms import ObservationTransform, Transform


class Prod(ObservationTransform):
    invertible = True

    def __init__(self, in_keys: Sequence[NestedKey], prod: float):
        super().__init__()
        self.in_keys = in_keys
        self.prod = prod
        self.original_dtypes = {}

    def _reset(self, tensordict: TensorDictBase, tensordict_reset: TensorDictBase) -> TensorDictBase:
        # _reset is called once when the environment reset to normalize the first observation
        tensordict_reset = self._call(tensordict_reset)
        return tensordict_reset

    @dispatch(source="in_keys", dest="out_keys")
    def forward(self, tensordict: TensorDictBase) -> TensorDictBase:
        return self._call(tensordict)

    def _call(self, td):
        for key in self.in_keys:
            if td.get(key, None) is None:
                continue
            self.original_dtypes[key] = td[key].dtype
            td[key] = td[key].type(torch.float32) * self.prod
        return td

    def _inv_call(self, td: TensorDictBase) -> TensorDictBase:
        for key in self.in_keys:
            if td.get(key, None) is None:
                continue
            td[key] = (td[key] / self.prod).type(self.original_dtypes[key])
        return td

    def transform_observation_spec(self, obs_spec):
        for key in self.in_keys:
            if obs_spec.get(key, None) is None:
                continue
            obs_spec[key].space.high = obs_spec[key].space.high.type(torch.float32) * self.prod
            obs_spec[key].space.low = obs_spec[key].space.low.type(torch.float32) * self.prod
            obs_spec[key].dtype = torch.float32
        return obs_spec


class NormalizeTransform(Transform):
    invertible = True

    def __init__(
        self,
        stats: TensorDictBase,
        in_keys: Sequence[NestedKey] = None,
        out_keys: Sequence[NestedKey] | None = None,
        in_keys_inv: Sequence[NestedKey] | None = None,
        out_keys_inv: Sequence[NestedKey] | None = None,
        mode="mean_std",
    ):
        if out_keys is None:
            out_keys = in_keys
        if in_keys_inv is None:
            in_keys_inv = out_keys
        if out_keys_inv is None:
            out_keys_inv = in_keys
        super().__init__(
            in_keys=in_keys, out_keys=out_keys, in_keys_inv=in_keys_inv, out_keys_inv=out_keys_inv
        )
        self.stats = stats
        assert mode in ["mean_std", "min_max"]
        self.mode = mode

    def _reset(self, tensordict: TensorDictBase, tensordict_reset: TensorDictBase) -> TensorDictBase:
        # _reset is called once when the environment reset to normalize the first observation
        tensordict_reset = self._call(tensordict_reset)
        return tensordict_reset

    @dispatch(source="in_keys", dest="out_keys")
    def forward(self, tensordict: TensorDictBase) -> TensorDictBase:
        return self._call(tensordict)

    def _call(self, td: TensorDictBase) -> TensorDictBase:
        for inkey, outkey in zip(self.in_keys, self.out_keys, strict=False):
            # TODO(rcadene): don't know how to do `inkey not in td`
            if td.get(inkey, None) is None:
                continue
            if self.mode == "mean_std":
                mean = self.stats[inkey]["mean"]
                std = self.stats[inkey]["std"]
                td[outkey] = (td[inkey] - mean) / (std + 1e-8)
            else:
                min = self.stats[inkey]["min"]
                max = self.stats[inkey]["max"]
                # normalize to [0,1]
                td[outkey] = (td[inkey] - min) / (max - min)
                # normalize to [-1, 1]
                td[outkey] = td[outkey] * 2 - 1
        return td

    def _inv_call(self, td: TensorDictBase) -> TensorDictBase:
        for inkey, outkey in zip(self.in_keys_inv, self.out_keys_inv, strict=False):
            # TODO(rcadene): don't know how to do `inkey not in td`
            if td.get(inkey, None) is None:
                continue
            if self.mode == "mean_std":
                mean = self.stats[inkey]["mean"]
                std = self.stats[inkey]["std"]
                td[outkey] = td[inkey] * std + mean
            else:
                min = self.stats[inkey]["min"]
                max = self.stats[inkey]["max"]
                td[outkey] = (td[inkey] + 1) / 2
                td[outkey] = td[outkey] * (max - min) + min
        return td
Add Prod transform, Add test_factory 2024-02-20 14:22:16 +00:00			`from typing import Sequence`

Add Aloha env and ACT policy WIP Aloha env tests pass Rendering works (fps look fast tho? TODO action bounding is too wide [-1,1]) Update README Copy past from act repo Remove download.py add a WIP for Simxarm Remove download.py add a WIP for Simxarm Add act yaml (TODO: try train.py) Training can runs (TODO: eval) Add tasks without end_effector that are compatible with dataset, Eval can run (TODO: training and pretrained model) Add AbstractEnv, Refactor AlohaEnv, Add rendering_hook in env, Minor modifications, (TODO: Refactor Pusht and Simxarm) poetry lock fix bug in compute_stats for action normalization fix more bugs in normalization fix training fix import PushtEnv inheriates AbstractEnv, Improve factory Normalization Add _make_env to EnvAbstract Add call_rendering_hooks to pusht env SimxarmEnv inherites from AbstractEnv (NOT TESTED) Add aloha tests artifacts + update pusht stats fix image normalization: before env was in [0,1] but dataset in [0,255], and now both in [0,255] Small fix on simxarm Add next to obs Add top camera to Aloha env (TODO: make it compatible with set of cameras) Add top camera to Aloha env (TODO: make it compatible with set of cameras) 2024-03-08 09:47:39 +00:00			`import torch`
pre-commit run -a 2024-03-02 15:58:21 +00:00			`from tensordict import TensorDictBase`
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00			`from tensordict.nn import dispatch`
pre-commit run -a 2024-03-02 15:58:21 +00:00			`from tensordict.utils import NestedKey`
			`from torchrl.envs.transforms import ObservationTransform, Transform`
Add Prod transform, Add test_factory 2024-02-20 14:22:16 +00:00

			`class Prod(ObservationTransform):`
Add Aloha env and ACT policy WIP Aloha env tests pass Rendering works (fps look fast tho? TODO action bounding is too wide [-1,1]) Update README Copy past from act repo Remove download.py add a WIP for Simxarm Remove download.py add a WIP for Simxarm Add act yaml (TODO: try train.py) Training can runs (TODO: eval) Add tasks without end_effector that are compatible with dataset, Eval can run (TODO: training and pretrained model) Add AbstractEnv, Refactor AlohaEnv, Add rendering_hook in env, Minor modifications, (TODO: Refactor Pusht and Simxarm) poetry lock fix bug in compute_stats for action normalization fix more bugs in normalization fix training fix import PushtEnv inheriates AbstractEnv, Improve factory Normalization Add _make_env to EnvAbstract Add call_rendering_hooks to pusht env SimxarmEnv inherites from AbstractEnv (NOT TESTED) Add aloha tests artifacts + update pusht stats fix image normalization: before env was in [0,1] but dataset in [0,255], and now both in [0,255] Small fix on simxarm Add next to obs Add top camera to Aloha env (TODO: make it compatible with set of cameras) Add top camera to Aloha env (TODO: make it compatible with set of cameras) 2024-03-08 09:47:39 +00:00			`invertible = True`

Add Prod transform, Add test_factory 2024-02-20 14:22:16 +00:00			`def __init__(self, in_keys: Sequence[NestedKey], prod: float):`
			`super().__init__()`
			`self.in_keys = in_keys`
			`self.prod = prod`
Add Aloha env and ACT policy WIP Aloha env tests pass Rendering works (fps look fast tho? TODO action bounding is too wide [-1,1]) Update README Copy past from act repo Remove download.py add a WIP for Simxarm Remove download.py add a WIP for Simxarm Add act yaml (TODO: try train.py) Training can runs (TODO: eval) Add tasks without end_effector that are compatible with dataset, Eval can run (TODO: training and pretrained model) Add AbstractEnv, Refactor AlohaEnv, Add rendering_hook in env, Minor modifications, (TODO: Refactor Pusht and Simxarm) poetry lock fix bug in compute_stats for action normalization fix more bugs in normalization fix training fix import PushtEnv inheriates AbstractEnv, Improve factory Normalization Add _make_env to EnvAbstract Add call_rendering_hooks to pusht env SimxarmEnv inherites from AbstractEnv (NOT TESTED) Add aloha tests artifacts + update pusht stats fix image normalization: before env was in [0,1] but dataset in [0,255], and now both in [0,255] Small fix on simxarm Add next to obs Add top camera to Aloha env (TODO: make it compatible with set of cameras) Add top camera to Aloha env (TODO: make it compatible with set of cameras) 2024-03-08 09:47:39 +00:00			`self.original_dtypes = {}`

			`def _reset(self, tensordict: TensorDictBase, tensordict_reset: TensorDictBase) -> TensorDictBase:`
			`# _reset is called once when the environment reset to normalize the first observation`
			`tensordict_reset = self._call(tensordict_reset)`
			`return tensordict_reset`

			`@dispatch(source="in_keys", dest="out_keys")`
			`def forward(self, tensordict: TensorDictBase) -> TensorDictBase:`
			`return self._call(tensordict)`
Add Prod transform, Add test_factory 2024-02-20 14:22:16 +00:00
			`def _call(self, td):`
			`for key in self.in_keys:`
Add Aloha env and ACT policy WIP Aloha env tests pass Rendering works (fps look fast tho? TODO action bounding is too wide [-1,1]) Update README Copy past from act repo Remove download.py add a WIP for Simxarm Remove download.py add a WIP for Simxarm Add act yaml (TODO: try train.py) Training can runs (TODO: eval) Add tasks without end_effector that are compatible with dataset, Eval can run (TODO: training and pretrained model) Add AbstractEnv, Refactor AlohaEnv, Add rendering_hook in env, Minor modifications, (TODO: Refactor Pusht and Simxarm) poetry lock fix bug in compute_stats for action normalization fix more bugs in normalization fix training fix import PushtEnv inheriates AbstractEnv, Improve factory Normalization Add _make_env to EnvAbstract Add call_rendering_hooks to pusht env SimxarmEnv inherites from AbstractEnv (NOT TESTED) Add aloha tests artifacts + update pusht stats fix image normalization: before env was in [0,1] but dataset in [0,255], and now both in [0,255] Small fix on simxarm Add next to obs Add top camera to Aloha env (TODO: make it compatible with set of cameras) Add top camera to Aloha env (TODO: make it compatible with set of cameras) 2024-03-08 09:47:39 +00:00			`if td.get(key, None) is None:`
			`continue`
			`self.original_dtypes[key] = td[key].dtype`
			`td[key] = td[key].type(torch.float32) * self.prod`
			`return td`

			`def _inv_call(self, td: TensorDictBase) -> TensorDictBase:`
			`for key in self.in_keys:`
			`if td.get(key, None) is None:`
			`continue`
			`td[key] = (td[key] / self.prod).type(self.original_dtypes[key])`
Add Prod transform, Add test_factory 2024-02-20 14:22:16 +00:00			`return td`

			`def transform_observation_spec(self, obs_spec):`
			`for key in self.in_keys:`
Add Aloha env and ACT policy WIP Aloha env tests pass Rendering works (fps look fast tho? TODO action bounding is too wide [-1,1]) Update README Copy past from act repo Remove download.py add a WIP for Simxarm Remove download.py add a WIP for Simxarm Add act yaml (TODO: try train.py) Training can runs (TODO: eval) Add tasks without end_effector that are compatible with dataset, Eval can run (TODO: training and pretrained model) Add AbstractEnv, Refactor AlohaEnv, Add rendering_hook in env, Minor modifications, (TODO: Refactor Pusht and Simxarm) poetry lock fix bug in compute_stats for action normalization fix more bugs in normalization fix training fix import PushtEnv inheriates AbstractEnv, Improve factory Normalization Add _make_env to EnvAbstract Add call_rendering_hooks to pusht env SimxarmEnv inherites from AbstractEnv (NOT TESTED) Add aloha tests artifacts + update pusht stats fix image normalization: before env was in [0,1] but dataset in [0,255], and now both in [0,255] Small fix on simxarm Add next to obs Add top camera to Aloha env (TODO: make it compatible with set of cameras) Add top camera to Aloha env (TODO: make it compatible with set of cameras) 2024-03-08 09:47:39 +00:00			`if obs_spec.get(key, None) is None:`
			`continue`
			`obs_spec[key].space.high = obs_spec[key].space.high.type(torch.float32) * self.prod`
			`obs_spec[key].space.low = obs_spec[key].space.low.type(torch.float32) * self.prod`
			`obs_spec[key].dtype = torch.float32`
Add Prod transform, Add test_factory 2024-02-20 14:22:16 +00:00			`return obs_spec`
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00

			`class NormalizeTransform(Transform):`
			`invertible = True`

pre-commit run -a 2024-03-02 15:58:21 +00:00			`def __init__(`
			`self,`
Add mode to NormalizeTransform with mean_std or min_max (Not fully tested) 2024-03-03 13:19:02 +00:00			`stats: TensorDictBase,`
pre-commit run -a 2024-03-02 15:58:21 +00:00			`in_keys: Sequence[NestedKey] = None,`
			`out_keys: Sequence[NestedKey] \| None = None,`
			`in_keys_inv: Sequence[NestedKey] \| None = None,`
			`out_keys_inv: Sequence[NestedKey] \| None = None,`
Add mode to NormalizeTransform with mean_std or min_max (Not fully tested) 2024-03-03 13:19:02 +00:00			`mode="mean_std",`
pre-commit run -a 2024-03-02 15:58:21 +00:00			`):`
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00			`if out_keys is None:`
			`out_keys = in_keys`
			`if in_keys_inv is None:`
			`in_keys_inv = out_keys`
			`if out_keys_inv is None:`
			`out_keys_inv = in_keys`
pre-commit run -a 2024-03-02 15:58:21 +00:00			`super().__init__(`
			`in_keys=in_keys, out_keys=out_keys, in_keys_inv=in_keys_inv, out_keys_inv=out_keys_inv`
			`)`
Add mode to NormalizeTransform with mean_std or min_max (Not fully tested) 2024-03-03 13:19:02 +00:00			`self.stats = stats`
			`assert mode in ["mean_std", "min_max"]`
			`self.mode = mode`

			`def _reset(self, tensordict: TensorDictBase, tensordict_reset: TensorDictBase) -> TensorDictBase:`
			`# _reset is called once when the environment reset to normalize the first observation`
			`tensordict_reset = self._call(tensordict_reset)`
			`return tensordict_reset`
pre-commit run -a 2024-03-02 15:58:21 +00:00
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00			`@dispatch(source="in_keys", dest="out_keys")`
			`def forward(self, tensordict: TensorDictBase) -> TensorDictBase:`
			`return self._call(tensordict)`

			`def _call(self, td: TensorDictBase) -> TensorDictBase:`
pre-commit run -a 2024-03-02 15:58:21 +00:00			`for inkey, outkey in zip(self.in_keys, self.out_keys, strict=False):`
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00			# TODO(rcadene): don't know how to do `inkey not in td`
			`if td.get(inkey, None) is None:`
			`continue`
Add mode to NormalizeTransform with mean_std or min_max (Not fully tested) 2024-03-03 13:19:02 +00:00			`if self.mode == "mean_std":`
			`mean = self.stats[inkey]["mean"]`
			`std = self.stats[inkey]["std"]`
			`td[outkey] = (td[inkey] - mean) / (std + 1e-8)`
			`else:`
			`min = self.stats[inkey]["min"]`
			`max = self.stats[inkey]["max"]`
			`# normalize to [0,1]`
			`td[outkey] = (td[inkey] - min) / (max - min)`
			`# normalize to [-1, 1]`
			`td[outkey] = td[outkey] * 2 - 1`
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00			`return td`

			`def _inv_call(self, td: TensorDictBase) -> TensorDictBase:`
pre-commit run -a 2024-03-02 15:58:21 +00:00			`for inkey, outkey in zip(self.in_keys_inv, self.out_keys_inv, strict=False):`
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00			# TODO(rcadene): don't know how to do `inkey not in td`
			`if td.get(inkey, None) is None:`
			`continue`
Add mode to NormalizeTransform with mean_std or min_max (Not fully tested) 2024-03-03 13:19:02 +00:00			`if self.mode == "mean_std":`
			`mean = self.stats[inkey]["mean"]`
			`std = self.stats[inkey]["std"]`
			`td[outkey] = td[inkey] * std + mean`
			`else:`
			`min = self.stats[inkey]["min"]`
			`max = self.stats[inkey]["max"]`
			`td[outkey] = (td[inkey] + 1) / 2`
			`td[outkey] = td[outkey] * (max - min) + min`
Add Normalize, non_blocking=True in tdmpc, tdmpc run (TODO: diffusion) 2024-03-02 15:53:29 +00:00			`return td`