lerobot/common/utils/utils.py

#!/usr/bin/env python

# Copyright 2024 The HuggingFace Inc. team. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import logging
import os
import os.path as osp
import platform
import random
from contextlib import contextmanager
from datetime import datetime, timezone
from pathlib import Path
from typing import Any, Generator

import hydra
import numpy as np
import torch
from omegaconf import DictConfig


def none_or_int(value):
    """Convert `value` to an int, mapping the literal string "None" to `None`.

    Returns:
        `None` when `value == "None"`, otherwise `int(value)`.
    """
    return None if value == "None" else int(value)


def inside_slurm():
    """Tell whether the `SLURM_JOB_ID` environment variable is set for this process."""
    # TODO(rcadene): return False for interactive mode `--pty bash`
    return os.environ.get("SLURM_JOB_ID") is not None


def get_safe_torch_device(cfg_device: str, log: bool = False) -> torch.device:
    """Given a string, return a torch.device with checks on whether the device is available."""
    match cfg_device:
        case "cuda":
            assert torch.cuda.is_available()
            device = torch.device("cuda")
        case "mps":
            assert torch.backends.mps.is_available()
            device = torch.device("mps")
        case "cpu":
            device = torch.device("cpu")
            if log:
                logging.warning("Using CPU, this will be slow.")
        case _:
            device = torch.device(cfg_device)
            if log:
                logging.warning(f"Using custom {cfg_device} device.")

    return device


def get_global_random_state() -> dict[str, Any]:
    """Snapshot the global RNG state of `random`, `numpy`, and `torch`.

    Returns:
        A dictionary with the keys "random_state", "numpy_random_state" and "torch_random_state".
        The key "torch_cuda_random_state" is added only when `torch.cuda.is_available()` is true.
    """
    snapshot = dict(
        random_state=random.getstate(),
        numpy_random_state=np.random.get_state(),
        torch_random_state=torch.random.get_rng_state(),
    )
    if not torch.cuda.is_available():
        return snapshot
    snapshot["torch_cuda_random_state"] = torch.cuda.random.get_rng_state()
    return snapshot


def set_global_random_state(random_state_dict: dict[str, Any]):
    """Set the random state for `random`, `numpy`, and `torch`.

    Args:
        random_state_dict: A dictionary of the form returned by `get_global_random_state`. The
            "torch_cuda_random_state" entry is optional: it is absent when the state was captured
            while CUDA was unavailable, in which case the CUDA generator is left untouched.

    Raises:
        KeyError: If one of "random_state", "numpy_random_state" or "torch_random_state" is missing.
    """
    random.setstate(random_state_dict["random_state"])
    np.random.set_state(random_state_dict["numpy_random_state"])
    torch.random.set_rng_state(random_state_dict["torch_random_state"])
    # Only restore the CUDA generator when there is both a CUDA device and a saved CUDA state, so a
    # state captured on a CPU-only machine can still be restored on a CUDA machine.
    if torch.cuda.is_available() and "torch_cuda_random_state" in random_state_dict:
        torch.cuda.random.set_rng_state(random_state_dict["torch_cuda_random_state"])


def set_global_seed(seed):
    """Seed the global RNGs of `random`, `numpy` and `torch` (plus all CUDA devices if available)."""
    for seed_fn in (random.seed, np.random.seed, torch.manual_seed):
        seed_fn(seed)
    if torch.cuda.is_available():
        torch.cuda.manual_seed_all(seed)


@contextmanager
def seeded_context(seed: int) -> Generator[None, None, None]:
    """Set the seed when entering a context, and restore the prior random state at exit.

    The prior state is restored even if the body of the `with` block raises.

    Example usage:

    ```
    a = random.random()  # produces some random number
    with seeded_context(1337):
        b = random.random()  # produces some other random number
    c = random.random()  # produces yet another random number, but the same it would have if we never made `b`
    ```

    Args:
        seed: Seed passed to `set_global_seed` on entry.
    """
    random_state_dict = get_global_random_state()
    set_global_seed(seed)
    try:
        yield None
    finally:
        # Without `finally`, an exception raised inside the `with` body would skip the restore and
        # leave the process-wide RNGs in the seeded state.
        set_global_random_state(random_state_dict)


def init_logging():
    """Route root-logger output through a single console handler with a compact line format.

    Every handler currently attached to the root logger is removed and replaced by one
    `StreamHandler` whose lines look like
    `LEVEL YYYY-mm-dd HH:MM:SS <last 15 chars of "pathname:lineno"> message`.
    """

    def custom_format(record):
        # The timestamp is taken when the record is formatted, not from `record.created`.
        dt = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
        fnameline = f"{record.pathname}:{record.lineno}"
        # `getMessage()` merges lazy %-style arguments into the message
        # (e.g. `logging.info("x=%s", x)`); `record.msg` alone is the raw, un-interpolated template.
        message = f"{record.levelname} {dt} {fnameline[-15:]:>15} {record.getMessage()}"
        return message

    # Sets the root level to INFO when the root logger has no handlers yet; the default handler
    # that basicConfig installs in that case is discarded just below.
    logging.basicConfig(level=logging.INFO)

    # Iterate over a copy because removeHandler mutates the list.
    for handler in logging.root.handlers[:]:
        logging.root.removeHandler(handler)

    formatter = logging.Formatter()
    formatter.format = custom_format
    console_handler = logging.StreamHandler()
    console_handler.setFormatter(formatter)
    logging.getLogger().addHandler(console_handler)


def format_big_number(num, precision=0):
    """Format a number with a thousands suffix ("", "K", "M", "B", "T", "Q").

    Args:
        num: The number to format.
        precision: Number of digits after the decimal point.

    Returns:
        A string such as "999", "1K" or "1.5M". Values too large for the biggest suffix are still
        expressed in that unit (e.g. "2000Q").
    """
    suffixes = ["", "K", "M", "B", "T", "Q"]
    divisor = 1000.0

    for suffix in suffixes[:-1]:
        if abs(num) < divisor:
            return f"{num:.{precision}f}{suffix}"
        num /= divisor

    # `num` is now expressed in the largest unit. Format it unconditionally so the function always
    # returns a string instead of falling through with an over-divided raw float.
    return f"{num:.{precision}f}{suffixes[-1]}"


def _relative_path_between(path1: Path, path2: Path) -> Path:
    """Express `path1` relative to `path2`.

    Both paths are made absolute first. When `path1` is not located under `path2`, the result
    climbs from `path2` with ".." segments up to their common path and then descends to `path1`.
    """
    target = path1.absolute()
    base = path2.absolute()
    try:
        return target.relative_to(base)
    except ValueError:  # most likely because path1 is not a subpath of path2
        shared_depth = len(Path(osp.commonpath([target, base])).parts)
        climb = [".."] * (len(base.parts) - shared_depth)
        descend = list(target.parts[shared_depth:])
        return Path("/".join(climb + descend))


def init_hydra_config(config_path: str, overrides: list[str] | None = None) -> DictConfig:
    """Build a Hydra config from nothing more than the path to a config file.

    The directory containing the config file is used as the Hydra config dir, and the file's stem
    is used as the config name.

    Args:
        config_path: Path to the config file.
        overrides: Optional list of overrides forwarded to `hydra.compose`.

    Returns:
        The composed config.
    """
    # TODO(alexander-soare): Resolve configs without Hydra initialization.
    # Reset the global Hydra instance before initializing again.
    hydra.core.global_hydra.GlobalHydra.instance().clear()

    config_file = Path(config_path)
    this_dir = Path(__file__).absolute().parent
    # Hydra needs a path relative to this file.
    relative_config_dir = _relative_path_between(config_file.absolute().parent, this_dir)
    hydra.initialize(str(relative_config_dir), version_base="1.2")

    return hydra.compose(config_file.stem, overrides)


def print_cuda_memory_usage():
    """Use this function to locate and debug memory leak.

    Runs the garbage collector, empties the CUDA cache, then prints the current and maximum
    allocated/reserved memory of device 0 in MB.
    """
    import gc

    gc.collect()
    # Also clear the cache if you want to fully release the memory
    torch.cuda.empty_cache()

    bytes_per_mb = 1024**2
    report = (
        ("Current GPU Memory Allocated", torch.cuda.memory_allocated),
        ("Maximum GPU Memory Allocated", torch.cuda.max_memory_allocated),
        ("Current GPU Memory Reserved", torch.cuda.memory_reserved),
        ("Maximum GPU Memory Reserved", torch.cuda.max_memory_reserved),
    )
    for label, query in report:
        print(f"{label}: {query(0) / bytes_per_mb:.2f} MB")


def capture_timestamp_utc():
    """Return the current time as a timezone-aware `datetime` in UTC."""
    now_utc = datetime.now(tz=timezone.utc)
    return now_utc


def say(text, blocking=False):
    """Speak `text` aloud with the platform's text-to-speech command (best effort).

    Uses `say` on macOS, `spd-say` on Linux and PowerShell's `System.Speech` on Windows. The command
    is started without a shell, so quotes or shell metacharacters in `text` are passed literally
    and cannot break or inject commands. If the platform is unsupported or the command cannot be
    started, a warning is logged and the function returns.

    Args:
        text: The text to speak.
        blocking: If True, wait for the speech command to finish before returning.
    """
    import subprocess  # local import: only this function needs it

    text = str(text)
    system = platform.system()

    # Check if mac, linux, or windows.
    if system == "Darwin":
        cmd = ["say", text]
    elif system == "Linux":
        cmd = ["spd-say", text]
        if blocking:
            cmd.append("--wait")
    elif system == "Windows":
        # Inside a single-quoted PowerShell string, a literal quote is written as two quotes.
        escaped = text.replace("'", "''")
        cmd = [
            "PowerShell",
            "-Command",
            "Add-Type -AssemblyName System.Speech; "
            f"(New-Object System.Speech.Synthesis.SpeechSynthesizer).Speak('{escaped}')",
        ]
    else:
        logging.warning(f"Text-to-speech is not supported on platform '{system}'.")
        return

    try:
        if blocking:
            # The exit status is deliberately ignored: speech is auxiliary feedback.
            subprocess.run(cmd, check=False)
        else:
            subprocess.Popen(cmd)
    except OSError as err:
        # E.g. the speech command is not installed.
        logging.warning(f"Could not run text-to-speech command '{cmd[0]}': {err}")


def log_say(text, play_sounds, blocking=False):
    """Log `text` at INFO level and, when `play_sounds` is truthy, also pass it to `say`.

    Args:
        text: Message to log (and optionally speak).
        play_sounds: Whether to call `say` in addition to logging.
        blocking: Forwarded to `say`.
    """
    logging.info(text)

    if not play_sounds:
        return
    say(text, blocking)
Add copyrights (#157) 2024-05-15 12:13:09 +02:00			`#!/usr/bin/env python`

			`# Copyright 2024 The HuggingFace Inc. team. All rights reserved.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`
Clean logging, Refactor 2024-02-29 23:13:06 +00:00			`import logging`
Provide more information to the user (#358) Co-authored-by: Alexander Soare <alexander.soare159@gmail.com> Co-authored-by: Remi <re.cadene@gmail.com> 2024-08-23 18:00:35 +08:00			`import os`
finish examples 2 and 3 2024-03-26 16:13:40 +00:00			`import os.path as osp`
Refactor `record` with `add_frame` (#468) Co-authored-by: Simon Alibert <75076266+aliberts@users.noreply.github.com> 2024-10-16 20:51:35 +02:00			`import platform`
Add common, refactor eval with eval_policy 2024-01-31 13:48:12 +00:00			`import random`
Add context manager for seeding (#164) 2024-05-09 17:58:39 +01:00			`from contextlib import contextmanager`
Add real robot devices and scripts to control real robot (#288) Co-authored-by: Simon Alibert <alibert.sim@gmail.com> 2024-07-15 17:43:10 +02:00			`from datetime import datetime, timezone`
finish examples 2 and 3 2024-03-26 16:13:40 +00:00			`from pathlib import Path`
Add resume training (#205) Co-authored-by: Remi <re.cadene@gmail.com> 2024-05-28 12:04:23 +01:00			`from typing import Any, Generator`
Add common, refactor eval with eval_policy 2024-01-31 13:48:12 +00:00
finish examples 2 and 3 2024-03-26 16:13:40 +00:00			`import hydra`
Add common, refactor eval with eval_policy 2024-01-31 13:48:12 +00:00			`import numpy as np`
			`import torch`
finish examples 2 and 3 2024-03-26 16:13:40 +00:00			`from omegaconf import DictConfig`
Add common, refactor eval with eval_policy 2024-01-31 13:48:12 +00:00

Refactor `record` with `add_frame` (#468) Co-authored-by: Simon Alibert <75076266+aliberts@users.noreply.github.com> 2024-10-16 20:51:35 +02:00			`def none_or_int(value):`
			`if value == "None":`
			`return None`
			`return int(value)`


Provide more information to the user (#358) Co-authored-by: Alexander Soare <alexander.soare159@gmail.com> Co-authored-by: Remi <re.cadene@gmail.com> 2024-08-23 18:00:35 +08:00			`def inside_slurm():`
			`"""Check whether the python process was launched through slurm"""`
			# TODO(rcadene): return False for interactive mode `--pty bash`
			`return "SLURM_JOB_ID" in os.environ`


Add get_safe_torch_device in policies 2024-03-20 18:38:55 +01:00			`def get_safe_torch_device(cfg_device: str, log: bool = False) -> torch.device:`
backup wip 2024-04-11 17:51:35 +01:00			`"""Given a string, return a torch.device with checks on whether the device is available."""`
Add get_safe_torch_device in policies 2024-03-20 18:38:55 +01:00			`match cfg_device:`
			`case "cuda":`
			`assert torch.cuda.is_available()`
			`device = torch.device("cuda")`
			`case "mps":`
			`assert torch.backends.mps.is_available()`
			`device = torch.device("mps")`
			`case "cpu":`
			`device = torch.device("cpu")`
			`if log:`
			`logging.warning("Using CPU, this will be slow.")`
			`case _:`
			`device = torch.device(cfg_device)`
			`if log:`
			`logging.warning(f"Using custom {cfg_device} device.")`

			`return device`


Add resume training (#205) Co-authored-by: Remi <re.cadene@gmail.com> 2024-05-28 12:04:23 +01:00			`def get_global_random_state() -> dict[str, Any]:`
			"""Get the random state for `random`, `numpy`, and `torch`."""
			`random_state_dict = {`
			`"random_state": random.getstate(),`
			`"numpy_random_state": np.random.get_state(),`
			`"torch_random_state": torch.random.get_rng_state(),`
			`}`
			`if torch.cuda.is_available():`
			`random_state_dict["torch_cuda_random_state"] = torch.cuda.random.get_rng_state()`
			`return random_state_dict`


			`def set_global_random_state(random_state_dict: dict[str, Any]):`
			"""Set the random state for `random`, `numpy`, and `torch`.

			`Args:`
			random_state_dict: A dictionary of the form returned by `get_global_random_state`.
			`"""`
			`random.setstate(random_state_dict["random_state"])`
			`np.random.set_state(random_state_dict["numpy_random_state"])`
			`torch.random.set_rng_state(random_state_dict["torch_random_state"])`
			`if torch.cuda.is_available():`
			`torch.cuda.random.set_rng_state(random_state_dict["torch_cuda_random_state"])`


Renamed set_seed -> set_global_seed 2024-03-25 17:19:28 +01:00			`def set_global_seed(seed):`
Add common, refactor eval with eval_policy 2024-01-31 13:48:12 +00:00			`"""Set seed for reproducibility."""`
			`random.seed(seed)`
			`np.random.seed(seed)`
			`torch.manual_seed(seed)`
Add resume training (#205) Co-authored-by: Remi <re.cadene@gmail.com> 2024-05-28 12:04:23 +01:00			`if torch.cuda.is_available():`
			`torch.cuda.manual_seed_all(seed)`
Clean logging, Refactor 2024-02-29 23:13:06 +00:00

Add context manager for seeding (#164) 2024-05-09 17:58:39 +01:00			`@contextmanager`
			`def seeded_context(seed: int) -> Generator[None, None, None]:`
			`"""Set the seed when entering a context, and restore the prior random state at exit.`

			`Example usage:`

			```
			`a = random.random() # produces some random number`
			`with seeded_context(1337):`
			`b = random.random() # produces some other random number`
			c = random.random() # produces yet another random number, but the same it would have if we never made `b`
			```
			`"""`
Add resume training (#205) Co-authored-by: Remi <re.cadene@gmail.com> 2024-05-28 12:04:23 +01:00			`random_state_dict = get_global_random_state()`
Add context manager for seeding (#164) 2024-05-09 17:58:39 +01:00			`set_global_seed(seed)`
			`yield None`
Add resume training (#205) Co-authored-by: Remi <re.cadene@gmail.com> 2024-05-28 12:04:23 +01:00			`set_global_random_state(random_state_dict)`
Add context manager for seeding (#164) 2024-05-09 17:58:39 +01:00

Clean logging, Refactor 2024-02-29 23:13:06 +00:00			`def init_logging():`
			`def custom_format(record):`
			`dt = datetime.now().strftime("%Y-%m-%d %H:%M:%S")`
			`fnameline = f"{record.pathname}:{record.lineno}"`
			`message = f"{record.levelname} {dt} {fnameline[-15:]:>15} {record.msg}"`
			`return message`

			`logging.basicConfig(level=logging.INFO)`

			`for handler in logging.root.handlers[:]:`
			`logging.root.removeHandler(handler)`

			`formatter = logging.Formatter()`
			`formatter.format = custom_format`
			`console_handler = logging.StreamHandler()`
			`console_handler.setFormatter(formatter)`
			`logging.getLogger().addHandler(console_handler)`


Add precision param to format_big_number (#232) 2024-05-31 18:19:01 +10:00			`def format_big_number(num, precision=0):`
Clean logging, Refactor 2024-02-29 23:13:06 +00:00			`suffixes = ["", "K", "M", "B", "T", "Q"]`
			`divisor = 1000.0`

			`for suffix in suffixes:`
			`if abs(num) < divisor:`
Add precision param to format_big_number (#232) 2024-05-31 18:19:01 +10:00			`return f"{num:.{precision}f}{suffix}"`
Clean logging, Refactor 2024-02-29 23:13:06 +00:00			`num /= divisor`

			`return num`
finish examples 2 and 3 2024-03-26 16:13:40 +00:00

			`def _relative_path_between(path1: Path, path2: Path) -> Path:`
			`"""Returns path1 relative to path2."""`
			`path1 = path1.absolute()`
			`path2 = path2.absolute()`
			`try:`
			`return path1.relative_to(path2)`
			`except ValueError: # most likely because path1 is not a subpath of path2`
			`common_parts = Path(osp.commonpath([path1, path2])).parts`
			`return Path(`
			`"/".join([".."] * (len(path2.parts) - len(common_parts)) + list(path1.parts[len(common_parts) :]))`
			`)`


			`def init_hydra_config(config_path: str, overrides: list[str] \| None = None) -> DictConfig:`
			`"""Initialize a Hydra config given only the path to the relevant config file.`

			`For config resolution, it is assumed that the config file's parent is the Hydra config dir.`
			`"""`
fix tests 2024-03-26 16:40:54 +00:00			`# TODO(alexander-soare): Resolve configs without Hydra initialization.`
			`hydra.core.global_hydra.GlobalHydra.instance().clear()`
finish examples 2 and 3 2024-03-26 16:13:40 +00:00			`# Hydra needs a path relative to this file.`
			`hydra.initialize(`
Remove warnings (#111) - Replace `use_pretrained_backbone` with `pretrained_backbone_weights` - Bump diffusers' minimum version `0.26.3` -> `0.27.2` - Add ignore flags in CI's pytest - Change Box observation spaces in simulation environments - Set `version_base="1.2"` in Hydra initializations - Bump einops' minimum version `0.7.0` -> `0.8.0` 2024-04-29 00:31:33 +02:00			`str(_relative_path_between(Path(config_path).absolute().parent, Path(__file__).absolute().parent)),`
			`version_base="1.2",`
finish examples 2 and 3 2024-03-26 16:13:40 +00:00			`)`
			`cfg = hydra.compose(Path(config_path).stem, overrides)`
			`return cfg`
fix memory leak due to itertools.cycle 2024-04-05 10:59:32 +00:00

			`def print_cuda_memory_usage():`
print_cuda_memory_usage docstring 2024-04-10 16:03:39 +00:00			`"""Use this function to locate and debug memory leak."""`
fix memory leak due to itertools.cycle 2024-04-05 10:59:32 +00:00			`import gc`

			`gc.collect()`
			`# Also clear the cache if you want to fully release the memory`
			`torch.cuda.empty_cache()`
			`print("Current GPU Memory Allocated: {:.2f} MB".format(torch.cuda.memory_allocated(0) / 1024**2))`
			`print("Maximum GPU Memory Allocated: {:.2f} MB".format(torch.cuda.max_memory_allocated(0) / 1024**2))`
			`print("Current GPU Memory Reserved: {:.2f} MB".format(torch.cuda.memory_reserved(0) / 1024**2))`
			`print("Maximum GPU Memory Reserved: {:.2f} MB".format(torch.cuda.max_memory_reserved(0) / 1024**2))`
Add real robot devices and scripts to control real robot (#288) Co-authored-by: Simon Alibert <alibert.sim@gmail.com> 2024-07-15 17:43:10 +02:00

			`def capture_timestamp_utc():`
			`return datetime.now(timezone.utc)`
Refactor `record` with `add_frame` (#468) Co-authored-by: Simon Alibert <75076266+aliberts@users.noreply.github.com> 2024-10-16 20:51:35 +02:00

			`def say(text, blocking=False):`
			`# Check if mac, linux, or windows.`
			`if platform.system() == "Darwin":`
			`cmd = f'say "{text}"'`
Make `say(blocking=True)` work for Linux (#460) 2024-10-17 15:22:21 +01:00			`if not blocking:`
			`cmd += " &"`
Refactor `record` with `add_frame` (#468) Co-authored-by: Simon Alibert <75076266+aliberts@users.noreply.github.com> 2024-10-16 20:51:35 +02:00			`elif platform.system() == "Linux":`
			`cmd = f'spd-say "{text}"'`
Make `say(blocking=True)` work for Linux (#460) 2024-10-17 15:22:21 +01:00			`if blocking:`
			`cmd += " --wait"`
Refactor `record` with `add_frame` (#468) Co-authored-by: Simon Alibert <75076266+aliberts@users.noreply.github.com> 2024-10-16 20:51:35 +02:00			`elif platform.system() == "Windows":`
Make `say(blocking=True)` work for Linux (#460) 2024-10-17 15:22:21 +01:00			`# TODO(rcadene): Make blocking option work for Windows`
Refactor `record` with `add_frame` (#468) Co-authored-by: Simon Alibert <75076266+aliberts@users.noreply.github.com> 2024-10-16 20:51:35 +02:00			`cmd = (`
			`'PowerShell -Command "Add-Type -AssemblyName System.Speech; '`
			`f"(New-Object System.Speech.Synthesis.SpeechSynthesizer).Speak('{text}')\""`
			`)`

			`os.system(cmd)`


			`def log_say(text, play_sounds, blocking=False):`
			`logging.info(text)`

			`if play_sounds:`
			`say(text, blocking)`