From 6d726266fd9e643e6835f01eac385d02e9ca0168 Mon Sep 17 00:00:00 2001
From: CarolinePascal
Date: Tue, 22 Apr 2025 18:31:38 +0200
Subject: [PATCH] fix(audio load file): adding missing dimension when loading mono audio data

---
 src/lerobot/datasets/utils.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/lerobot/datasets/utils.py b/src/lerobot/datasets/utils.py
index c75aef4ef..34197fa6e 100644
--- a/src/lerobot/datasets/utils.py
+++ b/src/lerobot/datasets/utils.py
@@ -417,6 +417,11 @@ def load_image_as_numpy(
 
 def load_audio_from_path(fpath: str | Path) -> np.ndarray:
     audio_data, _ = read(fpath, dtype="float32")
+
+    # Fill missing channel dimension when loading mono audio data
+    if audio_data.ndim == 1:
+        audio_data = np.expand_dims(audio_data, axis=1)
+
     return audio_data
 
 