diff --git a/src/lerobot/scripts/lerobot_train.py b/src/lerobot/scripts/lerobot_train.py index b15e0cf3b..50e8a8b6b 100644 --- a/src/lerobot/scripts/lerobot_train.py +++ b/src/lerobot/scripts/lerobot_train.py @@ -255,8 +255,8 @@ def train(cfg: TrainPipelineConfig, accelerator: Accelerator | None = None): chunk_size = cfg.policy.chunk_size hf = dataset.hf_dataset total_frames = len(hf) - max_samples = total_frames - chunk_size - indices = np.arange(max_samples) + max_samples = min(1_000_000, total_frames - chunk_size) + indices = np.random.choice(total_frames - chunk_size, max_samples, replace=False) logging.info( f"use_delta_actions is enabled — computing delta action stats " f"from {max_samples} chunk samples (chunk_size={chunk_size})"