diff --git a/lerobot/common/datasets/video_utils.py b/lerobot/common/datasets/video_utils.py index 39c93c4e..b16ba0c0 100644 --- a/lerobot/common/datasets/video_utils.py +++ b/lerobot/common/datasets/video_utils.py @@ -162,9 +162,9 @@ def decode_video_frames_torchcodec( log_loaded_timestamps: bool = False, ) -> torch.Tensor: """Loads frames associated with the requested timestamps of a video using torchcodec. - + Note: Setting device="cuda" outside the main process, e.g. in data loader workers, will lead to CUDA initialization errors. - + Note: Video benefits from inter-frame compression. Instead of storing every frame individually, the encoder stores a reference frame (or a key frame) and subsequent frames as differences relative to that key frame. As a consequence, to access a requested frame, we need to load the preceding key frame,