# Description: Preload the dataset to cache_dir
# Copyright (C) 2024 Ronan Le Meillat
# License: Apache License 2.0
from datasets import load_dataset

# Dataset identifier passed to load_dataset.
dataset_id = "eltorio/ROCO-radiology"
# Directory passed to load_dataset as its cache_dir argument.
cache_dir = "/workspace/data"

# Requesting the "train" split with an explicit cache_dir is the point of this
# script: running it populates cache_dir so later loads can reuse the cached
# data. The returned dataset is kept in a module-level name but not used
# further here.
train_dataset = load_dataset(dataset_id, split="train", cache_dir=cache_dir)