"""Load the "allocine" dataset and save a copy to a local directory."""

from datasets import load_dataset

# Load the dataset identified by the name "allocine" through the `datasets`
# library. NOTE(review): presumably this resolves against the Hugging Face Hub
# and may download data on first use -- confirm network/cache expectations.
raw_datasets = load_dataset("allocine")

# Persist the loaded object under the relative path "my-arrow-datasets"
# (resolved against the current working directory).
raw_datasets.save_to_disk("my-arrow-datasets")