# Fetch the LLaVA-Pretrain dataset from the Hugging Face Hub and write a copy
# of it to a local directory.
from datasets import load_dataset

# No `split` argument is passed, so all splits published by the repository
# are loaded.
dataset = load_dataset("liuhaotian/LLaVA-Pretrain")

# The target path is relative, so the directory is created under the current
# working directory. Note the directory name spells "LLaVa" with a lowercase
# final "a", unlike the Hub repository id above.
# The saved copy can be read back with
# `datasets.load_from_disk("LLaVa_Pretrain_dataset")`.
dataset.save_to_disk("LLaVa_Pretrain_dataset")