Spaces:
Build error
Build error
| import datasets | |
| import logging | |
| import os | |
| from tqdm import tqdm | |
| PATH = "/Users/reshinthadithyan/master/research/code-research/carperai/pile-v2-small-filtered/data" | |
| dataset_subs = os.listdir(PATH) | |
| print(dataset_subs) | |
| for ds in tqdm(dataset_subs): | |
| try: | |
| print(ds) | |
| dataset = datasets.load_dataset("CarperAI/pile-v2-small-filtered",data_files=f"data/{ds}/data.json", split="train") | |
| dataset.save_to_disk(f"cache_ds/{ds}") | |
| except: | |
| print(f"Error at {ds}") |