#!/usr/bin/env python3
import glob
import os

from datasets import load_dataset
# Local folder that is searched for .jsonl data files; replace with your folder path.
folder_path = "isp-data-json/"
# Hub dataset repository that every file is pushed to.
path = "pminervini/inverse-scaling"


def config_name_from_path(json_path):
    """Return the Hub config name derived from a data file path.

    The name is the part of the file's base name before the first
    underscore. The extension is removed first, so a file without any
    underscore (``foo.jsonl``) yields ``foo`` rather than ``foo.jsonl``.

    Args:
        json_path: Path to a data file, e.g. ``isp-data-json/foo_bar.jsonl``.

    Returns:
        The config name as a string, e.g. ``foo``.
    """
    stem, _ext = os.path.splitext(os.path.basename(json_path))
    return stem.split("_")[0]


def main():
    """Load each .jsonl file in ``folder_path`` and push it to ``path``.

    Every file is loaded with the "json" loader as a single split named
    "data" and pushed under the config name given by
    ``config_name_from_path``.
    """
    # glob returns matches in arbitrary order; sort for a deterministic upload order.
    json_files = sorted(glob.glob(os.path.join(folder_path, "*.jsonl")))
    for json_path in json_files:
        # NOTE(review): files sharing the same prefix before "_" map to the
        # same config name -- confirm that is intended.
        name = config_name_from_path(json_path)
        ds = load_dataset("json", data_files={"data": json_path})
        ds.push_to_hub(path, config_name=name)


if __name__ == "__main__":
    main()