from datasets import load_dataset

# Load all available splits of the LongAlign-10k dataset; without a `split`
# argument the result is iterated below as a mapping of split name -> dataset.
dataset = load_dataset('THUDM/LongAlign-10k')

# Export each split to its own file. Writing every split to one fixed path
# would make each iteration overwrite the previous one, leaving only the last
# split on disk. When there is exactly one split, the historical path
# "/data/longalign.jsonl" is kept so existing consumers keep working.
single_split = len(dataset) == 1
for split, split_dataset in dataset.items():
    if single_split:
        output_path = "/data/longalign.jsonl"
    else:
        output_path = f"/data/longalign_{split}.jsonl"
    split_dataset.to_json(output_path)