import numpy as np
import random
import torch
from datasets import load_dataset
# Both calls read from the same dataset path; each one selects a single
# JSON file through ``data_files``.
# NOTE(review): 'allenai--c4' looks like a local directory / cache-style
# name rather than a Hub repo id -- confirm against the environment.
_C4_PATH = 'allenai--c4'

# Training data: the file named c4-train.00000-of-01024.json.
traindata = load_dataset(
    _C4_PATH,
    data_files='c4-train.00000-of-01024.json',
)
# Printed once the training load has returned.
print(1)

# Validation data: the file named c4-validation.00000-of-00008.json.
valdata = load_dataset(
    _C4_PATH,
    data_files='c4-validation.00000-of-00008.json',
)
# Printed once the validation load has returned.
print(2)