import json
import random
import os, shutil
# Seed for the sampling RNG. The previous value was a set ({100, 200, 300}),
# which random.seed() rejects with TypeError; a single int is required.
random_seed = 100

DIR = 'ORIGINAL MATH DATASET'   # source root: one sub-directory per subject
TARGET_DIR = 'MATH DATASET'     # destination root, mirrors the sub-directories
SAMPLE_SIZE = 500               # number of files to copy


def _list_dataset_files(root):
    """Return sorted ``(sub_dir, file_name)`` pairs for files one level below *root*.

    Entries of *root* that are not directories, and entries of a
    sub-directory that are not regular files, are skipped so that stray
    files or nested folders cannot break listing or copying.
    """
    pairs = []
    # os.listdir() order is arbitrary; sort so a fixed seed always picks the
    # same files regardless of platform or filesystem.
    for sub_dir in sorted(os.listdir(root)):
        sub_path = os.path.join(root, sub_dir)
        if not os.path.isdir(sub_path):
            continue
        pairs.extend(
            (sub_dir, name)
            for name in sorted(os.listdir(sub_path))
            if os.path.isfile(os.path.join(sub_path, name))
        )
    return pairs


def sample_dataset(src_dir=DIR, dst_dir=TARGET_DIR, count=SAMPLE_SIZE,
                   seed=random_seed):
    """Copy a reproducible random sample of dataset files into *dst_dir*.

    Args:
        src_dir: Root directory containing one sub-directory per subject.
        dst_dir: Root directory to copy into; created if missing. Each
            sampled file lands in the same-named sub-directory.
        count: Number of files to sample. If fewer files are available,
            all of them are copied instead of raising ``ValueError``.
        seed: Seed for the private random generator used for sampling.

    Returns:
        The list of sampled ``(sub_dir, file_name)`` pairs, in sample order.

    Raises:
        OSError: If *src_dir* cannot be listed or a copy fails.
    """
    # A private generator keeps the sample independent of any other use of
    # the global ``random`` state.
    rng = random.Random(seed)
    candidates = _list_dataset_files(src_dir)
    chosen = rng.sample(candidates, min(count, len(candidates)))

    os.makedirs(dst_dir, exist_ok=True)
    for sub_dir, name in chosen:
        dst_sub = os.path.join(dst_dir, sub_dir)
        os.makedirs(dst_sub, exist_ok=True)
        shutil.copy(os.path.join(src_dir, sub_dir, name), dst_sub)
    return chosen


if __name__ == "__main__":
    sample_dataset()