{"nbformat":4,"nbformat_minor":4,"metadata":{"kernelspec":{"name":"python3","display_name":"Yandex DataSphere Kernel","language":"python"},"language_info":{"mimetype":"text/x-python","name":"python","codemirror_mode":{"version":3,"name":"ipython"},"nbconvert_exporter":"python","version":"3.7.7","file_extension":".py","pygments_lexer":"ipython3"},"notebookId":"778cae86-760d-4162-a46f-a32f25159f92"},"cells":[{"cell_type":"code","source":"import os\nimport subprocess\nfrom shutil import copyfile\nfrom random import Random, shuffle\n\nsplits = ['gridsearch', 'small_test', 'test']\n\n# Per-class quota: after shuffling, the first GRIDSEARCH_PER_CLASS files go to\n# splits[0], the next SMALL_TEST_PER_CLASS to splits[1], and the rest to splits[2].\nGRIDSEARCH_PER_CLASS = 3\nSMALL_TEST_PER_CLASS = 2\n\n# Default shuffle seed, fixed so that Restart & Run All reproduces the same split.\nSEED = 0\n\n\ndef make_split(dataset, seed=SEED):\n    \"\"\"Repack a class-per-folder dataset into gridsearch / small_test / test splits.\n\n    Every sub-directory of dataset is treated as one class. Its files are\n    shuffled and copied to ./{dataset}_repack/{split}/{class}/{file}.\n\n    Args:\n        dataset: path of the source directory (one sub-directory per class).\n        seed: seed for the shuffle; pass None for a non-reproducible split.\n\n    Raises:\n        FileExistsError: if ./{dataset}_repack already exists.\n    \"\"\"\n    # os.listdir returns entries in arbitrary order; sort so the seeded shuffle\n    # starts from the same sequence on every run and every machine.\n    class_names = sorted(\n        name for name in os.listdir(dataset)\n        if os.path.isdir(os.path.join(dataset, name))\n    )\n\n    repack_root = f'./{dataset}_repack'\n    # Deliberately not exist_ok: copying a new split on top of an old one could\n    # leave the same image in two different splits.\n    os.mkdir(repack_root)\n    for split in splits:\n        os.mkdir(os.path.join(repack_root, split))\n\n    rng = Random(seed)  # local generator: leaves the global random state untouched\n    for class_name in class_names:\n        class_dir = os.path.join(dataset, class_name)\n        file_names = sorted(\n            name for name in os.listdir(class_dir)\n            if os.path.isfile(os.path.join(class_dir, name))\n        )\n        rng.shuffle(file_names)\n\n        for split in splits:\n            os.mkdir(os.path.join(repack_root, split, class_name))\n\n        for index, file_name in enumerate(file_names):\n            if index < GRIDSEARCH_PER_CLASS:\n                cur_split = splits[0]\n            elif index < GRIDSEARCH_PER_CLASS + SMALL_TEST_PER_CLASS:\n                cur_split = splits[1]\n            else:\n                cur_split = splits[2]\n\n            copyfile(\n                os.path.join(class_dir, file_name),\n                os.path.join(repack_root, cur_split, class_name, file_name),\n            )","metadata":{"cellId":"0rhw9krjf13ixznptfklhke"},"outputs":[],"execution_count":null},{"cell_type":"code","source":"make_split('imagenet-r')","metadata":{"cellId":"rvge7mgrwry0oalspdr5k"},"outputs":[],"execution_count":null},{"cell_type":"code","source":"#!c1.8\nmake_split('imagenet/val')","metadata":{"cellId":"tqol6f3bnfv22o2g0rx4"},"outputs":[],"execution_count":null}]}