{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"name":"TrainIndGeneration.ipynb","provenance":[],"collapsed_sections":[]},"kernelspec":{"name":"python3","display_name":"Python 3"}},"cells":[{"cell_type":"code","metadata":{"id":"1DEMv7VevmPT","colab_type":"code","outputId":"3fcfa86b-84e5-46b3-b122-5105e481904a","executionInfo":{"status":"ok","timestamp":1591047259985,"user_tz":240,"elapsed":33503,"user":{"displayName":"Udai G. Nagpal","photoUrl":"","userId":"11423854453810789252"}},"colab":{"base_uri":"https://localhost:8080/","height":161}},"source":["%tensorflow_version 1.x\n","import numpy as np\n","import keras\n","\n","from google.colab import drive\n","drive.mount(\"/content/gdrive\", force_remount=True)\n"],"execution_count":0,"outputs":[{"output_type":"stream","text":["TensorFlow 1.x selected.\n"],"name":"stdout"},{"output_type":"stream","text":["Using TensorFlow backend.\n"],"name":"stderr"},{"output_type":"stream","text":["Go to this URL in a browser: https://accounts.google.com/o/oauth2/auth?client_id=947318989803-6bn6qk8qdgf4n4g3pfee6491hc0brc4i.apps.googleusercontent.com&redirect_uri=urn%3aietf%3awg%3aoauth%3a2.0%3aoob&response_type=code&scope=email%20https%3a%2f%2fwww.googleapis.com%2fauth%2fdocs.test%20https%3a%2f%2fwww.googleapis.com%2fauth%2fdrive%20https%3a%2f%2fwww.googleapis.com%2fauth%2fdrive.photos.readonly%20https%3a%2f%2fwww.googleapis.com%2fauth%2fpeopleapi.readonly\n","\n","Enter your authorization code:\n","··········\n","Mounted at /content/gdrive\n"],"name":"stdout"}]},{"cell_type":"markdown","metadata":{"id":"_wjEbk_B6973","colab_type":"text"},"source":["Code used in generating the indices within X_train_All of the initial training set for each active learning experiment (such that each class is equally represented)"]},{"cell_type":"code","metadata":{"id":"xjW5qz4_wH-b","colab_type":"code","outputId":"1efa164a-970a-4180-f55a-40488a119073","executionInfo":{"status":"ok","timestamp":1591048064101,"user_tz":240,"elapsed":28755,"user":{"displayName":"Udai G. Nagpal","photoUrl":"","userId":"11423854453810789252"}},"colab":{"base_uri":"https://localhost:8080/","height":90}},"source":["#Loading data\n","data_path = \"/content/gdrive/My Drive/FINAL_PAPER_ACTIVE_LEARNING_EXP/MNIST/\"\n","train_data = np.loadtxt(data_path + \"mnist_train.csv\", \n","\t\t  delimiter=\",\")\n","test_data = np.loadtxt(data_path + \"mnist_test.csv\", \n","\t\t delimiter=\",\") \n","y_train_All = train_data[:,0]\n","y_test = test_data[:,0]\n","X_train_All = train_data[:,1:].reshape((60000,28,28))\n","X_test = test_data[:,1:].reshape((10000,28,28)) \n","train_ind = np.arange(60000)\n","test_ind = np.arange(10000)\n","\n","y_test_original = y_test\n","print(len(np.argwhere(y_train_All == 7))+len(np.argwhere(y_train_All == 9)))\n","print(len(np.argwhere(y_test == 7))+len(np.argwhere(y_test == 9)))\n","\"\"\"\n","y_test = keras.utils.to_categorical(y_test, num_classes=10)\n","X_test = np.expand_dims(X_test[test_ind], axis=1)\n","folder_path = \"/content/gdrive/My Drive/FINAL_PAPER_ACTIVE_LEARNING_EXP/MNIST/MultiClass_AL_Scripts_v1/\"\n","out_folder_path = \"/content/gdrive/My Drive/FINAL_PAPER_ACTIVE_LEARNING_EXP/MNIST/MultiClass_AL_Results_v1/\"\n","\n","print(y_train_All[train_data_indices])\n","\"\"\""],"execution_count":0,"outputs":[{"output_type":"stream","text":["12214\n","2037\n"],"name":"stdout"},{"output_type":"execute_result","data":{"text/plain":["'\\ny_test = keras.utils.to_categorical(y_test, num_classes=10)\\nX_test = np.expand_dims(X_test[test_ind], axis=1)\\nfolder_path = \"/content/gdrive/My Drive/FINAL_PAPER_ACTIVE_LEARNING_EXP/MNIST/MultiClass_AL_Scripts_v1/\"\\nout_folder_path = \"/content/gdrive/My Drive/FINAL_PAPER_ACTIVE_LEARNING_EXP/MNIST/MultiClass_AL_Results_v1/\"\\n\\nprint(y_train_All[train_data_indices])\\n'"]},"metadata":{"tags":[]},"execution_count":15}]},{"cell_type":"code","metadata":{"id":"-U3G_n2vwdZp","colab_type":"code","outputId":"33bfaa8d-1b3c-46ec-9614-d1bd0695c683","executionInfo":{"status":"ok","timestamp":1587154300373,"user_tz":240,"elapsed":348,"user":{"displayName":"Udai Nagpal","photoUrl":"","userId":"13753938716573431194"}},"colab":{"base_uri":"https://localhost:8080/","height":90}},"source":["#Assembling and saving a balanced initial training set\n","train_ind_tmp = []\n","for digit in range(10):\n","  poss_digits = np.argwhere(y_train_All==digit).flatten()\n","  train_ind_tmp += list(np.random.choice(poss_digits, size=3, replace=False))\n","print(train_ind_tmp)\n","print(y_train_All[train_ind_tmp])\n","\n","np.save(folder_path+\"trainindices3.npy\", np.array(train_ind_tmp))"],"execution_count":0,"outputs":[{"output_type":"stream","text":["[52126, 21358, 44933, 52738, 30218, 9103, 15748, 7528, 46546, 51848, 1870, 18119, 10854, 56516, 3439, 26621, 21385, 29065, 34776, 15404, 54539, 41309, 36580, 30513, 31800, 39142, 42003, 31226, 8356, 49313]\n","[0. 0. 0. 1. 1. 1. 2. 2. 2. 3. 3. 3. 4. 4. 4. 5. 5. 5. 6. 6. 6. 7. 7. 7.\n"," 8. 8. 8. 9. 9. 9.]\n"],"name":"stdout"}]},{"cell_type":"code","metadata":{"id":"oiWqSONjxByZ","colab_type":"code","colab":{}},"source":[""],"execution_count":0,"outputs":[]}]}