{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# EYEPACK, MESSIDOR-1, MESSIDOR-2 COMBINED ON APTOS"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading datasets...\n",
      "Combined dataset D contains 37379 samples:\n",
      "  - EyePACS: 35122 samples\n",
      "  - Messidor-1: 1200 samples\n",
      "  - Messidor-2: 1057 samples\n",
      "  - APTOS (to be evaluated): 3662 samples\n",
      "\n",
      "Calculating median theta for combined dataset D...\n",
      "Creating train/calibration split for conformal bounds...\n",
      "Calculating calibration MARD values...\n",
      "\n",
      "Combined dataset D conformal bounds:\n",
      "  - Mean MARD: 38.111575\n",
      "  - Std MARD: 10.958648\n",
      "  - Lower bound: 16.194278\n",
      "  - Upper bound: 60.028871\n",
      "\n",
      "Evaluating APTOS against combined dataset bounds...\n",
      "\n",
      "APTOS EVALUATION AGAINST COMBINED DATASET BOUNDS:\n",
      "  - Total APTOS samples: 3662\n",
      "  - APTOS samples outside combined bounds: 315\n",
      "  - Percentage outside: 8.60%\n",
      "\n",
      "APTOS points outside combined dataset bounds:\n",
      "  Point 1 (ID: 0083ee8054ee): MARD = 69.775539\n",
      "  Point 2 (ID: 0243404e8a00): MARD = 63.052424\n",
      "  Point 3 (ID: 033f2b43de6d): MARD = 66.086915\n",
      "  Point 4 (ID: 03747397839f): MARD = 60.886183\n",
      "  Point 5 (ID: 03b373718013): MARD = 64.983450\n",
      "  Point 6 (ID: 04d029cfb612): MARD = 62.026108\n",
      "  Point 7 (ID: 0519b934f6b1): MARD = 81.045599\n",
      "  Point 8 (ID: 052d9a3fe55a): MARD = 87.241807\n",
      "  Point 9 (ID: 0551676cc2aa): MARD = 65.770265\n",
      "  Point 10 (ID: 05b1bb2bdb81): MARD = 73.444397\n",
      "  Point 11 (ID: 07929d32b5b3): MARD = 70.609223\n",
      "  Point 12 (ID: 086d41d17da8): MARD = 60.416731\n",
      "  Point 13 (ID: 08b6e3240858): MARD = 72.992325\n",
      "  Point 14 (ID: 096436d68d06): MARD = 66.395213\n",
      "  Point 15 (ID: 09662e462531): MARD = 62.841948\n",
      "  Point 16 (ID: 0efc93ec838b): MARD = 62.173358\n",
      "  Point 17 (ID: 0eff8eacb2f7): MARD = 74.867855\n",
      "  Point 18 (ID: 0fb560f9adb2): MARD = 78.276552\n",
      "  Point 19 (ID: 0fc6829da85b): MARD = 63.627973\n",
      "  Point 20 (ID: 0fcfc6301f3d): MARD = 60.855146\n",
      "  Point 21 (ID: 103f97a2ab15): MARD = 63.888841\n",
      "  Point 22 (ID: 13063d1bc4ea): MARD = 61.610841\n",
      "  Point 23 (ID: 15bed5adde74): MARD = 73.177802\n",
      "  Point 24 (ID: 164cd5a3a6cd): MARD = 63.660418\n",
      "  Point 25 (ID: 172df1330a60): MARD = 62.934139\n",
      "  Point 26 (ID: 174db0854291): MARD = 61.499388\n",
      "  Point 27 (ID: 1891698febce): MARD = 66.198440\n",
      "  Point 28 (ID: 191348830ddf): MARD = 60.968320\n",
      "  Point 29 (ID: 19244004583f): MARD = 73.927800\n",
      "  Point 30 (ID: 1a03a7970337): MARD = 64.055424\n",
      "  Point 31 (ID: 1ab8d3431ffc): MARD = 60.119591\n",
      "  Point 32 (ID: 1b495ac025b7): MARD = 78.231208\n",
      "  Point 33 (ID: 1dd9adcbfff4): MARD = 69.250471\n",
      "  Point 34 (ID: 1e7ccd4a1c87): MARD = 71.050216\n",
      "  Point 35 (ID: 1e9224ccca95): MARD = 67.803763\n",
      "  Point 36 (ID: 1f31701dd61b): MARD = 69.474280\n",
      "  Point 37 (ID: 1f3f32efaf20): MARD = 62.851028\n",
      "  Point 38 (ID: 1f4bf8e28b41): MARD = 60.592397\n",
      "  Point 39 (ID: 2017cd92c63d): MARD = 65.478684\n",
      "  Point 40 (ID: 207a580de0ea): MARD = 65.276048\n",
      "  Point 41 (ID: 20d5fdd450ae): MARD = 61.848666\n",
      "  Point 42 (ID: 20f86e068276): MARD = 64.335383\n",
      "  Point 43 (ID: 21037f5c7790): MARD = 64.070132\n",
      "  Point 44 (ID: 22a6da005395): MARD = 70.415567\n",
      "  Point 45 (ID: 23175b7ef453): MARD = 60.436737\n",
      "  Point 46 (ID: 237aa50edc34): MARD = 76.986351\n",
      "  Point 47 (ID: 239f2c348ea4): MARD = 82.385745\n",
      "  Point 48 (ID: 269b44e628eb): MARD = 61.858973\n",
      "  Point 49 (ID: 276b14f72328): MARD = 65.957142\n",
      "  Point 50 (ID: 28503940d10b): MARD = 62.745683\n",
      "  Point 51 (ID: 28a4d00927b7): MARD = 73.872119\n",
      "  Point 52 (ID: 2994f17f58a5): MARD = 65.999853\n",
      "  Point 53 (ID: 2b074afdf626): MARD = 65.945884\n",
      "  Point 54 (ID: 2d07162a13b1): MARD = 70.264378\n",
      "  Point 55 (ID: 2d9d97a6e713): MARD = 64.881322\n",
      "  Point 56 (ID: 2dc647e00ad3): MARD = 63.824633\n",
      "  Point 57 (ID: 2f284b6a1940): MARD = 60.679468\n",
      "  Point 58 (ID: 2f8d14a7d390): MARD = 75.665150\n",
      "  Point 59 (ID: 30263a7d5609): MARD = 82.258369\n",
      "  Point 60 (ID: 3079490a4b9c): MARD = 62.883731\n",
      "  Point 61 (ID: 3132556f5352): MARD = 72.974522\n",
      "  Point 62 (ID: 33e8e26a75d4): MARD = 66.253281\n",
      "  Point 63 (ID: 3486f7096276): MARD = 63.010220\n",
      "  Point 64 (ID: 351e842842a2): MARD = 66.183549\n",
      "  Point 65 (ID: 35cd9832fc0a): MARD = 66.843951\n",
      "  Point 66 (ID: 3601dac9bed7): MARD = 73.301953\n",
      "  Point 67 (ID: 3694e8c8e09a): MARD = 70.841117\n",
      "  Point 68 (ID: 3710ff45299c): MARD = 68.397402\n",
      "  Point 69 (ID: 37c4dfe03aba): MARD = 61.085741\n",
      "  Point 70 (ID: 387138ddf43d): MARD = 68.799536\n",
      "  Point 71 (ID: 393fa5a023a5): MARD = 62.594855\n",
      "  Point 72 (ID: 3b018e8b7303): MARD = 71.140382\n",
      "  Point 73 (ID: 3b73a3a4a734): MARD = 60.497178\n",
      "  Point 74 (ID: 3ddb86eb530e): MARD = 64.791527\n",
      "  Point 75 (ID: 42a67337fa8e): MARD = 70.176007\n",
      "  Point 76 (ID: 42af7282349b): MARD = 68.026281\n",
      "  Point 77 (ID: 44976c3b11a6): MARD = 67.225389\n",
      "  Point 78 (ID: 44ecf3f4efa5): MARD = 68.485203\n",
      "  Point 79 (ID: 467b7d9d811c): MARD = 73.319234\n",
      "  Point 80 (ID: 47536db39f00): MARD = 60.513315\n",
      "  Point 81 (ID: 48543037d0b3): MARD = 66.176878\n",
      "  Point 82 (ID: 49386d603494): MARD = 63.362916\n",
      "  Point 83 (ID: 495255c7492f): MARD = 61.741858\n",
      "  Point 84 (ID: 496155f71d0a): MARD = 62.800278\n",
      "  Point 85 (ID: 4bcee3cbe232): MARD = 68.728570\n",
      "  Point 86 (ID: 4c52922f3bfd): MARD = 61.038761\n",
      "  Point 87 (ID: 4ccfa0b4e96c): MARD = 69.027190\n",
      "  Point 88 (ID: 4e4a6224a04e): MARD = 61.185852\n",
      "  Point 89 (ID: 4e6071b73120): MARD = 60.882270\n",
      "  Point 90 (ID: 4ecd1fdd1435): MARD = 65.872291\n",
      "  Point 91 (ID: 504a69096fcb): MARD = 70.026068\n",
      "  Point 92 (ID: 5090917a2676): MARD = 62.022411\n",
      "  Point 93 (ID: 50d8a8fb7737): MARD = 66.407356\n",
      "  Point 94 (ID: 510aa0a898fa): MARD = 61.144520\n",
      "  Point 95 (ID: 51a078d6d43a): MARD = 66.381662\n",
      "  Point 96 (ID: 51da6aebba8f): MARD = 67.108102\n",
      "  Point 97 (ID: 5257cb536da2): MARD = 67.709434\n",
      "  Point 98 (ID: 5264a54e1830): MARD = 60.880783\n",
      "  Point 99 (ID: 5265dc9acdf8): MARD = 60.489984\n",
      "  Point 100 (ID: 54bbe3da103e): MARD = 76.819638\n",
      "  Point 101 (ID: 5548a7961a3e): MARD = 75.095988\n",
      "  Point 102 (ID: 55fd453001cc): MARD = 68.616790\n",
      "  Point 103 (ID: 57f933d3d7c7): MARD = 64.462432\n",
      "  Point 104 (ID: 582f739b8f62): MARD = 64.978644\n",
      "  Point 105 (ID: 58c12863f33d): MARD = 63.006425\n",
      "  Point 106 (ID: 596f4fdb0004): MARD = 64.755290\n",
      "  Point 107 (ID: 59f3f70abddd): MARD = 61.168032\n",
      "  Point 108 (ID: 5a11d21c2828): MARD = 70.495404\n",
      "  Point 109 (ID: 5ad3dabeb2cd): MARD = 68.496240\n",
      "  Point 110 (ID: 5b301a6d1ac7): MARD = 82.596308\n",
      "  Point 111 (ID: 5b804948e35f): MARD = 64.168426\n",
      "  Point 112 (ID: 5cc6dea19614): MARD = 62.481917\n",
      "  Point 113 (ID: 5de4615a5161): MARD = 60.239756\n",
      "  Point 114 (ID: 5e7db41b3bee): MARD = 68.475322\n",
      "  Point 115 (ID: 61c2fbd16e38): MARD = 69.112875\n",
      "  Point 116 (ID: 63c7b0265775): MARD = 60.911713\n",
      "  Point 117 (ID: 64678182d8a8): MARD = 63.329898\n",
      "  Point 118 (ID: 650104ede84c): MARD = 63.962793\n",
      "  Point 119 (ID: 657859f893d9): MARD = 66.244139\n",
      "  Point 120 (ID: 65a3b13ad9a0): MARD = 76.786401\n",
      "  Point 121 (ID: 665ce639a331): MARD = 60.599833\n",
      "  Point 122 (ID: 684dd88a0d49): MARD = 60.371934\n",
      "  Point 123 (ID: 68987fb159ab): MARD = 60.929238\n",
      "  Point 124 (ID: 6b00cb764237): MARD = 63.329898\n",
      "  Point 125 (ID: 6b3860e8f64f): MARD = 62.423520\n",
      "  Point 126 (ID: 6baafa56895c): MARD = 80.486019\n",
      "  Point 127 (ID: 6bcce181be65): MARD = 85.438810\n",
      "  Point 128 (ID: 6d10709053ae): MARD = 62.382078\n",
      "  Point 129 (ID: 6d9effbcde78): MARD = 72.983702\n",
      "  Point 130 (ID: 6df8b7b6e837): MARD = 68.071690\n",
      "  Point 131 (ID: 6dfd80748e72): MARD = 62.748237\n",
      "  Point 132 (ID: 6e092b306fe1): MARD = 78.208948\n",
      "  Point 133 (ID: 6e0f78e188ff): MARD = 68.426708\n",
      "  Point 134 (ID: 6e68e742f5bc): MARD = 66.807085\n",
      "  Point 135 (ID: 6f4e0538d1e4): MARD = 69.412839\n",
      "  Point 136 (ID: 6fb656d506b2): MARD = 68.584018\n",
      "  Point 137 (ID: 6fe4751a3b42): MARD = 60.918669\n",
      "  Point 138 (ID: 705f508d1e42): MARD = 61.372171\n",
      "  Point 139 (ID: 70d0392397de): MARD = 71.774685\n",
      "  Point 140 (ID: 7131bf4c9e6f): MARD = 68.107041\n",
      "  Point 141 (ID: 72a867980067): MARD = 80.512557\n",
      "  Point 142 (ID: 7356dd08b0ae): MARD = 72.527088\n",
      "  Point 143 (ID: 74898f372d2b): MARD = 82.776100\n",
      "  Point 144 (ID: 77baa08a1345): MARD = 72.377638\n",
      "  Point 145 (ID: 7828dd083cdc): MARD = 62.764799\n",
      "  Point 146 (ID: 7a6495a39d87): MARD = 60.228785\n",
      "  Point 147 (ID: 7d3835e4e63a): MARD = 64.132266\n",
      "  Point 148 (ID: 7e6e90a93aa5): MARD = 64.235749\n",
      "  Point 149 (ID: 7eee3d1f1268): MARD = 66.367420\n",
      "  Point 150 (ID: 807135cbc438): MARD = 60.920286\n",
      "  Point 151 (ID: 8185ce1cdcef): MARD = 61.608579\n",
      "  Point 152 (ID: 81d79d53ed7b): MARD = 69.950972\n",
      "  Point 153 (ID: 83fda7c0500b): MARD = 63.756471\n",
      "  Point 154 (ID: 8693ab1fd2be): MARD = 60.867872\n",
      "  Point 155 (ID: 873dcc0b468f): MARD = 70.518490\n",
      "  Point 156 (ID: 87a9f4d20f07): MARD = 62.991597\n",
      "  Point 157 (ID: 8846b09384a4): MARD = 63.532050\n",
      "  Point 158 (ID: 8a482c024fc2): MARD = 67.264643\n",
      "  Point 159 (ID: 8a81f62320d6): MARD = 63.778269\n",
      "  Point 160 (ID: 8a9bef2fbd4e): MARD = 69.712296\n",
      "  Point 161 (ID: 8af50c9d0a86): MARD = 69.775655\n",
      "  Point 162 (ID: 8b079e79035f): MARD = 61.111943\n",
      "  Point 163 (ID: 8b568d47a1fd): MARD = 63.192168\n",
      "  Point 164 (ID: 8b76c3c5cb3e): MARD = 72.726537\n",
      "  Point 165 (ID: 8be6629a6039): MARD = 72.845434\n",
      "  Point 166 (ID: 8c0d05233238): MARD = 78.503482\n",
      "  Point 167 (ID: 8dc22e65c06f): MARD = 76.568259\n",
      "  Point 168 (ID: 8ff2733f6aef): MARD = 65.207491\n",
      "  Point 169 (ID: 8ff863f8874f): MARD = 72.162283\n",
      "  Point 170 (ID: 904b03ad5594): MARD = 77.532630\n",
      "  Point 171 (ID: 921433215353): MARD = 61.407128\n",
      "  Point 172 (ID: 9232dc06cfdc): MARD = 61.269721\n",
      "  Point 173 (ID: 93be637084a2): MARD = 63.971439\n",
      "  Point 174 (ID: 956765d5f46d): MARD = 64.890022\n",
      "  Point 175 (ID: 95a4cc805c7b): MARD = 68.116044\n",
      "  Point 176 (ID: 96a9706b8534): MARD = 61.269330\n",
      "  Point 177 (ID: 9910c827e2fe): MARD = 60.356335\n",
      "  Point 178 (ID: 99132193eaa0): MARD = 65.949274\n",
      "  Point 179 (ID: 9a1029536d78): MARD = 62.613879\n",
      "  Point 180 (ID: 9a496b1e20f9): MARD = 64.913933\n",
      "  Point 181 (ID: 9a78c6a7b1c2): MARD = 60.634275\n",
      "  Point 182 (ID: 9ac2e3e9fca5): MARD = 61.136331\n",
      "  Point 183 (ID: 9ae54843c69a): MARD = 71.759410\n",
      "  Point 184 (ID: 9ba469af2980): MARD = 63.408422\n",
      "  Point 185 (ID: 9bafbbd152d2): MARD = 76.124079\n",
      "  Point 186 (ID: 9c088d2d1559): MARD = 76.831585\n",
      "  Point 187 (ID: 9c514d2d5b3f): MARD = 68.317116\n",
      "  Point 188 (ID: 9da74370835a): MARD = 62.272491\n",
      "  Point 189 (ID: 9eaac43744f5): MARD = 62.781997\n",
      "  Point 190 (ID: 9f5a8665cf2e): MARD = 85.834265\n",
      "  Point 191 (ID: a1b12fdce6c3): MARD = 68.475322\n",
      "  Point 192 (ID: a1eb88562239): MARD = 61.353168\n",
      "  Point 193 (ID: a30a143a53a3): MARD = 66.296630\n",
      "  Point 194 (ID: a32b5ce3d48a): MARD = 65.794777\n",
      "  Point 195 (ID: a4359815f152): MARD = 65.868397\n",
      "  Point 196 (ID: a47878630dc2): MARD = 60.172170\n",
      "  Point 197 (ID: a6356a3c5d11): MARD = 69.781204\n",
      "  Point 198 (ID: a64273801bde): MARD = 78.001227\n",
      "  Point 199 (ID: a73c3d516c59): MARD = 65.783005\n",
      "  Point 200 (ID: a7ec056502e7): MARD = 69.871991\n",
      "  Point 201 (ID: a80dab8eddf4): MARD = 68.246387\n",
      "  Point 202 (ID: a88f68b0b114): MARD = 70.670479\n",
      "  Point 203 (ID: a8c9fcdbc0be): MARD = 68.100575\n",
      "  Point 204 (ID: aa5ce75edcf5): MARD = 68.495270\n",
      "  Point 205 (ID: aaaadb174012): MARD = 61.603412\n",
      "  Point 206 (ID: ab7991df166b): MARD = 66.416614\n",
      "  Point 207 (ID: ac81fc200162): MARD = 70.782043\n",
      "  Point 208 (ID: ae94ce412de9): MARD = 64.575624\n",
      "  Point 209 (ID: af133a85ea0c): MARD = 76.346851\n",
      "  Point 210 (ID: afc744fad65e): MARD = 66.333130\n",
      "  Point 211 (ID: b0f8613305a3): MARD = 67.522968\n",
      "  Point 212 (ID: b1197f2cc9b3): MARD = 63.183091\n",
      "  Point 213 (ID: b11dcdcbc8c8): MARD = 62.938407\n",
      "  Point 214 (ID: b17f0b81dab3): MARD = 65.089326\n",
      "  Point 215 (ID: b43440c6ebe4): MARD = 64.063939\n",
      "  Point 216 (ID: b460ca9fa26f): MARD = 65.935021\n",
      "  Point 217 (ID: b4f41b5bf0ef): MARD = 66.273419\n",
      "  Point 218 (ID: b56340f472d2): MARD = 62.707305\n",
      "  Point 219 (ID: b576c5269ad1): MARD = 69.854687\n",
      "  Point 220 (ID: b5bf7b84fc66): MARD = 64.401425\n",
      "  Point 221 (ID: b5e6ae31493c): MARD = 60.876964\n",
      "  Point 222 (ID: b665041e1633): MARD = 66.744557\n",
      "  Point 223 (ID: b66f23ffa730): MARD = 65.332750\n",
      "  Point 224 (ID: b6fd109b1bc9): MARD = 68.133465\n",
      "  Point 225 (ID: b8f1b30877db): MARD = 61.210124\n",
      "  Point 226 (ID: b94c58d063bf): MARD = 62.626701\n",
      "  Point 227 (ID: b9fe7da14a32): MARD = 67.001683\n",
      "  Point 228 (ID: ba08cee68c71): MARD = 68.323033\n",
      "  Point 229 (ID: bb11db08584a): MARD = 67.629497\n",
      "  Point 230 (ID: bb45257258cc): MARD = 60.724052\n",
      "  Point 231 (ID: bb5083fae98f): MARD = 64.181368\n",
      "  Point 232 (ID: bcb0498ed2c1): MARD = 80.790263\n",
      "  Point 233 (ID: bde1063a5dd7): MARD = 80.708090\n",
      "  Point 234 (ID: beb00fa6e7c9): MARD = 63.080658\n",
      "  Point 235 (ID: bfb578c0e8d8): MARD = 60.568537\n",
      "  Point 236 (ID: c0202976c670): MARD = 77.917507\n",
      "  Point 237 (ID: c096131ad065): MARD = 60.369011\n",
      "  Point 238 (ID: c1896142a20a): MARD = 61.190933\n",
      "  Point 239 (ID: c1ebe785503a): MARD = 75.955391\n",
      "  Point 240 (ID: c7c3d363bc86): MARD = 66.248974\n",
      "  Point 241 (ID: c9485c38fdd5): MARD = 64.785556\n",
      "  Point 242 (ID: ca7570c5925c): MARD = 61.310100\n",
      "  Point 243 (ID: cab3dfa7962d): MARD = 65.334928\n",
      "  Point 244 (ID: cd972e5639e0): MARD = 67.798014\n",
      "  Point 245 (ID: cd9e2190c73f): MARD = 65.021365\n",
      "  Point 246 (ID: ce6f33a81ad5): MARD = 61.074387\n",
      "  Point 247 (ID: ce887b196c23): MARD = 61.864732\n",
      "  Point 248 (ID: cfb17a7cc8d4): MARD = 62.856165\n",
      "  Point 249 (ID: cfd1bd0fcbb4): MARD = 64.136212\n",
      "  Point 250 (ID: d02b79fc3200): MARD = 60.785972\n",
      "  Point 251 (ID: d1b279cc02ae): MARD = 64.709066\n",
      "  Point 252 (ID: d1ca85af57c9): MARD = 62.767354\n",
      "  Point 253 (ID: d25b8a8ad3c4): MARD = 60.565766\n",
      "  Point 254 (ID: d26bc6e1230d): MARD = 68.185766\n",
      "  Point 255 (ID: d3be5346684b): MARD = 68.835117\n",
      "  Point 256 (ID: d5ad3362424c): MARD = 64.615529\n",
      "  Point 257 (ID: d6dbb0820ea5): MARD = 60.878252\n",
      "  Point 258 (ID: d6f6bdfd8011): MARD = 62.931490\n",
      "  Point 259 (ID: d78b7401096f): MARD = 64.410907\n",
      "  Point 260 (ID: d7bc62d60e8c): MARD = 63.031308\n",
      "  Point 261 (ID: d81338217fc5): MARD = 61.734800\n",
      "  Point 262 (ID: d99dd99be001): MARD = 75.707443\n",
      "  Point 263 (ID: d9ad2a0ec026): MARD = 68.872182\n",
      "  Point 264 (ID: da6bbb76d562): MARD = 64.823679\n",
      "  Point 265 (ID: dc0eea0b68a7): MARD = 68.706545\n",
      "  Point 266 (ID: dc6fa1b38b83): MARD = 64.827887\n",
      "  Point 267 (ID: de57c9e9fa93): MARD = 77.214458\n",
      "  Point 268 (ID: de730033c683): MARD = 62.415324\n",
      "  Point 269 (ID: dfea19863428): MARD = 61.196254\n",
      "  Point 270 (ID: e1418d28d668): MARD = 76.113935\n",
      "  Point 271 (ID: e150935f66a6): MARD = 62.083237\n",
      "  Point 272 (ID: e2a233493b90): MARD = 62.189244\n",
      "  Point 273 (ID: e30a890600e1): MARD = 61.587469\n",
      "  Point 274 (ID: e3a7671f787b): MARD = 72.728248\n",
      "  Point 275 (ID: e540d2e35d15): MARD = 68.284512\n",
      "  Point 276 (ID: e580676516b0): MARD = 72.907263\n",
      "  Point 277 (ID: e65f94ad9be3): MARD = 73.025853\n",
      "  Point 278 (ID: e6a6acf7fca1): MARD = 64.105344\n",
      "  Point 279 (ID: e7291472109b): MARD = 63.539816\n",
      "  Point 280 (ID: e7a7187066ad): MARD = 61.864732\n",
      "  Point 281 (ID: e821c1b6417a): MARD = 63.594297\n",
      "  Point 282 (ID: e966850247f4): MARD = 64.451678\n",
      "  Point 283 (ID: e9f3c85a2a02): MARD = 69.429660\n",
      "  Point 284 (ID: e9f82b5bbaf4): MARD = 60.701366\n",
      "  Point 285 (ID: eae70f527755): MARD = 68.699246\n",
      "  Point 286 (ID: eb32a815f78c): MARD = 66.918768\n",
      "  Point 287 (ID: ec0c9f817b03): MARD = 67.268647\n",
      "  Point 288 (ID: ed2ef440d22c): MARD = 62.135870\n",
      "  Point 289 (ID: ed88faaa325a): MARD = 62.126076\n",
      "  Point 290 (ID: ee059945b08a): MARD = 61.136044\n",
      "  Point 291 (ID: eebd1e195952): MARD = 72.304332\n",
      "  Point 292 (ID: f002ce614c59): MARD = 66.802263\n",
      "  Point 293 (ID: f02057c41256): MARD = 68.673821\n",
      "  Point 294 (ID: f06e7a9df795): MARD = 63.062373\n",
      "  Point 295 (ID: f09cfc6a4dbd): MARD = 66.364420\n",
      "  Point 296 (ID: f0c13be90519): MARD = 78.073656\n",
      "  Point 297 (ID: f2ee81781411): MARD = 66.149451\n",
      "  Point 298 (ID: f3a268d2726d): MARD = 60.610805\n",
      "  Point 299 (ID: f4e68b61f480): MARD = 63.214709\n",
      "  Point 300 (ID: f66c4ee86629): MARD = 81.541568\n",
      "  Point 301 (ID: f6f3ea0d2693): MARD = 67.803763\n",
      "  Point 302 (ID: f6f7dba7104d): MARD = 65.591157\n",
      "  Point 303 (ID: f71333204618): MARD = 68.271020\n",
      "  Point 304 (ID: f72adcac5638): MARD = 72.101318\n",
      "  Point 305 (ID: f85c78201a50): MARD = 61.030228\n",
      "  Point 306 (ID: f8d62557ad0c): MARD = 65.668316\n",
      "  Point 307 (ID: fa9bece586fc): MARD = 67.938269\n",
      "  Point 308 (ID: fb6b8200b7f8): MARD = 69.449438\n",
      "  Point 309 (ID: fb767cea406c): MARD = 63.801105\n",
      "  Point 310 (ID: fba493e17448): MARD = 68.389497\n",
      "  Point 311 (ID: fcc32dffd24d): MARD = 78.084940\n",
      "  Point 312 (ID: fd4c946c52bf): MARD = 67.963220\n",
      "  Point 313 (ID: fdc685055659): MARD = 68.660932\n",
      "  Point 314 (ID: fe3f62695b2d): MARD = 60.425970\n",
      "  Point 315 (ID: ff8a0b45c789): MARD = 60.757206\n",
      "\n",
      "Results saved to /drive2/Kuntal/Pysindy-experiment/conformal_boundary/cross_dataset_evaluation\n",
      "Point of note: The percentage outside (8.60%) should be compared with APTOS accuracy from literature.\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from sklearn.model_selection import train_test_split\n",
    "\n",
    "# ─── CONFIG ────────────────────────────────────────────────────────────────\n",
    "BASE_DIR = \"/drive2/Kuntal/Pysindy-experiment\"\n",
    "OUTPUT_DIR = f\"{BASE_DIR}/conformal_boundary/cross_dataset_evaluation\"\n",
    "\n",
    "# Dataset paths\n",
    "APTOS_DATA_DIR = f\"{BASE_DIR}/aptos_theta_data\"\n",
    "EYEPACS_DATA_DIR = f\"{BASE_DIR}/eyepacs_theta_data\"\n",
    "M1_DATA_DIR = f\"{BASE_DIR}/M1-output\"\n",
    "M2_DATA_DIR = f\"{BASE_DIR}/M2-output\"\n",
    "\n",
    "# Create output directory\n",
    "os.makedirs(OUTPUT_DIR, exist_ok=True)\n",
    "\n",
    "# ─── MARD CALCULATION FUNCTION ─────────────────────────────────────────────\n",
    "def calculate_robust_mard(theta1, theta2, max_value=100.0):\n",
    "    \"\"\"\n",
    "    Calculate Mean Absolute Relative Difference with numerical stability improvements\n",
    "    \"\"\"\n",
    "    epsilon = 1e-6  # Larger epsilon to avoid extreme values\n",
    "    \n",
    "    # Flatten the theta arrays if they are not already flat\n",
    "    if theta1.ndim > 1:\n",
    "        theta1_flat = theta1.flatten()\n",
    "        theta2_flat = theta2.flatten()\n",
    "    else:\n",
    "        theta1_flat = theta1\n",
    "        theta2_flat = theta2\n",
    "    \n",
    "    # Calculate absolute relative differences with capping\n",
    "    abs_diff = np.abs(theta1_flat - theta2_flat)\n",
    "    denominator = np.abs(theta2_flat) + epsilon\n",
    "    rel_diff = abs_diff / denominator\n",
    "    \n",
    "    # Cap extreme values\n",
    "    rel_diff = np.minimum(rel_diff, max_value)\n",
    "    \n",
    "    # Return mean of absolute relative differences\n",
    "    return np.mean(rel_diff)\n",
    "\n",
    "def main():\n",
    "    # Load theta arrays from all datasets\n",
    "    print(\"Loading datasets...\")\n",
    "    eyepacs_thetas = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_all_thetas.npy\"), allow_pickle=True)\n",
    "    eyepacs_ids = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor1_thetas = np.load(os.path.join(M1_DATA_DIR, \"messidor_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor1_ids = np.load(os.path.join(M1_DATA_DIR, \"messidor_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor2_thetas = np.load(os.path.join(M2_DATA_DIR, \"messidor2_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor2_ids = np.load(os.path.join(M2_DATA_DIR, \"messidor2_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    aptos_thetas = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_all_thetas.npy\"), allow_pickle=True)\n",
    "    aptos_ids = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    # Combine Messidor-1, Messidor-2, and EyePACS into dataset D\n",
    "    combined_thetas = np.concatenate([eyepacs_thetas, messidor1_thetas, messidor2_thetas])\n",
    "    combined_ids = np.concatenate([eyepacs_ids, messidor1_ids, messidor2_ids])\n",
    "    \n",
    "    print(f\"Combined dataset D contains {len(combined_thetas)} samples:\")\n",
    "    print(f\"  - EyePACS: {len(eyepacs_thetas)} samples\")\n",
    "    print(f\"  - Messidor-1: {len(messidor1_thetas)} samples\")\n",
    "    print(f\"  - Messidor-2: {len(messidor2_thetas)} samples\")\n",
    "    print(f\"  - APTOS (to be evaluated): {len(aptos_thetas)} samples\")\n",
    "    \n",
    "    # Step 1: Calculate the median theta for the combined dataset D\n",
    "    print(\"\\nCalculating median theta for combined dataset D...\")\n",
    "    combined_stacked = np.stack(combined_thetas)\n",
    "    combined_median_theta = np.median(combined_stacked, axis=0)\n",
    "    \n",
    "    # Step 2: Create train/calibration split for the combined dataset\n",
    "    print(\"Creating train/calibration split for conformal bounds...\")\n",
    "    combined_train, combined_calibration = train_test_split(\n",
    "        combined_thetas, test_size=0.4, random_state=42\n",
    "    )\n",
    "    \n",
    "    # Step 3: Calculate MARD values for the calibration set\n",
    "    print(\"Calculating calibration MARD values...\")\n",
    "    calibration_mard_values = []\n",
    "    for theta in combined_calibration:\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        calibration_mard_values.append(mard)\n",
    "    \n",
    "    calibration_mard_values = np.array(calibration_mard_values)\n",
    "    \n",
    "    # Step 4: Establish conformal bounds for the combined dataset\n",
    "    mean_mard = np.mean(calibration_mard_values)\n",
    "    std_mard = np.std(calibration_mard_values)\n",
    "    \n",
    "    # Calculate conformal boundaries, ensuring non-negative lower bound\n",
    "    lower_bound = max(0, mean_mard - 2 * std_mard)\n",
    "    upper_bound = mean_mard + 2 * std_mard\n",
    "    \n",
    "    print(f\"\\nCombined dataset D conformal bounds:\")\n",
    "    print(f\"  - Mean MARD: {mean_mard:.6f}\")\n",
    "    print(f\"  - Std MARD: {std_mard:.6f}\")\n",
    "    print(f\"  - Lower bound: {lower_bound:.6f}\")\n",
    "    print(f\"  - Upper bound: {upper_bound:.6f}\")\n",
    "    \n",
    "    # Step 5: Evaluate APTOS against the combined dataset bounds\n",
    "    print(\"\\nEvaluating APTOS against combined dataset bounds...\")\n",
    "    aptos_mard_values = []\n",
    "    aptos_in_domain_flags = []\n",
    "    aptos_outside_indices = []\n",
    "    \n",
    "    for i, theta in enumerate(aptos_thetas):\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        aptos_mard_values.append(mard)\n",
    "        \n",
    "        # Check if this sample falls within the combined dataset bounds\n",
    "        in_domain = lower_bound <= mard <= upper_bound\n",
    "        aptos_in_domain_flags.append(in_domain)\n",
    "        \n",
    "        # Store indices of samples that fall outside bounds\n",
    "        if not in_domain:\n",
    "            aptos_outside_indices.append(i)\n",
    "    \n",
    "    # Calculate statistics\n",
    "    total_aptos = len(aptos_thetas)\n",
    "    outside_count = sum(not flag for flag in aptos_in_domain_flags)\n",
    "    percentage_outside = (outside_count / total_aptos) * 100\n",
    "    \n",
    "    print(f\"\\nAPTOS EVALUATION AGAINST COMBINED DATASET BOUNDS:\")\n",
    "    print(f\"  - Total APTOS samples: {total_aptos}\")\n",
    "    print(f\"  - APTOS samples outside combined bounds: {outside_count}\")\n",
    "    print(f\"  - Percentage outside: {percentage_outside:.2f}%\")\n",
    "    \n",
    "    # Save MARD values for APTOS points outside the combined bounds\n",
    "    if outside_count > 0:\n",
    "        print(\"\\nAPTOS points outside combined dataset bounds:\")\n",
    "        outside_mards = [aptos_mard_values[i] for i in aptos_outside_indices]\n",
    "        outside_ids = [aptos_ids[i] for i in aptos_outside_indices]\n",
    "        \n",
    "        for i, (idx, mard) in enumerate(zip(outside_ids, outside_mards)):\n",
    "            print(f\"  Point {i+1} (ID: {idx}): MARD = {mard:.6f}\")\n",
    "        \n",
    "        # Save to CSV\n",
    "        outside_df = pd.DataFrame({\n",
    "            'id': outside_ids,\n",
    "            'mard': outside_mards\n",
    "        })\n",
    "        outside_df.to_csv(os.path.join(OUTPUT_DIR, \"aptos_points_outside_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save all results to CSV\n",
    "    results_dict = {\n",
    "        'id': aptos_ids,\n",
    "        'mard': aptos_mard_values,\n",
    "        'in_domain': aptos_in_domain_flags\n",
    "    }\n",
    "    \n",
    "    results_df = pd.DataFrame(results_dict)\n",
    "    results_df.to_csv(os.path.join(OUTPUT_DIR, \"aptos_evaluation_against_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save combined dataset bounds for reference\n",
    "    with open(os.path.join(OUTPUT_DIR, \"combined_dataset_bounds.txt\"), 'w') as f:\n",
    "        f.write(f\"Mean MARD: {mean_mard}\\n\")\n",
    "        f.write(f\"Std MARD: {std_mard}\\n\")\n",
    "        f.write(f\"Lower bound (max(0, mean-2std)): {lower_bound}\\n\")\n",
    "        f.write(f\"Upper bound (mean+2std): {upper_bound}\\n\")\n",
    "        f.write(f\"Percentage of APTOS samples outside bounds: {percentage_outside:.2f}%\\n\")\n",
    "    \n",
    "    # Save the combined median theta for future use\n",
    "    np.save(os.path.join(OUTPUT_DIR, \"combined_median_theta.npy\"), combined_median_theta)\n",
    "    \n",
    "    print(f\"\\nResults saved to {OUTPUT_DIR}\")\n",
    "    print(f\"Point of note: The percentage outside ({percentage_outside:.2f}%) should be compared with APTOS accuracy from literature.\")\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    main()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#  APTOS , MESSIDOR-1, MESSIDOR-2 COMBINED ON EYEPACK,"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading datasets...\n",
      "Combined dataset D contains 5919 samples:\n",
      "  - APTOS: 3662 samples\n",
      "  - Messidor-1: 1200 samples\n",
      "  - Messidor-2: 1057 samples\n",
      "  - EyePACS (to be evaluated): 35122 samples\n",
      "\n",
      "Calculating median theta for combined dataset D (APTOS + M1 + M2)...\n",
      "Creating train/calibration split for conformal bounds...\n",
      "Calculating calibration MARD values...\n",
      "\n",
      "Combined dataset D conformal bounds:\n",
      "  - Mean MARD: 39.046265\n",
      "  - Std MARD: 10.553906\n",
      "  - Lower bound: 17.938453\n",
      "  - Upper bound: 60.154076\n",
      "\n",
      "Evaluating EyePACS against combined dataset bounds...\n",
      "\n",
      "EYEPACS EVALUATION AGAINST COMBINED DATASET BOUNDS:\n",
      "  - Total EyePACS samples: 35122\n",
      "  - EyePACS samples outside combined bounds: 1632\n",
      "  - Percentage outside: 4.65%\n",
      "\n",
      "EyePACS points outside combined dataset bounds:\n",
      "  Point 1 (ID: 30_right): MARD = 74.130376\n",
      "  Point 2 (ID: 36_left): MARD = 63.070297\n",
      "  Point 3 (ID: 36_right): MARD = 68.363566\n",
      "  Point 4 (ID: 47_left): MARD = 61.183707\n",
      "  Point 5 (ID: 51_right): MARD = 63.654737\n",
      "  Point 6 (ID: 58_left): MARD = 66.462211\n",
      "  Point 7 (ID: 62_left): MARD = 71.307947\n",
      "  Point 8 (ID: 82_left): MARD = 67.780744\n",
      "  Point 9 (ID: 82_right): MARD = 61.918156\n",
      "  Point 10 (ID: 161_left): MARD = 60.204596\n",
      "  ... and 1622 more\n",
      "\n",
      "Results saved to /drive2/Kuntal/Pysindy-experiment/conformal_boundary/cross_dataset_evaluation\n",
      "Point of note: The percentage outside (4.65%) should be compared with EyePACS accuracy from literature.\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from sklearn.model_selection import train_test_split\n",
    "\n",
    "# ─── CONFIG ────────────────────────────────────────────────────────────────\n",
    "BASE_DIR = \"/drive2/Kuntal/Pysindy-experiment\"\n",
    "OUTPUT_DIR = f\"{BASE_DIR}/conformal_boundary/cross_dataset_evaluation\"\n",
    "\n",
    "# Dataset paths\n",
    "APTOS_DATA_DIR = f\"{BASE_DIR}/aptos_theta_data\"\n",
    "EYEPACS_DATA_DIR = f\"{BASE_DIR}/eyepacs_theta_data\"\n",
    "M1_DATA_DIR = f\"{BASE_DIR}/M1-output\"\n",
    "M2_DATA_DIR = f\"{BASE_DIR}/M2-output\"\n",
    "\n",
    "# Create output directory\n",
    "os.makedirs(OUTPUT_DIR, exist_ok=True)\n",
    "\n",
    "# ─── MARD CALCULATION FUNCTION ─────────────────────────────────────────────\n",
    "def calculate_robust_mard(theta1, theta2, max_value=100.0):\n",
    "    \"\"\"\n",
    "    Calculate Mean Absolute Relative Difference with numerical stability improvements\n",
    "    \"\"\"\n",
    "    epsilon = 1e-6  # Larger epsilon to avoid extreme values\n",
    "    \n",
    "    # Flatten the theta arrays if they are not already flat\n",
    "    if theta1.ndim > 1:\n",
    "        theta1_flat = theta1.flatten()\n",
    "        theta2_flat = theta2.flatten()\n",
    "    else:\n",
    "        theta1_flat = theta1\n",
    "        theta2_flat = theta2\n",
    "    \n",
    "    # Calculate absolute relative differences with capping\n",
    "    abs_diff = np.abs(theta1_flat - theta2_flat)\n",
    "    denominator = np.abs(theta2_flat) + epsilon\n",
    "    rel_diff = abs_diff / denominator\n",
    "    \n",
    "    # Cap extreme values\n",
    "    rel_diff = np.minimum(rel_diff, max_value)\n",
    "    \n",
    "    # Return mean of absolute relative differences\n",
    "    return np.mean(rel_diff)\n",
    "\n",
    "def main():\n",
    "    # Load theta arrays from all datasets\n",
    "    print(\"Loading datasets...\")\n",
    "    eyepacs_thetas = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_all_thetas.npy\"), allow_pickle=True)\n",
    "    eyepacs_ids = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor1_thetas = np.load(os.path.join(M1_DATA_DIR, \"messidor_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor1_ids = np.load(os.path.join(M1_DATA_DIR, \"messidor_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor2_thetas = np.load(os.path.join(M2_DATA_DIR, \"messidor2_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor2_ids = np.load(os.path.join(M2_DATA_DIR, \"messidor2_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    aptos_thetas = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_all_thetas.npy\"), allow_pickle=True)\n",
    "    aptos_ids = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    # Combine APTOS, Messidor-1, and Messidor-2 into dataset D\n",
    "    combined_thetas = np.concatenate([aptos_thetas, messidor1_thetas, messidor2_thetas])\n",
    "    combined_ids = np.concatenate([aptos_ids, messidor1_ids, messidor2_ids])\n",
    "    \n",
    "    print(f\"Combined dataset D contains {len(combined_thetas)} samples:\")\n",
    "    print(f\"  - APTOS: {len(aptos_thetas)} samples\")\n",
    "    print(f\"  - Messidor-1: {len(messidor1_thetas)} samples\")\n",
    "    print(f\"  - Messidor-2: {len(messidor2_thetas)} samples\")\n",
    "    print(f\"  - EyePACS (to be evaluated): {len(eyepacs_thetas)} samples\")\n",
    "    \n",
    "    # Step 1: Calculate the median theta for the combined dataset D\n",
    "    print(\"\\nCalculating median theta for combined dataset D (APTOS + M1 + M2)...\")\n",
    "    combined_stacked = np.stack(combined_thetas)\n",
    "    combined_median_theta = np.median(combined_stacked, axis=0)\n",
    "    \n",
    "    # Step 2: Create train/calibration split for the combined dataset\n",
    "    print(\"Creating train/calibration split for conformal bounds...\")\n",
    "    combined_train, combined_calibration = train_test_split(\n",
    "        combined_thetas, test_size=0.4, random_state=42\n",
    "    )\n",
    "    \n",
    "    # Step 3: Calculate MARD values for the calibration set\n",
    "    print(\"Calculating calibration MARD values...\")\n",
    "    calibration_mard_values = []\n",
    "    for theta in combined_calibration:\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        calibration_mard_values.append(mard)\n",
    "    \n",
    "    calibration_mard_values = np.array(calibration_mard_values)\n",
    "    \n",
    "    # Step 4: Establish conformal bounds for the combined dataset\n",
    "    mean_mard = np.mean(calibration_mard_values)\n",
    "    std_mard = np.std(calibration_mard_values)\n",
    "    \n",
    "    # Calculate conformal boundaries, ensuring non-negative lower bound\n",
    "    lower_bound = max(0, mean_mard - 2 * std_mard)\n",
    "    upper_bound = mean_mard + 2 * std_mard\n",
    "    \n",
    "    print(f\"\\nCombined dataset D conformal bounds:\")\n",
    "    print(f\"  - Mean MARD: {mean_mard:.6f}\")\n",
    "    print(f\"  - Std MARD: {std_mard:.6f}\")\n",
    "    print(f\"  - Lower bound: {lower_bound:.6f}\")\n",
    "    print(f\"  - Upper bound: {upper_bound:.6f}\")\n",
    "    \n",
    "    # Step 5: Evaluate EyePACS against the combined dataset bounds\n",
    "    print(\"\\nEvaluating EyePACS against combined dataset bounds...\")\n",
    "    eyepacs_mard_values = []\n",
    "    eyepacs_in_domain_flags = []\n",
    "    eyepacs_outside_indices = []\n",
    "    \n",
    "    for i, theta in enumerate(eyepacs_thetas):\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        eyepacs_mard_values.append(mard)\n",
    "        \n",
    "        # Check if this sample falls within the combined dataset bounds\n",
    "        in_domain = lower_bound <= mard <= upper_bound\n",
    "        eyepacs_in_domain_flags.append(in_domain)\n",
    "        \n",
    "        # Store indices of samples that fall outside bounds\n",
    "        if not in_domain:\n",
    "            eyepacs_outside_indices.append(i)\n",
    "    \n",
    "    # Calculate statistics\n",
    "    total_eyepacs = len(eyepacs_thetas)\n",
    "    outside_count = sum(not flag for flag in eyepacs_in_domain_flags)\n",
    "    percentage_outside = (outside_count / total_eyepacs) * 100\n",
    "    \n",
    "    print(f\"\\nEYEPACS EVALUATION AGAINST COMBINED DATASET BOUNDS:\")\n",
    "    print(f\"  - Total EyePACS samples: {total_eyepacs}\")\n",
    "    print(f\"  - EyePACS samples outside combined bounds: {outside_count}\")\n",
    "    print(f\"  - Percentage outside: {percentage_outside:.2f}%\")\n",
    "    \n",
    "    # Save MARD values for EyePACS points outside the combined bounds\n",
    "    if outside_count > 0:\n",
    "        print(\"\\nEyePACS points outside combined dataset bounds:\")\n",
    "        outside_mards = [eyepacs_mard_values[i] for i in eyepacs_outside_indices]\n",
    "        outside_ids = [eyepacs_ids[i] for i in eyepacs_outside_indices]\n",
    "        \n",
    "        for i, (idx, mard) in enumerate(zip(outside_ids, outside_mards)):\n",
    "            if i < 10:  # Only print first 10 to avoid excessive output\n",
    "                print(f\"  Point {i+1} (ID: {idx}): MARD = {mard:.6f}\")\n",
    "            if i == 10:\n",
    "                print(f\"  ... and {outside_count - 10} more\")\n",
    "        \n",
    "        # Save to CSV\n",
    "        outside_df = pd.DataFrame({\n",
    "            'id': outside_ids,\n",
    "            'mard': outside_mards\n",
    "        })\n",
    "        outside_df.to_csv(os.path.join(OUTPUT_DIR, \"eyepacs_points_outside_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save all results to CSV\n",
    "    results_dict = {\n",
    "        'id': eyepacs_ids,\n",
    "        'mard': eyepacs_mard_values,\n",
    "        'in_domain': eyepacs_in_domain_flags\n",
    "    }\n",
    "    \n",
    "    results_df = pd.DataFrame(results_dict)\n",
    "    results_df.to_csv(os.path.join(OUTPUT_DIR, \"eyepacs_evaluation_against_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save combined dataset bounds for reference\n",
    "    with open(os.path.join(OUTPUT_DIR, \"combined_aptos_m1_m2_bounds.txt\"), 'w') as f:\n",
    "        f.write(f\"Mean MARD: {mean_mard}\\n\")\n",
    "        f.write(f\"Std MARD: {std_mard}\\n\")\n",
    "        f.write(f\"Lower bound (max(0, mean-2std)): {lower_bound}\\n\")\n",
    "        f.write(f\"Upper bound (mean+2std): {upper_bound}\\n\")\n",
    "        f.write(f\"Percentage of EyePACS samples outside bounds: {percentage_outside:.2f}%\\n\")\n",
    "    \n",
    "    # Save the combined median theta for future use\n",
    "    np.save(os.path.join(OUTPUT_DIR, \"combined_aptos_m1_m2_median_theta.npy\"), combined_median_theta)\n",
    "    \n",
    "    # Save a summary of all datasts' performance for future comparison\n",
    "    summary_data = {\n",
    "        'dataset': ['EyePACS'],\n",
    "        'total_samples': [total_eyepacs],\n",
    "        'outside_count': [outside_count],\n",
    "        'percentage_outside': [percentage_outside]\n",
    "    }\n",
    "    \n",
    "    # Check if previous summary file exists, and if so, append to it\n",
    "    summary_path = os.path.join(OUTPUT_DIR, \"cross_dataset_evaluation_summary.csv\")\n",
    "    if os.path.exists(summary_path):\n",
    "        existing_summary = pd.read_csv(summary_path)\n",
    "        updated_summary = pd.concat([existing_summary, pd.DataFrame(summary_data)])\n",
    "        updated_summary.to_csv(summary_path, index=False)\n",
    "    else:\n",
    "        pd.DataFrame(summary_data).to_csv(summary_path, index=False)\n",
    "    \n",
    "    print(f\"\\nResults saved to {OUTPUT_DIR}\")\n",
    "    print(f\"Point of note: The percentage outside ({percentage_outside:.2f}%) should be compared with EyePACS accuracy from literature.\")\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    main()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading datasets...\n",
      "Combined dataset D contains 39841 samples:\n",
      "  - APTOS: 3662 samples\n",
      "  - EyePACS: 35122 samples\n",
      "  - Messidor-2: 1057 samples\n",
      "  - Messidor-1 (to be evaluated): 1200 samples\n",
      "\n",
      "Calculating median theta for combined dataset D (APTOS + EyePACS + M2)...\n",
      "Creating train/calibration split for conformal bounds...\n",
      "Calculating calibration MARD values...\n",
      "\n",
      "Combined dataset D conformal bounds:\n",
      "  - Mean MARD: 38.588328\n",
      "  - Std MARD: 10.811252\n",
      "  - Lower bound: 16.965824\n",
      "  - Upper bound: 60.210832\n",
      "\n",
      "Evaluating Messidor-1 against combined dataset bounds...\n",
      "\n",
      "MESSIDOR-1 EVALUATION AGAINST COMBINED DATASET BOUNDS:\n",
      "  - Total Messidor-1 samples: 1200\n",
      "  - Messidor-1 samples outside combined bounds: 5\n",
      "  - Percentage outside: 0.42%\n",
      "\n",
      "Messidor-1 points outside combined dataset bounds:\n",
      "  Point 1 (ID: 20051021_39314_0100_PP.tif): MARD = 63.534097\n",
      "  Point 2 (ID: 20060523_49269_0100_PP.tif): MARD = 60.283263\n",
      "  Point 3 (ID: 20060530_55203_0100_PP.tif): MARD = 67.182082\n",
      "  Point 4 (ID: 20060530_55816_0100_PP.tif): MARD = 66.802287\n",
      "  Point 5 (ID: 20051202_55742_0400_PP.tif): MARD = 60.355726\n",
      "\n",
      "Results saved to /drive2/Kuntal/Pysindy-experiment/conformal_boundary/cross_dataset_evaluation\n",
      "Point of note: The percentage outside (0.42%) should be compared with Messidor-1 accuracy from literature.\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from sklearn.model_selection import train_test_split\n",
    "\n",
    "# ─── CONFIG ────────────────────────────────────────────────────────────────\n",
    "BASE_DIR = \"/drive2/Kuntal/Pysindy-experiment\"\n",
    "OUTPUT_DIR = f\"{BASE_DIR}/conformal_boundary/cross_dataset_evaluation\"\n",
    "\n",
    "# Dataset paths\n",
    "APTOS_DATA_DIR = f\"{BASE_DIR}/aptos_theta_data\"\n",
    "EYEPACS_DATA_DIR = f\"{BASE_DIR}/eyepacs_theta_data\"\n",
    "M1_DATA_DIR = f\"{BASE_DIR}/M1-output\"\n",
    "M2_DATA_DIR = f\"{BASE_DIR}/M2-output\"\n",
    "\n",
    "# Create output directory\n",
    "os.makedirs(OUTPUT_DIR, exist_ok=True)\n",
    "\n",
    "# ─── MARD CALCULATION FUNCTION ─────────────────────────────────────────────\n",
    "def calculate_robust_mard(theta1, theta2, max_value=100.0):\n",
    "    \"\"\"\n",
    "    Calculate Mean Absolute Relative Difference with numerical stability improvements\n",
    "    \"\"\"\n",
    "    epsilon = 1e-6  # Larger epsilon to avoid extreme values\n",
    "    \n",
    "    # Flatten the theta arrays if they are not already flat\n",
    "    if theta1.ndim > 1:\n",
    "        theta1_flat = theta1.flatten()\n",
    "        theta2_flat = theta2.flatten()\n",
    "    else:\n",
    "        theta1_flat = theta1\n",
    "        theta2_flat = theta2\n",
    "    \n",
    "    # Calculate absolute relative differences with capping\n",
    "    abs_diff = np.abs(theta1_flat - theta2_flat)\n",
    "    denominator = np.abs(theta2_flat) + epsilon\n",
    "    rel_diff = abs_diff / denominator\n",
    "    \n",
    "    # Cap extreme values\n",
    "    rel_diff = np.minimum(rel_diff, max_value)\n",
    "    \n",
    "    # Return mean of absolute relative differences\n",
    "    return np.mean(rel_diff)\n",
    "\n",
    "def main():\n",
    "    # Load theta arrays from all datasets\n",
    "    print(\"Loading datasets...\")\n",
    "    eyepacs_thetas = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_all_thetas.npy\"), allow_pickle=True)\n",
    "    eyepacs_ids = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor1_thetas = np.load(os.path.join(M1_DATA_DIR, \"messidor_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor1_ids = np.load(os.path.join(M1_DATA_DIR, \"messidor_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor2_thetas = np.load(os.path.join(M2_DATA_DIR, \"messidor2_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor2_ids = np.load(os.path.join(M2_DATA_DIR, \"messidor2_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    aptos_thetas = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_all_thetas.npy\"), allow_pickle=True)\n",
    "    aptos_ids = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    # Combine APTOS, EyePACS, and Messidor-2 into dataset D\n",
    "    combined_thetas = np.concatenate([aptos_thetas, eyepacs_thetas, messidor2_thetas])\n",
    "    combined_ids = np.concatenate([aptos_ids, eyepacs_ids, messidor2_ids])\n",
    "    \n",
    "    print(f\"Combined dataset D contains {len(combined_thetas)} samples:\")\n",
    "    print(f\"  - APTOS: {len(aptos_thetas)} samples\")\n",
    "    print(f\"  - EyePACS: {len(eyepacs_thetas)} samples\")\n",
    "    print(f\"  - Messidor-2: {len(messidor2_thetas)} samples\")\n",
    "    print(f\"  - Messidor-1 (to be evaluated): {len(messidor1_thetas)} samples\")\n",
    "    \n",
    "    # Step 1: Calculate the median theta for the combined dataset D\n",
    "    print(\"\\nCalculating median theta for combined dataset D (APTOS + EyePACS + M2)...\")\n",
    "    combined_stacked = np.stack(combined_thetas)\n",
    "    combined_median_theta = np.median(combined_stacked, axis=0)\n",
    "    \n",
    "    # Step 2: Create train/calibration split for the combined dataset\n",
    "    print(\"Creating train/calibration split for conformal bounds...\")\n",
    "    combined_train, combined_calibration = train_test_split(\n",
    "        combined_thetas, test_size=0.4, random_state=42\n",
    "    )\n",
    "    \n",
    "    # Step 3: Calculate MARD values for the calibration set\n",
    "    print(\"Calculating calibration MARD values...\")\n",
    "    calibration_mard_values = []\n",
    "    for theta in combined_calibration:\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        calibration_mard_values.append(mard)\n",
    "    \n",
    "    calibration_mard_values = np.array(calibration_mard_values)\n",
    "    \n",
    "    # Step 4: Establish conformal bounds for the combined dataset\n",
    "    mean_mard = np.mean(calibration_mard_values)\n",
    "    std_mard = np.std(calibration_mard_values)\n",
    "    \n",
    "    # Calculate conformal boundaries, ensuring non-negative lower bound\n",
    "    lower_bound = max(0, mean_mard - 2 * std_mard)\n",
    "    upper_bound = mean_mard + 2 * std_mard\n",
    "    \n",
    "    print(f\"\\nCombined dataset D conformal bounds:\")\n",
    "    print(f\"  - Mean MARD: {mean_mard:.6f}\")\n",
    "    print(f\"  - Std MARD: {std_mard:.6f}\")\n",
    "    print(f\"  - Lower bound: {lower_bound:.6f}\")\n",
    "    print(f\"  - Upper bound: {upper_bound:.6f}\")\n",
    "    \n",
    "    # Step 5: Evaluate Messidor-1 against the combined dataset bounds\n",
    "    print(\"\\nEvaluating Messidor-1 against combined dataset bounds...\")\n",
    "    m1_mard_values = []\n",
    "    m1_in_domain_flags = []\n",
    "    m1_outside_indices = []\n",
    "    \n",
    "    for i, theta in enumerate(messidor1_thetas):\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        m1_mard_values.append(mard)\n",
    "        \n",
    "        # Check if this sample falls within the combined dataset bounds\n",
    "        in_domain = lower_bound <= mard <= upper_bound\n",
    "        m1_in_domain_flags.append(in_domain)\n",
    "        \n",
    "        # Store indices of samples that fall outside bounds\n",
    "        if not in_domain:\n",
    "            m1_outside_indices.append(i)\n",
    "    \n",
    "    # Calculate statistics\n",
    "    total_m1 = len(messidor1_thetas)\n",
    "    outside_count = sum(not flag for flag in m1_in_domain_flags)\n",
    "    percentage_outside = (outside_count / total_m1) * 100\n",
    "    \n",
    "    print(f\"\\nMESSIDOR-1 EVALUATION AGAINST COMBINED DATASET BOUNDS:\")\n",
    "    print(f\"  - Total Messidor-1 samples: {total_m1}\")\n",
    "    print(f\"  - Messidor-1 samples outside combined bounds: {outside_count}\")\n",
    "    print(f\"  - Percentage outside: {percentage_outside:.2f}%\")\n",
    "    \n",
    "    # Save MARD values for Messidor-1 points outside the combined bounds\n",
    "    if outside_count > 0:\n",
    "        print(\"\\nMessidor-1 points outside combined dataset bounds:\")\n",
    "        outside_mards = [m1_mard_values[i] for i in m1_outside_indices]\n",
    "        outside_ids = [messidor1_ids[i] for i in m1_outside_indices]\n",
    "        \n",
    "        for i, (idx, mard) in enumerate(zip(outside_ids, outside_mards)):\n",
    "            if i < 10:  # Only print first 10 to avoid excessive output\n",
    "                print(f\"  Point {i+1} (ID: {idx}): MARD = {mard:.6f}\")\n",
    "            if i == 10:\n",
    "                print(f\"  ... and {outside_count - 10} more\")\n",
    "        \n",
    "        # Save to CSV\n",
    "        outside_df = pd.DataFrame({\n",
    "            'id': outside_ids,\n",
    "            'mard': outside_mards\n",
    "        })\n",
    "        outside_df.to_csv(os.path.join(OUTPUT_DIR, \"messidor1_points_outside_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save all results to CSV\n",
    "    results_dict = {\n",
    "        'id': messidor1_ids,\n",
    "        'mard': m1_mard_values,\n",
    "        'in_domain': m1_in_domain_flags\n",
    "    }\n",
    "    \n",
    "    results_df = pd.DataFrame(results_dict)\n",
    "    results_df.to_csv(os.path.join(OUTPUT_DIR, \"messidor1_evaluation_against_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save combined dataset bounds for reference\n",
    "    with open(os.path.join(OUTPUT_DIR, \"combined_aptos_eyepacs_m2_bounds.txt\"), 'w') as f:\n",
    "        f.write(f\"Mean MARD: {mean_mard}\\n\")\n",
    "        f.write(f\"Std MARD: {std_mard}\\n\")\n",
    "        f.write(f\"Lower bound (max(0, mean-2std)): {lower_bound}\\n\")\n",
    "        f.write(f\"Upper bound (mean+2std): {upper_bound}\\n\")\n",
    "        f.write(f\"Percentage of Messidor-1 samples outside bounds: {percentage_outside:.2f}%\\n\")\n",
    "    \n",
    "    # Save the combined median theta for future use\n",
    "    np.save(os.path.join(OUTPUT_DIR, \"combined_aptos_eyepacs_m2_median_theta.npy\"), combined_median_theta)\n",
    "    \n",
    "    # Save a summary of all datasets' performance for future comparison\n",
    "    summary_data = {\n",
    "        'dataset': ['Messidor-1'],\n",
    "        'total_samples': [total_m1],\n",
    "        'outside_count': [outside_count],\n",
    "        'percentage_outside': [percentage_outside]\n",
    "    }\n",
    "    \n",
    "    # Check if previous summary file exists, and if so, append to it\n",
    "    summary_path = os.path.join(OUTPUT_DIR, \"cross_dataset_evaluation_summary.csv\")\n",
    "    if os.path.exists(summary_path):\n",
    "        existing_summary = pd.read_csv(summary_path)\n",
    "        updated_summary = pd.concat([existing_summary, pd.DataFrame(summary_data)])\n",
    "        updated_summary.to_csv(summary_path, index=False)\n",
    "    else:\n",
    "        pd.DataFrame(summary_data).to_csv(summary_path, index=False)\n",
    "    \n",
    "    print(f\"\\nResults saved to {OUTPUT_DIR}\")\n",
    "    print(f\"Point of note: The percentage outside ({percentage_outside:.2f}%) should be compared with Messidor-1 accuracy from literature.\")\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    main()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Loading datasets...\n",
      "Combined dataset D contains 39984 samples:\n",
      "  - APTOS: 3662 samples\n",
      "  - EyePACS: 35122 samples\n",
      "  - Messidor-1: 1200 samples\n",
      "  - Messidor-2 (to be evaluated): 1057 samples\n",
      "\n",
      "Calculating median theta for combined dataset D (APTOS + EyePACS + M1)...\n",
      "Creating train/calibration split for conformal bounds...\n",
      "Calculating calibration MARD values...\n",
      "\n",
      "Combined dataset D conformal bounds:\n",
      "  - Mean MARD: 38.739620\n",
      "  - Std MARD: 10.755412\n",
      "  - Lower bound: 17.228796\n",
      "  - Upper bound: 60.250444\n",
      "\n",
      "Evaluating Messidor-2 against combined dataset bounds...\n",
      "\n",
      "MESSIDOR-2 EVALUATION AGAINST COMBINED DATASET BOUNDS:\n",
      "  - Total Messidor-2 samples: 1057\n",
      "  - Messidor-2 samples outside combined bounds: 5\n",
      "  - Percentage outside: 0.47%\n",
      "\n",
      "Messidor-2 points outside combined dataset bounds:\n",
      "  Point 1 (ID: 20051021_39314_0100_PP.png): MARD = 63.663860\n",
      "  Point 2 (ID: 20051202_55742_0400_PP.png): MARD = 60.547950\n",
      "  Point 3 (ID: 20060523_49269_0100_PP.png): MARD = 60.550895\n",
      "  Point 4 (ID: 20060530_55203_0100_PP.png): MARD = 67.237804\n",
      "  Point 5 (ID: 20060530_55816_0100_PP.png): MARD = 66.814779\n",
      "\n",
      "Results saved to /drive2/Kuntal/Pysindy-experiment/conformal_boundary/cross_dataset_evaluation\n",
      "Point of note: The percentage outside (0.47%) should be compared with Messidor-2 accuracy from literature.\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from sklearn.model_selection import train_test_split\n",
    "\n",
    "# ─── CONFIG ────────────────────────────────────────────────────────────────\n",
    "BASE_DIR = \"/drive2/Kuntal/Pysindy-experiment\"\n",
    "OUTPUT_DIR = f\"{BASE_DIR}/conformal_boundary/cross_dataset_evaluation\"\n",
    "\n",
    "# Dataset paths\n",
    "APTOS_DATA_DIR = f\"{BASE_DIR}/aptos_theta_data\"\n",
    "EYEPACS_DATA_DIR = f\"{BASE_DIR}/eyepacs_theta_data\"\n",
    "M1_DATA_DIR = f\"{BASE_DIR}/M1-output\"\n",
    "M2_DATA_DIR = f\"{BASE_DIR}/M2-output\"\n",
    "\n",
    "# Create output directory\n",
    "os.makedirs(OUTPUT_DIR, exist_ok=True)\n",
    "\n",
    "# ─── MARD CALCULATION FUNCTION ─────────────────────────────────────────────\n",
    "def calculate_robust_mard(theta1, theta2, max_value=100.0):\n",
    "    \"\"\"\n",
    "    Calculate Mean Absolute Relative Difference with numerical stability improvements\n",
    "    \"\"\"\n",
    "    epsilon = 1e-6  # Larger epsilon to avoid extreme values\n",
    "    \n",
    "    # Flatten the theta arrays if they are not already flat\n",
    "    if theta1.ndim > 1:\n",
    "        theta1_flat = theta1.flatten()\n",
    "        theta2_flat = theta2.flatten()\n",
    "    else:\n",
    "        theta1_flat = theta1\n",
    "        theta2_flat = theta2\n",
    "    \n",
    "    # Calculate absolute relative differences with capping\n",
    "    abs_diff = np.abs(theta1_flat - theta2_flat)\n",
    "    denominator = np.abs(theta2_flat) + epsilon\n",
    "    rel_diff = abs_diff / denominator\n",
    "    \n",
    "    # Cap extreme values\n",
    "    rel_diff = np.minimum(rel_diff, max_value)\n",
    "    \n",
    "    # Return mean of absolute relative differences\n",
    "    return np.mean(rel_diff)\n",
    "\n",
    "def main():\n",
    "    # Load theta arrays from all datasets\n",
    "    print(\"Loading datasets...\")\n",
    "    eyepacs_thetas = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_all_thetas.npy\"), allow_pickle=True)\n",
    "    eyepacs_ids = np.load(os.path.join(EYEPACS_DATA_DIR, \"eyepacs_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor1_thetas = np.load(os.path.join(M1_DATA_DIR, \"messidor_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor1_ids = np.load(os.path.join(M1_DATA_DIR, \"messidor_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    messidor2_thetas = np.load(os.path.join(M2_DATA_DIR, \"messidor2_all_thetas.npy\"), allow_pickle=True)\n",
    "    messidor2_ids = np.load(os.path.join(M2_DATA_DIR, \"messidor2_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    aptos_thetas = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_all_thetas.npy\"), allow_pickle=True)\n",
    "    aptos_ids = np.load(os.path.join(APTOS_DATA_DIR, \"aptos_theta_ids.npy\"), allow_pickle=True)\n",
    "    \n",
    "    # Combine APTOS, EyePACS, and Messidor-1 into dataset D\n",
    "    combined_thetas = np.concatenate([aptos_thetas, eyepacs_thetas, messidor1_thetas])\n",
    "    combined_ids = np.concatenate([aptos_ids, eyepacs_ids, messidor1_ids])\n",
    "    \n",
    "    print(f\"Combined dataset D contains {len(combined_thetas)} samples:\")\n",
    "    print(f\"  - APTOS: {len(aptos_thetas)} samples\")\n",
    "    print(f\"  - EyePACS: {len(eyepacs_thetas)} samples\")\n",
    "    print(f\"  - Messidor-1: {len(messidor1_thetas)} samples\")\n",
    "    print(f\"  - Messidor-2 (to be evaluated): {len(messidor2_thetas)} samples\")\n",
    "    \n",
    "    # Step 1: Calculate the median theta for the combined dataset D\n",
    "    print(\"\\nCalculating median theta for combined dataset D (APTOS + EyePACS + M1)...\")\n",
    "    combined_stacked = np.stack(combined_thetas)\n",
    "    combined_median_theta = np.median(combined_stacked, axis=0)\n",
    "    \n",
    "    # Step 2: Create train/calibration split for the combined dataset\n",
    "    print(\"Creating train/calibration split for conformal bounds...\")\n",
    "    combined_train, combined_calibration = train_test_split(\n",
    "        combined_thetas, test_size=0.4, random_state=42\n",
    "    )\n",
    "    \n",
    "    # Step 3: Calculate MARD values for the calibration set\n",
    "    print(\"Calculating calibration MARD values...\")\n",
    "    calibration_mard_values = []\n",
    "    for theta in combined_calibration:\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        calibration_mard_values.append(mard)\n",
    "    \n",
    "    calibration_mard_values = np.array(calibration_mard_values)\n",
    "    \n",
    "    # Step 4: Establish conformal bounds for the combined dataset\n",
    "    mean_mard = np.mean(calibration_mard_values)\n",
    "    std_mard = np.std(calibration_mard_values)\n",
    "    \n",
    "    # Calculate conformal boundaries, ensuring non-negative lower bound\n",
    "    lower_bound = max(0, mean_mard - 2 * std_mard)\n",
    "    upper_bound = mean_mard + 2 * std_mard\n",
    "    \n",
    "    print(f\"\\nCombined dataset D conformal bounds:\")\n",
    "    print(f\"  - Mean MARD: {mean_mard:.6f}\")\n",
    "    print(f\"  - Std MARD: {std_mard:.6f}\")\n",
    "    print(f\"  - Lower bound: {lower_bound:.6f}\")\n",
    "    print(f\"  - Upper bound: {upper_bound:.6f}\")\n",
    "    \n",
    "    # Step 5: Evaluate Messidor-2 against the combined dataset bounds\n",
    "    print(\"\\nEvaluating Messidor-2 against combined dataset bounds...\")\n",
    "    m2_mard_values = []\n",
    "    m2_in_domain_flags = []\n",
    "    m2_outside_indices = []\n",
    "    \n",
    "    for i, theta in enumerate(messidor2_thetas):\n",
    "        mard = calculate_robust_mard(theta, combined_median_theta)\n",
    "        m2_mard_values.append(mard)\n",
    "        \n",
    "        # Check if this sample falls within the combined dataset bounds\n",
    "        in_domain = lower_bound <= mard <= upper_bound\n",
    "        m2_in_domain_flags.append(in_domain)\n",
    "        \n",
    "        # Store indices of samples that fall outside bounds\n",
    "        if not in_domain:\n",
    "            m2_outside_indices.append(i)\n",
    "    \n",
    "    # Calculate statistics\n",
    "    total_m2 = len(messidor2_thetas)\n",
    "    outside_count = sum(not flag for flag in m2_in_domain_flags)\n",
    "    percentage_outside = (outside_count / total_m2) * 100\n",
    "    \n",
    "    print(f\"\\nMESSIDOR-2 EVALUATION AGAINST COMBINED DATASET BOUNDS:\")\n",
    "    print(f\"  - Total Messidor-2 samples: {total_m2}\")\n",
    "    print(f\"  - Messidor-2 samples outside combined bounds: {outside_count}\")\n",
    "    print(f\"  - Percentage outside: {percentage_outside:.2f}%\")\n",
    "    \n",
    "    # Save MARD values for Messidor-2 points outside the combined bounds\n",
    "    if outside_count > 0:\n",
    "        print(\"\\nMessidor-2 points outside combined dataset bounds:\")\n",
    "        outside_mards = [m2_mard_values[i] for i in m2_outside_indices]\n",
    "        outside_ids = [messidor2_ids[i] for i in m2_outside_indices]\n",
    "        \n",
    "        for i, (idx, mard) in enumerate(zip(outside_ids, outside_mards)):\n",
    "            if i < 10:  # Only print first 10 to avoid excessive output\n",
    "                print(f\"  Point {i+1} (ID: {idx}): MARD = {mard:.6f}\")\n",
    "            if i == 10:\n",
    "                print(f\"  ... and {outside_count - 10} more\")\n",
    "        \n",
    "        # Save to CSV\n",
    "        outside_df = pd.DataFrame({\n",
    "            'id': outside_ids,\n",
    "            'mard': outside_mards\n",
    "        })\n",
    "        outside_df.to_csv(os.path.join(OUTPUT_DIR, \"messidor2_points_outside_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save all results to CSV\n",
    "    results_dict = {\n",
    "        'id': messidor2_ids,\n",
    "        'mard': m2_mard_values,\n",
    "        'in_domain': m2_in_domain_flags\n",
    "    }\n",
    "    \n",
    "    results_df = pd.DataFrame(results_dict)\n",
    "    results_df.to_csv(os.path.join(OUTPUT_DIR, \"messidor2_evaluation_against_combined_bounds.csv\"), index=False)\n",
    "    \n",
    "    # Save combined dataset bounds for reference\n",
    "    with open(os.path.join(OUTPUT_DIR, \"combined_aptos_eyepacs_m1_bounds.txt\"), 'w') as f:\n",
    "        f.write(f\"Mean MARD: {mean_mard}\\n\")\n",
    "        f.write(f\"Std MARD: {std_mard}\\n\")\n",
    "        f.write(f\"Lower bound (max(0, mean-2std)): {lower_bound}\\n\")\n",
    "        f.write(f\"Upper bound (mean+2std): {upper_bound}\\n\")\n",
    "        f.write(f\"Percentage of Messidor-2 samples outside bounds: {percentage_outside:.2f}%\\n\")\n",
    "    \n",
    "    # Save the combined median theta for future use\n",
    "    np.save(os.path.join(OUTPUT_DIR, \"combined_aptos_eyepacs_m1_median_theta.npy\"), combined_median_theta)\n",
    "    \n",
    "    # Save a summary of all datasets' performance for future comparison\n",
    "    summary_data = {\n",
    "        'dataset': ['Messidor-2'],\n",
    "        'total_samples': [total_m2],\n",
    "        'outside_count': [outside_count],\n",
    "        'percentage_outside': [percentage_outside]\n",
    "    }\n",
    "    \n",
    "    # Check if previous summary file exists, and if so, append to it\n",
    "    summary_path = os.path.join(OUTPUT_DIR, \"cross_dataset_evaluation_summary.csv\")\n",
    "    if os.path.exists(summary_path):\n",
    "        existing_summary = pd.read_csv(summary_path)\n",
    "        updated_summary = pd.concat([existing_summary, pd.DataFrame(summary_data)])\n",
    "        updated_summary.to_csv(summary_path, index=False)\n",
    "    else:\n",
    "        pd.DataFrame(summary_data).to_csv(summary_path, index=False)\n",
    "    \n",
    "    print(f\"\\nResults saved to {OUTPUT_DIR}\")\n",
    "    print(f\"Point of note: The percentage outside ({percentage_outside:.2f}%) should be compared with Messidor-2 accuracy from literature.\")\n",
    "\n",
    "if __name__ == \"__main__\":\n",
    "    main()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
