{
    "diabetes_readmission": {
      "causal": {
        "metrics": {
          "id_test": [0.5838581758805692, 0.5838581758805692, 0.5390716118497784, 0.5838581758805692, 0.5838581758805692],
          "ood_test": [0.5061607283001098, 0.5061607283001098, 0.5148328362894365, 0.5061607283001098, 0.5061607283001098],
          "ood_validation": [0.4936440677966102, 0.4936440677966102, 0.5074152542372882, 0.4936440677966102, 0.4936440677966102],
          "validation": [0.5781614559029398, 0.5781614559029398, 0.5401306579561362, 0.5781614559029398, 0.5781614559029398],
          "train": [0.5757699486700887, 0.5757699486700887, 0.5417347176854876, 0.5757699486700887, 0.5757699486700887]
        },
        "train_shifts": {
          "informativeness": [0.016108566162679066, 0.007327715096787075, 0.025988259154460368, 0.026583422616086042, 0.018450650257634427],
          "invariance": [0.3282168223850304, 0.23299134870413565, 0.30551563673256066, 0.36245430322212197, 0.3232534494859635],
          "label_shift": [0.003375592508434266, -0.0031805683642138712, 0.03056067027352713, -0.009696242617215522, 0.02263980414945888],
          "latent_covariate_shift": [0.34940142352513076, 0.26449467777265195, 0.31244108273213095, 0.38343962513825747, 0.33114553454493423],
          "concept_shift": [0.23541236822028438, 0.2129245109820915, 0.24441127956486647, 0.2594279176894181, 0.2041104637251856],
          "residual": [0.022821989500404632, 0.01914462470706447, 0.05351741187111222, 0.01766116493016624, 0.0189634589477612],
          "overall": [-0.11213951062360046, -0.10411778474917194, -0.13099173436253636, -0.11514716150932926, -0.08730209594850477]
        },
        "test_shifts": {
          "informativeness": [0.015895192638073728, 0.020059336422862544, 0.027709064948070718, 0.006601629275459808, 0.017104770717058706],
          "invariance": [0.0013680332236263094, 0.0019034080721954485, 0.0020099438786653594, 0.00014958456458690356, 0.00224436999663059],
          "label_shift": [-0.006770410690669257, 0.0007466110447008205, -0.0018651941118563787, 0.027071814301264048, 0.010135774381306023],
          "latent_covariate_shift": [0.001074251809665984, 0.0010588768978909994, 0.0023352618227570746, 0.0012750759809887508, 0.001978953073132122],
          "concept_shift": [0.05850892675011577, 0.07030527954938783, 0.06050243454170087, 0.05640628172323983, 0.05358855150813848],
          "residual": [0.02427198401875249, 0.01684482282186634, 0.013650371073479373, 0.0138282706558665, 0.016143218187510352],
          "overall": [-0.04116335080805143, -0.031987086238499524, -0.016962461480141425, -0.02133112938319366, -0.020897544495617107]
        }
      },
      "arguablycausal": {
        "metrics": {
          "id_test": [0.6300443200373221, 0.6251457895964544, 0.6300443200373221, 0.6251457895964544, 0.6300443200373221],
          "ood_test": [0.6007887301836446, 0.588526134044891, 0.6007887301836446, 0.588526134044891, 0.6007887301836446],
          "ood_validation": [0.5972810734463276, 0.5817443502824858, 0.5972810734463276, 0.5817443502824858, 0.5972810734463276],
          "validation": [0.6327578161455903, 0.6322911805879609, 0.6327578161455903, 0.6322911805879609, 0.6327578161455903],
          "train": [0.6300746616892208, 0.6260790947270182, 0.6300746616892208, 0.6260790947270182, 0.6300746616892208]
        },
        "train_shifts": {
          "informativeness": [0.0746577579410178, 0.05827706815971102, 0.0746577579410178, 0.05827706815971102, 0.05827706815971102],
          "invariance": [0.38423538407533425, 0.19677958745590315, 0.38423538407533425, 0.19677958745590315, 0.19677958745590315],
          "label_shift": [0.003375592508434266, 0.015734076376641568, 0.003375592508434266, 0.015734076376641568, 0.015734076376641568],
          "latent_covariate_shift": [0.43524056301367586, 0.23069245520521173, 0.43524056301367586, 0.23069245520521173, 0.23069245520521173],
          "concept_shift": [-0.003196091221786769, 0.0031029711040021514, -0.003196091221786769, 0.0031029711040021514, 0.0031029711040021514],
          "residual": [0.05930618648858875, 0.04881102018780926, 0.05930618648858875, 0.04881102018780926, 0.04881102018780926],
          "overall": [0.044140002786710375, 0.03273803448287576, 0.044140002786710375, 0.03273803448287576, 0.03273803448287576]
        },
        "test_shifts": {
          "informativeness": [0.0775486274261339, 0.06263627806356624, 0.0775486274261339, 0.06263627806356624, 0.06263627806356624],
          "invariance": [0.00010820212806625991, 8.415721071987506e-05, 0.00010820212806625991, 8.415721071987506e-05, 8.415721071987506e-05],
          "label_shift": [-0.009544186325330216, 0.0009818828414588172, -0.009544186325330216, 0.0009818828414588172, 0.0009818828414588172],
          "latent_covariate_shift": [0.0, -2.40449173489476e-05, 0.0, -2.40449173489476e-05, -2.40449173489476e-05],
          "concept_shift": [0.002272244689400748, 0.0009137068592300567, 0.002272244689400748, 0.0009137068592300567, 0.0009137068592300567],
          "residual": [0.04886681280265805, 0.042185859311475164, 0.04886681280265805, 0.042185859311475164, 0.042185859311475164],
          "overall": [0.02271949805207725, 0.02043040567917103, 0.02271949805207725, 0.02043040567917103, 0.02043040567917103]
        }
      },
      "all": {
        "metrics": {
          "id_test": [0.423839514812223, 0.41614182411943085, 0.6116165150454863, 0.5838581758805692, 0.5250758105901563],
          "ood_test": [0.4795557997174698, 0.4938392716998901, 0.552837074242662, 0.5061607283001098, 0.5448909119447497],
          "ood_validation": [0.4901129943502825, 0.5063559322033898, 0.548728813559322, 0.4936440677966102, 0.5388418079096046],
          "validation": [0.4265048996733551, 0.4218385440970602, 0.6185254316378908, 0.5781614559029398, 0.5361642557162856],
          "train": [0.4254841343910406, 0.4242300513299113, 0.6105634624358376, 0.5757699486700887, 0.5275898273448437]
        },
        "train_shifts": {
          "informativeness": [0.05655232337662966, 0.04867149443251885, 0.05350227651860848, 0.06115343090868404, 0.06277789291764539],
          "invariance": [0.40179438446746063, 0.32886613279028737, 0.7611043874623891, 0.4570353874513053, 0.7129544199306392],
          "label_shift": [0.003375592508434266, -0.0031805683642138712, 0.03056067027352713, -0.009696242617215522, -0.005975659725125663],
          "latent_covariate_shift": [0.4378070326264794, 0.3416773637551988, 0.7166906482495378, 0.4897513677525412, 0.7616273144985475],
          "concept_shift": [0.00850924695819596, 0.008000131476263909, 0.00229875232650786, 0.017468185424531917, -0.008504906207840047],
          "residual": [0.0647119659381701, 0.04268569885765858, 0.03482506382273122, 0.053260040964021434, 0.07057734525539854],
          "overall": [0.007279854293088112, 0.006801061137077097, 0.010601302062961282, 0.010669166074406856, 0.01780161818755817]
        },
        "test_shifts": {
          "informativeness": [0.054642526057281655, 0.045657124126912384, 0.0670924729505627, 0.06992279552056771, 0.07828738933301808],
          "invariance": [8.415721071987506e-05, 0.005049432643110976, 0.019151776667802323, 1.1211992763352213e-15, 0.0015508971689569865],
          "label_shift": [-0.006770410690669257, 0.0007466110447008205, -0.0018651941118563787, 0.010976329636563498, -0.009470196352610684],
          "latent_covariate_shift": [-9.617966939322766e-05, -0.0001442695040885601, 0.0, 0.0, 0.0],
          "concept_shift": [-9.617966939210646e-05, -0.00014426950408839994, 4.805139755722377e-16, 1.6017132519074588e-16, 1.6017132519074588e-16],
          "residual": [0.05437891474240899, 0.04561897049308206, 0.062348234955542634, 0.06989693262237405, 0.07660210425201168],
          "overall": [-0.0031636726358224565, -0.002113257165374839, -0.0057642473948095255, 0.005514027716474773, -0.0038252616797775085]
        }
      }
    },


    "acsfoodstamps": {
        "causal": {
          "metrics": {
            "id_test": [0.8139466856590527, 0.8151167523019789, 0.8132217530650658, 0.8126875922063387, 0.8156381950450221],
            "ood_test": [0.7767707353001351, 0.7816604607389828, 0.7819878063750563, 0.7823765293178935, 0.7806784238307624],
            "ood_validation": [0.7889891364389615, 0.7900939053581293, 0.7913828024304916, 0.7923034431964647, 0.7900939053581293],
            "validation": [0.8168059318045964, 0.818739109974945, 0.8161445813778981, 0.8157884696096761, 0.81861192720058],
            "train": [0.8145935410433406, 0.8158939807763848, 0.813750957842224, 0.8136158265741203, 0.8157826962026524]
          },
          "train_shifts": {
            "informativeness": [0.06292680889843892, 0.0737103786123164, 0.07422964019152277, 0.0638053562656715, 0.08047899620698462],
            "invariance": [2.17360554357066, 0.7127199527079671, 2.365347756628525, 0.34129387729800953, 1.6237156297700388],
            "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.0019714875710719567, -0.0017492588395214394, 0.0035166859362696936],
            "latent_covariate_shift": [2.187927849685372, 0.8041070001875738, 2.4466133146889266, 0.38877755210236487, 1.753554066612402],
            "concept_shift": [0.11647203527055955, 0.10648791713310941, 0.11003123159370272, 0.05877097925211524, 0.10809010187776413],
            "residual": [0.04919885019344319, 0.0800142433147186, 0.07366010100529127, 0.07013826737349999, 0.07768192063662192],
            "overall": [-0.04024993710809826, -0.011143101211803619, -0.012827553794882991, -0.012851192751469148, 0.015429586020797095]
          },
          "test_shifts": {
            "informativeness": [0.07775577378274857, 0.08416191990343967, 0.07594309673275937, 0.07038994061813662, 0.08176588101668596],
            "invariance": [0.011361372335123677, 0.00032387702702761504, 0.0002874702890212285, 0.0011132737666612086, 0.00022913962733860189],
            "label_shift": [-0.0015958378682764684, -0.0014419506622654974, -0.0062578540267975175, -0.007654155868600332, 0.017383880625888287],
            "latent_covariate_shift": [7.274930641074643e-05, -0.00024253064831920314, 0.00011172814242665215, 0.0003106901259264884, 0.00040746013958792326],
            "concept_shift": [0.14284827521708285, 0.15267668602735113, 0.12994264129191824, 0.12842216922872712, 0.12773017802456146],
            "residual": [0.07129518277864821, 0.08212645050449563, 0.07902377039940711, 0.07328635830125046, 0.07785041338931732],
            "overall": [-0.07140577705293577, -0.07530705278353766, -0.07126879239930291, -0.07133587205214492, -0.051168520815843305]
          }
        },
        "arguablycausal": {
          "metrics": {
            "id_test": [0.8220735615811161, 0.8307091621305387, 0.8267538281528208, 0.8091010835834562, 0.8237396347357175],
            "ood_test": [0.7968206555096362, 0.8088096894308278, 0.8021809403003396, 0.7801260280698883, 0.8004828348132084],
            "ood_validation": [0.8040876450009207, 0.8125575400478733, 0.809795617749954, 0.7864113422942368, 0.8055606702264776],
            "validation": [0.8259630915588793, 0.8344461826090275, 0.831330204637084, 0.8127615195797881, 0.8273748203543312],
            "train": [0.8239668817108572, 0.8329411876925621, 0.8286519622649908, 0.8099418458613267, 0.8251767040052908]
          },
          "train_shifts": {
            "informativeness": [0.010037449301801279, 0.138466904652488, 0.015885263287728605, 0.09994033174675024, 0.12382239946897193],
            "invariance": [0.6913397369659873, 0.2724595577132243, 0.5537605392149502, 0.11408042937634164, 0.13982309574270532],
            "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.0019714875710719567, -0.0017492588395214394, 0.0035166859362696936],
            "latent_covariate_shift": [0.6895457814489371, 0.30490296948327716, 0.5518991321932777, 0.12076564877575148, 0.15529349412842303],
            "concept_shift": [0.0005109570959124368, -0.00011660189915026864, -0.00011764494263531041, -0.00045959469561522543, 0.006256273555412138],
            "residual": [0.005317289690057757, 0.1250295541801208, 0.008377251208974723, 0.10346353830424883, 0.11434056496023905],
            "overall": [0.0006646720700919373, 0.03242855562431873, 0.007621874824771247, -0.0008254289297467826, 0.015847239892020512]
          },
          "test_shifts": {
            "informativeness": [0.04758650894994602, 0.17283029795071259, 0.06797540520485233, 0.1027925391257456, 0.1527129014086324],
            "invariance": [0.031198280259225285, 1.1211992763352213e-15, 0.03660838666255654, 0.00146680808896939, 9.050140593520606e-05],
            "label_shift": [-0.0015958378682764684, -0.0014419506622654974, -0.0062578540267975175, -0.007654155868600332, 0.017383880625888287],
            "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0011755906674833225, 5.539239364886694e-05],
            "concept_shift": [0.0037510071063115327, 0.00306572696188911, 0.0033542659700670314, 0.008064343794686837, 0.0033963657689948753],
            "residual": [0.04443650089931378, 0.14858120282003853, 0.0532625439815069, 0.10383304603236068, 0.1326894847891638],
            "overall": [-0.015122554566274406, 0.021995256318596196, -0.008397392106365108, -0.00904536544900171, 0.026999619541772157]
          }
        },
        "all": {
          "metrics": {
            "id_test": [0.817024469654576, 0.8443811364908175, 0.8394592257211172, 0.835656509131607, 0.8365594953451697],
            "ood_test": [0.7873071729612504, 0.8147632881869143, 0.8106919268382503, 0.8087892303285732, 0.8104873358157044],
            "ood_validation": [0.7934082121156325, 0.8153194623457927, 0.8107162585159271, 0.8123734118946787, 0.8138464371202356],
            "validation": [0.8211047095781348, 0.8453839012044209, 0.8412377427601205, 0.8374985691937884, 0.8401948440103273],
            "train": [0.8180004387791764, 0.8447453014063191, 0.83952605489827, 0.8359013573538436, 0.8378965307829028]
          },
          "train_shifts": {
            "informativeness": [0.009371969804680087, 0.18173141918744726, 0.02970223479021865, 0.14804129738765448, 0.16751959485518642],
            "invariance": [0.7142965711624533, 0.3381517164854672, 0.5171746279101165, 0.04011184410845488, 0.2508307164990842],
            "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.0019714875710719567, -0.0017492588395214394, 0.0035166859362696936],
            "latent_covariate_shift": [0.7135533302768001, 0.3655060501403584, 0.5161819136594916, 0.04184508066166055, 0.2629979940603884],
            "concept_shift": [9.257293179098162e-05, -0.001991916650746003, 3.6067376022620544e-05, 0.00097727593960667, 0.002343891420367261],
            "residual": [0.006313162456522016, 0.13197384297838752, 0.00021824034147927362, 0.1300389103725151, 0.13248470722372963],
            "overall": [-0.00026213079573426945, 0.06714189967922829, 0.029955347420951628, 0.01750573790217816, 0.04170492367006007]
          },
          "test_shifts": {
            "informativeness": [0.057013775972670815, 0.199069177114589, 0.007281645638885224, 0.14979473254380263, 0.17528507777799326],
            "invariance": [0.02485042207931326, 1.1211992763352213e-15, 0.002055840433266947, 0.00176530051164947, 1.1211992763352213e-15],
            "label_shift": [-0.0015958378682764684, -0.0014419506622654974, -0.0062578540267975175, -0.007654155868600332, 0.017383880625888287],
            "latent_covariate_shift": [0.0, 0.0, 0.0, 2.838649491896098e-05, 0.0],
            "concept_shift": [0.0021640425613340076, 0.0009738191526005036, 0.002344379441444868, 0.005297020286061459, 0.0016590992970224455],
            "residual": [0.0570587550546559, 0.12317397916356715, 0.005716525289091386, 0.12134124436362778, 0.13165087076615795],
            "overall": [-0.014350130336446956, 0.07468731304358828, -0.003763916600960828, 0.021109443094478708, 0.051496597676267686]
          }
        }
      },
      "brfss_diabetes": {
        "causal": {
          "metrics": {
            "id_test": [0.8733539482615582, 0.8733539482615582, 0.8733539482615582, 0.8733539482615582, 0.8727734948908001],
            "ood_test": [0.8256898387489898, 0.8256898387489898, 0.8256898387489898, 0.8256898387489898, 0.8258053731343283],
            "ood_validation": [0.8263613623244179, 0.8263613623244179, 0.8263613623244179, 0.8263613623244179, 0.828748280605227],
            "validation": [0.8727420826765417, 0.8727420826765417, 0.8727420826765417, 0.8727420826765417, 0.8745233339386236],
            "train": [0.8726770320313149, 0.8726770320313149, 0.8726770320313149, 0.8726770320313149, 0.8752812802753529]
          },
          "train_shifts": {
            "informativeness": [0.14071908082893472, 0.14071908082893472, 0.14071908082893472, 0.14071908082893472, 0.14071908082893472],
            "invariance": [0.12139778878262138, 0.12139778878262138, 0.12139778878262138, 0.12139778878262138, 0.12139778878262138],
            "label_shift": [0.017554929267790703, 0.017554929267790703, 0.017554929267790703, 0.017554929267790703, 0.017554929267790703],
            "latent_covariate_shift": [0.12942517779261428, 0.12942517779261428, 0.12942517779261428, 0.12942517779261428, 0.12942517779261428],
            "concept_shift": [0.031838328386072215, 0.031838328386072215, 0.031838328386072215, 0.031838328386072215, 0.031838328386072215],
            "residual": [0.14451726459615816, 0.14451726459615816, 0.14451726459615816, 0.14451726459615816, 0.14451726459615816],
            "overall": [-0.006926188821367724, -0.006926188821367724, -0.006926188821367724, -0.006926188821367724, -0.006926188821367724]
          },
          "test_shifts": {
            "informativeness": [0.11102299581870327, 0.11102299581870327, 0.11102299581870327, 0.11102299581870327, 0.11102299581870327],
            "invariance": [0.21686273013837493, 0.21686273013837493, 0.21686273013837493, 0.21686273013837493, 0.21686273013837493],
            "label_shift": [0.010747443489363856, 0.010747443489363856, 0.010747443489363856, 0.010747443489363856, 0.010747443489363856],
            "latent_covariate_shift": [0.23272830478966047, 0.23272830478966047, 0.23272830478966047, 0.23272830478966047, 0.23272830478966047],
            "concept_shift": [0.1071328622142813, 0.1071328622142813, 0.1071328622142813, 0.1071328622142813, 0.1071328622142813],
            "residual": [0.15271201086531838, 0.15271201086531838, 0.15271201086531838, 0.15271201086531838, 0.15271201086531838],
            "overall": [-0.08194893708343107, -0.08194893708343107, -0.08194893708343107, -0.08194893708343107, -0.08194893708343107]
          }
        },
        "arguablycausal": {
          "metrics": {
            "id_test": [0.8727734948908001, 0.8727734948908001, 0.8727734948908001, 0.8727734948908001, 0.8727734948908001],
            "ood_test": [0.8258053731343283, 0.8258053731343283, 0.8258053731343283, 0.8258053731343283, 0.8258053731343283],
            "ood_validation": [0.828748280605227, 0.828748280605227, 0.828748280605227, 0.828748280605227, 0.828748280605227],
            "validation": [0.8745233339386236, 0.8745233339386236, 0.8745233339386236, 0.8745233339386236, 0.8745233339386236],
            "train": [0.8752812802753529, 0.8752812802753529, 0.8752812802753529, 0.8752812802753529, 0.8752812802753529]
          },
          "train_shifts": {
            "informativeness": [0.065579582170207, 0.08185042528033055, 0.065579582170207, 0.08185042528033055, 0.065579582170207],
            "invariance": [1.1211992763352213e-15, 0.0003967411362459429, 1.1211992763352213e-15, 0.0003967411362459429, 1.1211992763352213e-15],
            "label_shift": [0.004410807874824522, 0.005675449120732449, 0.004410807874824522, 0.005675449120732449, 0.004410807874824522],
            "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
            "concept_shift": [0.0016951666730452262, 0.00028853900817824143, 0.0016951666730452262, 0.00028853900817824143, 0.0016951666730452262],
            "residual": [0.06565139847660087, 0.08186571745359833, 0.06565139847660087, 0.08186571745359833, 0.06565139847660087],
            "overall": [0.0012860042944952271, 0.0024797923148863615, 0.0012860042944952271, 0.0024797923148863615, 0.0012860042944952271]
          },
          "test_shifts": {
            "informativeness": [0.06146337294796018, 0.07856781042015454, 0.06146337294796018, 0.07856781042015454, 0.06146337294796018],
            "invariance": [0.11115786544330293, 0.0976707142196128, 0.11115786544330293, 0.0976707142196128, 0.11115786544330293],
            "label_shift": [0.01689154063470388, 0.009215807138557535, 0.01689154063470388, 0.009215807138557535, 0.01689154063470388],
            "latent_covariate_shift": [0.12360306727917729, 0.10277430146961146, 0.12360306727917729, 0.10277430146961146, 0.12360306727917729],
            "concept_shift": [0.00463889773086192, 0.004302801172548457, 0.00463889773086192, 0.004302801172548457, 0.00463889773086192],
            "residual": [0.06374901847339591, 0.08539145851485647, 0.06374901847339591, 0.08539145851485647, 0.06374901847339591],
            "overall": [0.010063276844422417, -0.0018153514866980636, 0.010063276844422417, -0.0018153514866980636, 0.010063276844422417]
          }
        },
        "all": {
          "metrics": {
            "id_test": [0.8727734948908001, 0.8727734948908001, 0.8727734948908001, 0.8727734948908001, 0.8727734948908001],
            "ood_test": [0.8258053731343283, 0.8258053731343283, 0.8258053731343283, 0.8258053731343283, 0.8258053731343283],
            "ood_validation": [0.828748280605227, 0.828748280605227, 0.828748280605227, 0.828748280605227, 0.828748280605227],
            "validation": [0.8745233339386236, 0.8745233339386236, 0.8745233339386236, 0.8745233339386236, 0.8745233339386236],
            "train": [0.8752812802753529, 0.8752812802753529, 0.8752812802753529, 0.8752812802753529, 0.8752812802753529]
          },
          "train_shifts": {
            "informativeness": [0.09091036098511927, 0.10978798596557524, 0.09091036098511927, 0.10978798596557524, 0.09091036098511927],
            "invariance": [1.1211992763352213e-15, 0.00043280851226680154, 1.1211992763352213e-15, 0.00043280851226680154, 1.1211992763352213e-15],
            "label_shift": [0.004410807874824522, 0.005675449120732449, 0.004410807874824522, 0.005675449120732449, 0.004410807874824522],
            "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
            "concept_shift": [0.000504943264311402, 0.0003606737602228418, 0.000504943264311402, 0.0003606737602228418, 0.000504943264311402],
            "residual": [0.09091306962032668, 0.10979392292365862, 0.09091306962032668, 0.10979392292365862, 0.09091306962032668],
            "overall": [0.0019502236700486009, 0.002435046466038024, 0.0019502236700486009, 0.002435046466038024, 0.0019502236700486009]
          },
          "test_shifts": {
            "informativeness": [0.08551390802184884, 0.11929932305352953, 0.08551390802184884, 0.11929932305352953, 0.08551390802184884],
            "invariance": [0.11506280540660196, 0.2442295332011294, 0.11506280540660196, 0.2442295332011294, 0.11506280540660196],
            "label_shift": [0.01689154063470388, 0.0015103556643162749, 0.01689154063470388, 0.0015103556643162749, 0.01689154063470388],
            "latent_covariate_shift": [0.1257691976399603, 0.26585065427144633, 0.1257691976399603, 0.26585065427144633, 0.1257691976399603],
            "concept_shift": [-0.0033356914822875085, -0.0016704959080424133, -0.0033356914822875085, -0.0016704959080424133, -0.0033356914822875085],
            "residual": [0.09849656251251815, 0.13262186048058577, 0.09849656251251815, 0.13262186048058577, 0.09849656251251815],
            "overall": [0.002484157684505564, -0.0009215511057184267, 0.002484157684505564, -0.0009215511057184267, 0.002484157684505564]
          }
        }
      },
      "acsincome": {
        "causal": {
          "metrics": {
            "id_test": [0.6929045159983799, 0.7056374038072094, 0.7044349939246659, 0.7019479040097205, 0.706194309437019],
            "ood_test": [0.6444125357326342, 0.6699951258710859, 0.6591403090461198, 0.6706933119047306, 0.67125976472448],
            "ood_validation": [0.645050385299348, 0.6681683461766449, 0.6611736810906935, 0.6695909899229401, 0.6699466508595139],
            "validation": [0.6895168180236053, 0.7042116254785938, 0.7027244248963705, 0.7013448090371167, 0.7054520140492991],
            "train": [0.6906171314025613, 0.7040968323493837, 0.7022631500257491, 0.7011493343606595, 0.705042151752638]
          },
          "train_shifts": {
            "informativeness": [0.19214780289117878, 0.1376068490632905, 0.181416684473431, 0.13661322517109534, 0.12548021534256396],
            "invariance": [1.3699775780233154, 0.9287020108741347, 1.3543904521744476, 0.8117112933979674, 1.133168395927881],
            "label_shift": [0.015213404934141922, 0.008082415533674643, 0.01645051026249839, 0.008952243593109139, 0.012942164580406736],
            "latent_covariate_shift": [1.334623401615656, 1.0327657304568243, 1.344685847962023, 0.8448142117242189, 1.1991925310846334],
            "concept_shift": [0.20338844762828895, 0.19759857757004834, 0.21029733236679385, 0.16652837975335444, 0.1938105667689268],
            "residual": [0.1302552772941036, 0.12316111209268205, 0.13890355358124562, 0.10898071352512817, 0.12387427656744333],
            "overall": [-0.049872083953828084, -0.028280484256233612, -0.05926258226617466, -0.034604097271029755, -0.05581619474076327]
          },
          "test_shifts": {
            "informativeness": [0.1595484469147919, 0.14638262407062308, 0.1579294753599218, 0.15131617164351716, 0.15932175986320954],
            "invariance": [0.00961501884573523, 0.0010385805203655338, 0.008456828410855577, 0.008164335122383974, 0.0015200593564478832],
            "label_shift": [0.003482233702930959, -0.0030031161792455387, 0.013090250486158318, 0.007755964108755229, -0.001559746675945601],
            "latent_covariate_shift": [-0.00021190260141068704, 0.0008942218498627095, 0.0006406951345724709, 0.0022463775597194977, 0.0007933331044731999],
            "concept_shift": [0.10691793507716399, 0.12170977441854285, 0.11121536096221002, 0.09393452347906513, 0.11161394655461694],
            "residual": [0.15810790660633603, 0.1537176244919946, 0.15850840257057053, 0.1569891517374258, 0.15477059175030308],
            "overall": [-0.055190771102233624, -0.06976362505551714, -0.05354954908681614, -0.051721238560395816, -0.05239904162836215]
          }
        },
        "arguablycausal": {
          "metrics": {
            "id_test": [0.8003493317132442, 0.8213029060348319, 0.809785085054678, 0.810772326852977, 0.8176387201296071],
            "ood_test": [0.7614838429213158, 0.8017678597304738, 0.7783852142640724, 0.7920327752236171, 0.7953787988565557],
            "ood_validation": [0.759098992294013, 0.801778304682869, 0.7784232365145228, 0.791108476585655, 0.7973918197984589],
            "validation": [0.8019618390659115, 0.8215675726987944, 0.810467360693605, 0.8117710343954688, 0.8180299338670379],
            "train": [0.8017273635556034, 0.8241342021306471, 0.8110832569299031, 0.8121678032912937, 0.8201116505276781]
          },
          "train_shifts": {
            "informativeness": [0.013398465892137675, 0.3175345420893832, 0.014208939608395126, 0.28803964433555546, 0.3370651638893076],
            "invariance": [0.42030974834657525, 0.16785091845604208, 0.5487107270593294, 0.08805680450720309, 0.5992415609338768],
            "label_shift": [0.015213404934141922, 0.008082415533674643, 0.01645051026249839, 0.008952243593109139, 0.012942164580406736],
            "latent_covariate_shift": [0.4211897808953605, 0.18054783515677467, 0.5479692561080874, 0.06005482833768752, 0.6655552658181723],
            "concept_shift": [0.0008819332184488002, 0.0006083325776725289, 0.0007946845183567383, 0.0044877378481105136, -0.003615209232890497],
            "residual": [0.0009611077622181602, 0.13003001945689907, 0.0009454298687678572, 0.10546487591473226, 0.1526896764314617],
            "overall": [0.0200431102621587, 0.1975900224608515, 0.02072068713607714, 0.17080603320856474, 0.22581102680664222]
          },
          "test_shifts": {
            "informativeness": [0.08034992517377179, 0.3285031057678491, 0.06228673233103459, 0.2634004277892457, 0.39639236965268126],
            "invariance": [0.02435016690500915, 0.006023251795712601, 0.024886489455334122, 0.02947946911964063, 0.0011902234087330236],
            "label_shift": [0.003482233702930959, -0.0030031161792455387, 0.013090250486158318, 0.007755964108755229, -0.001559746675945601],
            "latent_covariate_shift": [5.77006211246754e-06, 0.0, 3.2592470794131605e-06, -2.2025956085569866e-05, 3.071688123396579e-06],
            "concept_shift": [0.016796577013550237, 0.014012175584634556, 0.014426950408890128, 0.013429086338942119, 0.014883803838504756],
            "residual": [0.05787419007052008, 0.14404702999372776, 0.03816774222672728, 0.11933565687272774, 0.21098036709250592],
            "overall": [0.0036463650264937295, 0.17293680399432498, 0.011009025038814055, 0.12647746226356144, 0.17659665144264539]
          }
        },
        "all": {
          "metrics": {
            "id_test": [0.8154237545565006, 0.8267137505062778, 0.8204105913325233, 0.8146200384771163, 0.8163793539894694],
            "ood_test": [0.7894376309098813, 0.8047186837217267, 0.8088814532808157, 0.7911106427263506, 0.7799001462238674],
            "ood_validation": [0.7831653823355068, 0.7981031416716065, 0.8016597510373444, 0.783402489626556, 0.7790160047421458],
            "validation": [0.8166693035471316, 0.8281935259310825, 0.8216308578299528, 0.8156314273961333, 0.8177704648292884],
            "train": [0.8164561518143408, 0.8289035165090739, 0.8217095962971958, 0.8154609954885719, 0.8175383249889449]
          },
          "train_shifts": {
            "informativeness": [0.016166836301628813, 0.37217352300344064, 0.033058459453132044, 0.3536601054706979, 0.3495947522130081],
            "invariance": [0.8031574457813077, 0.18353565454722331, 0.44954916419394314, 0.04529566065984213, 0.30782860512754606],
            "label_shift": [0.015213404934141922, 0.008082415533674643, 0.01645051026249839, 0.008952243593109139, 0.012942164580406736],
            "latent_covariate_shift": [0.804627893314868, 0.20672427075731772, 0.45196581927895507, 0.050534265333673736, 0.33901782694416605],
            "concept_shift": [0.00036036148856837696, 9.054096497798559e-05, 6.827405417335035e-05, -0.0023417295464910914, -0.005251539232595138],
            "residual": [0.003864716530917016, 0.13873208606465226, 0.016722350096515556, 0.18039924502766386, 0.18946481600130485],
            "overall": [0.020463865260278696, 0.2490316823281839, 0.02573555500328497, 0.18152714934975, 0.1848213990265142]
          },
          "test_shifts": {
            "informativeness": [0.1534532238779642, 0.39977335978471573, 0.16780913195315386, 0.39646192107462114, 0.40716416998101523],
            "invariance": [0.029394911458113158, 0.0022361773133789285, 0.03289344693226971, 0.0012983395771635885, 0.00010820212806625991],
            "label_shift": [0.003482233702930959, -0.0030031161792455387, 0.013090250486158318, 0.007755964108755229, -0.001559746675945601],
            "latent_covariate_shift": [2.633591064131417e-06, 2.7346673326575097e-06, 3.2592470794131605e-06, 7.32367971647797e-05, 3.071688123396579e-06],
            "concept_shift": [0.008367631237156508, 0.009016844005556631, 0.010531673798490035, 0.009988166953773773, 0.007886732890193574],
            "residual": [0.08369215882594881, 0.17237944254156215, 0.06377944845680805, 0.21870799863239854, 0.25109913149294244],
            "overall": [0.05262222735137807, 0.22026721582772943, 0.0888638779975848, 0.17602526962971388, 0.15128923348503176]
          }
        }
      },
      "acsunemployment": {
        "causal": {
          "metrics": {
            "id_test": [0.966176060483996, 0.966176060483996, 0.966176060483996, 0.966176060483996, 0.966176060483996],
            "ood_test": [0.9484875711290806, 0.9484875711290806, 0.9484875711290806, 0.9484875711290806, 0.9484875711290806],
            "ood_validation": [0.9493949394939494, 0.9493949394939494, 0.9493949394939494, 0.9493949394939494, 0.9493949394939494],
            "validation": [0.9665910612032423, 0.9665910612032423, 0.9665910612032423, 0.9665910612032423, 0.9665910612032423],
            "train": [0.9659411858574622, 0.9659411858574622, 0.9659411858574622, 0.9659411858574622, 0.9659411858574622]
          },
          "train_shifts": {
            "informativeness": [0.05884520457396942, 0.008420957837166431, 0.03836193585556145, 0.00449801497610335, 0.008124553553769424],
            "invariance": [0.20962763031866138, 0.13089255048738602, 0.18440132427762587, 0.07999295650213666, 0.14590996815849785],
            "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.010702787576484114, 0.007558921330948673, 0.010429625385121278],
            "latent_covariate_shift": [0.16557776292104648, 0.1359101285429737, 0.16615046365069217, 0.0846812642207908, 0.1507272415123805],
            "concept_shift": [0.13028661677781211, 0.1270234353134435, 0.13542042160024984, 0.11361236950101955, 0.13738034826295306],
            "residual": [0.00555332858798586, 0.0037207219275002513, 0.008152086972076719, 0.006029309074195632, 0.008200634504667818],
            "overall": [-0.03013742714508792, -0.05595093720725102, -0.041274398441864986, -0.05221386432380065, -0.06114280571287296]
          },
          "test_shifts": {
            "informativeness": [0.0672962296451312, 0.010591108668759605, 0.04872403100799964, 0.006072564446463104, 0.015319296602147838],
            "invariance": [0.36775789487502497, 0.27506341854339433, 0.3611329009412396, 0.14347758899187793, 0.30017068110840495],
            "label_shift": [-0.011390759908765893, -0.0016505080476568843, 0.006426295058067999, -0.009983525331316297, 0.005370670571223699],
            "latent_covariate_shift": [0.33691443555875383, 0.27543668583975617, 0.33500298153107444, 0.14438447475675645, 0.30041949299495624],
            "concept_shift": [0.12641483080481827, 0.11965340234552166, 0.13110830436197785, 0.12040372023313131, 0.12525071455821168],
            "residual": [0.0072182162737327174, 0.012726238361035747, 0.008915635016853714, 0.006392166723527593, 0.016255602735369083],
            "overall": [-0.024246511643529173, -0.06260045124068447, -0.03559756836589159, -0.06505978217684903, -0.06075192218343958]
          }
        },
        "arguablycausal": {
          "metrics": {
            "id_test": [0.9716853097016082, 0.9717039010937936, 0.966176060483996, 0.966176060483996, 0.966176060483996],
            "ood_test": [0.9603510766391012, 0.960375524873022, 0.9484875711290806, 0.9484875711290806, 0.9484875711290806],
            "ood_validation": [0.961001100110011, 0.961001100110011, 0.9493949394939494, 0.9493949394939494, 0.9493949394939494],
            "validation": [0.9722614709600654, 0.9722614709600654, 0.9665910612032423, 0.9665910612032423, 0.9665910612032423],
            "train": [0.9713675736726072, 0.9713760947669635, 0.9659411858574622, 0.9659411858574622, 0.9659411858574622]
          },
          "train_shifts": {
            "informativeness": [0.04024399447172776, 0.03861511760648453, 0.11185415793337666, 0.00376734108016385, 0.041804929340884735],
            "invariance": [0.25808865983652257, 0.21804812771105037, 0.30404895015432254, 0.0022794637832961604, 0.2639515529904047],
            "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.010702787576484114, 0.007558921330948673, 0.010429625385121278],
            "latent_covariate_shift": [0.2569922296080677, 0.22245664509948904, 0.2833929192618254, -0.00840618004272854, 0.26666858174805],
            "concept_shift": [0.004978415863623132, 0.002891840205110864, 0.005016548761867178, 0.00033829129095466754, 0.004727773143342053],
            "residual": [-6.122123033327679e-05, 0.015836117316371762, 0.0098957175985029, 0.002029080641583867, 0.043955961217225385],
            "overall": [0.041006731612664084, 0.02388909439378738, 0.09447354429593367, 5.753545564634536e-06, 0.002058408623371623]
          },
          "test_shifts": {
            "informativeness": [0.046383495305728446, 0.08097058477792926, 0.10828490812096968, 0.004857734834395864, 0.08533303854868533],
            "invariance": [0.2669769485470895, 0.242632289065839, 0.3086335357658244, -0.009788854770466753, 0.2668565357260475],
            "label_shift": [-0.011390759908765893, -0.0016505080476568843, 0.006426295058067999, -0.009983525331316297, 0.005370670571223699],
            "latent_covariate_shift": [0.26550258469762944, 0.25154427033925464, 0.2929450070874234, -0.000305589081195188, 0.2688302061685285],
            "concept_shift": [0.024150902066862028, 0.01833075907888933, 0.020001233413204648, -0.011538115654666135, 0.023098489754714135],
            "residual": [0.003235183081498612, 0.03317192082830473, 0.01764317464673592, 0.006399865626822538, 0.0880302568436989],
            "overall": [0.024640299311685845, 0.04226402102305924, 0.07600999995746491, 0.0039767972138840275, -0.010574292665518292]
          }
        },
        "all": {
          "metrics": {
            "id_test": [0.972168685898429, 0.9719579834536609, 0.9722244600749853, 0.966176060483996, 0.9721377002447866],
            "ood_test": [0.9607422483818325, 0.9606811277970307, 0.9606138951537488, 0.9484875711290806, 0.9608400413175153],
            "ood_validation": [0.9606160616061606, 0.9619361936193619, 0.9609460946094609, 0.9493949394939494, 0.9617161716171617],
            "validation": [0.9725341464019236, 0.9733955529114301, 0.9724907662179916, 0.9665910612032423, 0.972639498277187],
            "train": [0.9718842618485817, 0.9724853863231788, 0.971861022500337, 0.9659411858574622, 0.9719206701608318]
          },
          "train_shifts": {
            "informativeness": [0.026353375720215365, 0.13001665978073326, 0.04568163415624684, 0.0038152989990396886, 0.1388114975000404],
            "invariance": [0.19069976887062137, 0.10870987847235429, 0.21131668413188934, 0.00222203673210147, 0.18510939290368542],
            "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.010702787576484114, 0.007558921330948673, 0.010429625385121278],
            "latent_covariate_shift": [0.1903850579500992, 0.10956211501364861, 0.21180723266759882, -0.008495584933747998, 0.1869134088499938],
            "concept_shift": [0.0011541560327115242, 0.0005454320336355029, 0.0016170206916637094, 0.0004712114003823491, -0.0003460547920674335],
            "residual": [0.0007297337419778691, 0.09978230858433808, 0.007513502337789638, 0.00201704652507398, 0.09912976769349378],
            "overall": [0.028628147458262677, 0.030739508962235304, 0.042956289528722144, -1.6703393675863466e-05, 0.045971577868295185]
          },
          "test_shifts": {
            "informativeness": [0.03160295100682791, 0.18804742634835156, 0.041285738241074704, 0.004932145206980765, 0.19357691431767154],
            "invariance": [0.27271835895583324, 0.14584242140702053, 0.2591043228692201, -0.00972043866594452, 0.26185723308603853],
            "label_shift": [-0.011390759908765893, -0.0016505080476568843, 0.006426295058067999, -0.009983525331316297, 0.005370670571223699],
            "latent_covariate_shift": [0.27214758151172014, 0.14705566848874196, 0.25846839158156054, -0.00047696932677880464, 0.2654724437796364],
            "concept_shift": [0.013467558206699409, 0.01416862605877636, 0.013812602770644571, -0.010697688975612456, 0.010898834172696124],
            "residual": [0.0028067698183329645, 0.11995350522882296, 0.011176062784327477, 0.0064319857216821675, 0.12293959131901418],
            "overall": [0.016081633408705748, 0.06079097760717271, 0.026098555956629167, 0.003478975977029535, 0.06968084654472011]
          }
        }
      },
      "assistments": {
        "causal": {
          "metrics": {
            "id_test": [0.9250542079635062, 0.9250542079635062, 0.9250542079635062, 0.9250542079635062, 0.9250542079635062],
            "ood_test": [0.45120671563483733, 0.45120671563483733, 0.45120671563483733, 0.45120671563483733, 0.45120671563483733],
            "ood_validation": [0.5518867924528302, 0.5518867924528302, 0.5518867924528302, 0.5518867924528302, 0.5518867924528302],
            "validation": [0.9238312462954765, 0.9238312462954765, 0.9238312462954765, 0.9238312462954765, 0.9238312462954765],
            "train": [0.9239277739169417, 0.9239277739169417, 0.9239277739169417, 0.9239277739169417, 0.9239277739169417]
          },
          "train_shifts": {
            "informativeness": [0.30823738476990614, 0.30823738476990614, 0.30823738476990614, 0.30823738476990614, 0.30823738476990614],
            "invariance": [1.7704368426784203, 1.7704368426784203, 1.7704368426784203, 1.7704368426784203, 1.7704368426784203],
            "label_shift": [0.02660028896165906, 0.02660028896165906, 0.02660028896165906, 0.02660028896165906, 0.02660028896165906],
            "latent_covariate_shift": [1.8073300760431545, 1.8073300760431545, 1.8073300760431545, 1.8073300760431545, 1.8073300760431545],
            "concept_shift": [0.16641775286805086, 0.16641775286805086, 0.16641775286805086, 0.16641775286805086, 0.16641775286805086],
            "residual": [0.10071957902179955, 0.10071957902179955, 0.10071957902179955, 0.10071957902179955, 0.10071957902179955],
            "overall": [0.1560556904772778, 0.1560556904772778, 0.1560556904772778, 0.1560556904772778, 0.1560556904772778]
          },
          "test_shifts": {
            "informativeness": [0.21433506315292364, 0.21433506315292364, 0.21433506315292364, 0.21433506315292364, 0.21433506315292364],
            "invariance": [2.000846146110831, 2.000846146110831, 2.000846146110831, 2.000846146110831, 2.000846146110831],
            "label_shift": [0.05048711684579724, 0.05048711684579724, 0.05048711684579724, 0.05048711684579724, 0.05048711684579724],
            "latent_covariate_shift": [2.065672245999952, 2.065672245999952, 2.065672245999952, 2.065672245999952, 2.065672245999952],
            "concept_shift": [0.019231290164515847, 0.019231290164515847, 0.019231290164515847, 0.019231290164515847, 0.019231290164515847],
            "residual": [0.25521655783133895, 0.25521655783133895, 0.25521655783133895, 0.25521655783133895, 0.25521655783133895],
            "overall": [0.007159468606785846, 0.007159468606785846, 0.007159468606785846, 0.007159468606785846, 0.007159468606785846]
          }
        },
        "arguablycausal": {
          "metrics": {
            "id_test": [0.9221281033590181, 0.9221281033590181, 0.9221281033590181, 0.9221281033590181, 0.9221281033590181],
            "ood_test": [0.45120671563483733, 0.45120671563483733, 0.45120671563483733, 0.45120671563483733, 0.45120671563483733],
            "ood_validation": [0.5518867924528302, 0.5518867924528302, 0.5518867924528302, 0.5518867924528302, 0.5518867924528302],
            "validation": [0.9211414809090431, 0.9211414809090431, 0.9211414809090431, 0.9211414809090431, 0.9211414809090431],
            "train": [0.9212483224120128, 0.9212483224120128, 0.9212483224120128, 0.9212483224120128, 0.9212483224120128]
          },
          "train_shifts": {
            "informativeness": [0.16985550220841403, 0.16985550220841403, 0.16985550220841403, 0.16985550220841403, 0.16985550220841403],
            "invariance": [1.1736813133351025, 1.1736813133351025, 1.1736813133351025, 1.1736813133351025, 1.1736813133351025],
            "label_shift": [0.02660028896165906, 0.02660028896165906, 0.02660028896165906, 0.02660028896165906, 0.02660028896165906],
            "latent_covariate_shift": [1.1645609463101294, 1.1645609463101294, 1.1645609463101294, 1.1645609463101294, 1.1645609463101294],
            "concept_shift": [0.080577044407797, 0.080577044407797, 0.080577044407797, 0.080577044407797, 0.080577044407797],
            "residual": [0.09397155408916137, 0.09397155408916137, 0.09397155408916137, 0.09397155408916137, 0.09397155408916137],
            "overall": [0.04433538688369719, 0.04433538688369719, 0.04433538688369719, 0.04433538688369719, 0.04433538688369719]
          },
          "test_shifts": {
            "informativeness": [0.2542348690346613, 0.2542348690346613, 0.2542348690346613, 0.2542348690346613, 0.2542348690346613],
            "invariance": [1.8706553092488023, 1.8706553092488023, 1.8706553092488023, 1.8706553092488023, 1.8706553092488023],
            "label_shift": [0.02329921323212632, 0.02329921323212632, 0.02329921323212632, 0.02329921323212632, 0.02329921323212632],
            "latent_covariate_shift": [1.890871866798543, 1.890871866798543, 1.890871866798543, 1.890871866798543, 1.890871866798543],
            "concept_shift": [0.05715790844597368, 0.05715790844597368, 0.05715790844597368, 0.05715790844597368, 0.05715790844597368],
            "residual": [0.28530400719873195, 0.28530400719873195, 0.28530400719873195, 0.28530400719873195, 0.28530400719873195],
            "overall": [-0.037890206996124, -0.037890206996124, -0.037890206996124, -0.037890206996124, -0.037890206996124]
          }
        },
        "all": {
          "metrics": {
            "id_test": [0.6952874710203102, 0.6952874710203102, 0.6952874710203102, 0.6952874710203102, 0.6952874710203102],
            "ood_test": [0.43651626442812175, 0.43651626442812175, 0.43651626442812175, 0.43651626442812175, 0.43651626442812175],
            "ood_validation": [0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793],
            "validation": [0.6932016836355724, 0.6932016836355724, 0.6932016836355724, 0.6932016836355724, 0.6932016836355724],
            "train": [0.6938775893002008, 0.6938775893002008, 0.6938775893002008, 0.6938775893002008, 0.6938775893002008]
          },
          "train_shifts": {
            "informativeness": [-0.46192807687607673, -0.46192807687607673, -0.46192807687607673, -0.46192807687607673, -0.46192807687607673],
            "invariance": [-0.06032214406385896, -0.06032214406385896, -0.06032214406385896, -0.06032214406385896, -0.06032214406385896],
            "label_shift": [0.02660028896165906, 0.02660028896165906, 0.02660028896165906, 0.02660028896165906, 0.02660028896165906],
            "latent_covariate_shift": [-0.0600936927547586, -0.0600936927547586, -0.0600936927547586, -0.0600936927547586, -0.0600936927547586],
            "concept_shift": [-0.44427192661241915, -0.44427192661241915, -0.44427192661241915, -0.44427192661241915, -0.44427192661241915],
            "residual": [-0.36836058996025833, -0.36836058996025833, -0.36836058996025833, -0.36836058996025833, -0.36836058996025833],
            "overall": [0.1419828465257709, 0.1419828465257709, 0.1419828465257709, 0.1419828465257709, 0.1419828465257709]
          },
          "test_shifts": {
            "informativeness": [-0.3503897952512172, -0.3503897952512172, -0.3503897952512172, -0.3503897952512172, -0.3503897952512172],
            "invariance": [1.11495185871996, 1.11495185871996, 1.11495185871996, 1.11495185871996, 1.11495185871996],
            "label_shift": [0.02329921323212632, 0.02329921323212632, 0.02329921323212632, 0.02329921323212632, 0.02329921323212632],
            "latent_covariate_shift": [1.109295471958496, 1.109295471958496, 1.109295471958496, 1.109295471958496, 1.109295471958496],
            "concept_shift": [-0.3058599271279545, -0.3058599271279545, -0.3058599271279545, -0.3058599271279545, -0.3058599271279545],
            "residual": [-0.29611021558508815, -0.29611021558508815, -0.29611021558508815, -0.29611021558508815, -0.29611021558508815],
            "overall": [0.10747179713317939, 0.10747179713317939, 0.10747179713317939, 0.10747179713317939, 0.10747179713317939]
          }
        }
      },
      "acspubcov": {
    "causal": {
      "metrics": {
        "id_test": [0.7762120044250792, 0.7762120044250792, 0.7762120044250792, 0.7762120044250792, 0.7762120044250792],
        "ood_test": [0.3637295094494649, 0.3637295094494649, 0.3637295094494649, 0.3637295094494649, 0.3637295094494649],
        "ood_validation": [0.3601500946344469, 0.3601500946344469, 0.3601500946344469, 0.3601500946344469, 0.3601500946344469],
        "validation": [0.7770881882499536, 0.7770881882499536, 0.7770881882499536, 0.7770881882499536, 0.7770881882499536],
        "train": [0.7760952951251907, 0.7760952951251907, 0.7760952951251907, 0.7760952951251907, 0.7760952951251907]
      },
      "train_shifts": {
        "informativeness": [0.022111604819473465, 0.027336142328654528, 0.021600813988445555, 0.020048436647273623, 0.030324158306374957],
        "invariance": [0.001187792916523761, 0.0011446048329321924, 0.001238127849957903, 0.0012136511059418543, 0.0012294357672193057],
        "label_shift": [0.016856964365221407, 0.014266508443450773, -0.0024506375970712174, 0.017105702036990012, 0.003951813482014484],
        "latent_covariate_shift": [-0.0007961486190843853, 0.0003083691503200866, 0.0010299822400787982, 0.002002038817846921, 0.001542555918276412],
        "concept_shift": [0.016351395883391275, 0.03855235685630708, 0.030459441221892637, 0.042907428198710976, 0.022512302422693482],
        "residual": [0.024455176530718707, 0.024546903853752956, 0.026023528392809647, 0.01637654957175579, 0.032383314808845806],
        "overall": [-0.0030827582381342464, -0.009771803572832628, -0.020981826618785573, -0.008834782149390118, -0.011182840897281793]
      },
      "test_shifts": {
        "informativeness": [0.05023698345824935, 0.05841359956747832, 0.05878343286571494, 0.049744537351452865, 0.07282651783105427],
        "invariance": [0.0007432599898945372, 0.0011163053153123367, 0.0006271156905820291, -0.001331713956021509, 0.0010549042582529233],
        "label_shift": [-0.003372463110508083, 0.005126024335588067, -0.002479664073928679, -0.0011151225132898191, 0.010057200035966687],
        "latent_covariate_shift": [0.0005694163307785096, 0.0008808618332700316, 0.0005876929385840025, 0.0005735706925358653, 0.0010105952382827047],
        "concept_shift": [0.11301660294391339, 0.14862334994623658, 0.12546891268070492, 0.11939469255901211, 0.11119179366416215],
        "residual": [0.04938921604499311, 0.05089715672566434, 0.05032937684317578, 0.05355117445030153, 0.07256245037784713],
        "overall": [-0.057433687443512516, -0.06434994170453143, -0.055539943730776656, -0.06310890231072094, -0.05032538387087569]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.7762120044250792, 0.7980877906953525, 0.7949247377102212, 0.7762120044250792, 0.7987267912984093],
        "ood_test": [0.3637295094494649, 0.5959147891431108, 0.6192557071540097, 0.3637319548049401, 0.5898882105744507],
        "ood_validation": [0.3601500946344469, 0.5964501078392535, 0.6209890400105639, 0.3601500946344469, 0.5894845723843479],
        "validation": [0.7770881882499536, 0.7990678560089141, 0.7957949682595785, 0.7770881882499536, 0.7995650793460615],
        "train": [0.7760952951251907, 0.7982057530622785, 0.7948654714172784, 0.7760952951251907, 0.7985794193021951]
      },
      "train_shifts": {
        "informativeness": [0.10881078469413191, 0.11836106566010303, 0.08557547639332612, -0.0016867088375926151, 0.1204475001789796],
        "invariance": [0.009950850812328856, -5.60666619728773e-05, 0.05428877843196739, 0.0019045411763426352, 0.0008818632992154746],
        "label_shift": [0.016856964365221407, 0.014266508443450773, -0.0024506375970712174, 0.017105702036990012, 0.003951813482014484],
        "latent_covariate_shift": [0.00012141109211681566, -0.00012491542100818585, 9.000331992120971e-05, 0.002166381624334237, -7.249169940361604e-05],
        "concept_shift": [0.06731293591476857, 0.06027274961551327, 0.0589153134354492, -0.005198395828271556, 0.06280651731082916],
        "residual": [0.10797888025800972, 0.0885533119796192, 0.06938283805019486, -0.000544975775516895, 0.09664449490024014],
        "overall": [-0.029310801198757425, 0.0067702087149349305, -0.041589724729152046, 0.010141236094550865, -0.006101524134977429]
      },
      "test_shifts": {
        "informativeness": [0.22103411280509971, 0.21311526772834827, 0.2028227802984039, 0.0032314188682893356, 0.23385478167634188],
        "invariance": [0.015331269496163234, 0.00014782085247036137, 0.05377678499387467, 0.0023743929179279805, 0.0007596056620814272],
        "label_shift": [-0.003372463110508083, 0.005126024335588067, -0.002479664073928679, -0.0011151225132898191, 0.010057200035966687],
        "latent_covariate_shift": [1.0367668448506073e-05, 2.3919038171430022e-05, 3.717959587999617e-05, 0.0002568357867535808, 7.34594900571979e-05],
        "concept_shift": [0.015765050059314598, 0.013164592248112023, 0.01333823090124829, 0.019497467168095684, 0.01350362558272155],
        "residual": [0.22082541830715455, 0.1312017859765445, 0.1667517591425775, 0.0013162948878077997, 0.1827564367104796],
        "overall": [-0.01702051300082355, 0.07783224688839235, 0.001292270969240561, -0.009449949425798417, 0.049032059106472736]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.7850082471015332, 0.8066683706682748, 0.7952701974112488, 0.7762120044250792, 0.804869184595293],
        "ood_test": [0.39984129642965877, 0.621588576277362, 0.5726178875307656, 0.3637295094494649, 0.6263936997861537],
        "ood_validation": [0.39698050090232845, 0.621726308376249, 0.5708767991548924, 0.3601500946344469, 0.6262709626303975],
        "validation": [0.7859303767515141, 0.8080837731463454, 0.7961164660799831, 0.7770881882499536, 0.8062985616467079],
        "train": [0.7851479026890241, 0.807452557242448, 0.7955628818877708, 0.7760952951251907, 0.8056211683297768]
      },
      "train_shifts": {
        "informativeness": [0.055133582850976026, 0.14643786878083867, 0.1230714192757638, -0.0016745025338559232, 0.1464292929473803],
        "invariance": [0.07061992225151531, 6.907045986497962e-05, 0.043389053354736806, 0.001909665891522966, 0.0019100455324758915],
        "label_shift": [0.016856964365221407, 0.014266508443450773, -0.0024506375970712174, 0.017105702036990012, 0.003951813482014484],
        "latent_covariate_shift": [0.0, 0.00010270598198085544, 0.0, 0.002152477051117034, 5.000637971481674e-05],
        "concept_shift": [0.0023443794414450283, 0.002854156647571904, 0.0026689858256446087, -0.005584694794989955, 0.0029080423383321123],
        "residual": [0.051590875975261095, 0.10434480528819762, 0.10362338647011621, -0.000563238878862797, 0.10288091503275408],
        "overall": [-0.024510961788154532, 0.04781605715163845, -0.004806305583078735, 0.010355340340793892, 0.043140243910086876]
      },
      "test_shifts": {
        "informativeness": [0.07780992210280378, 0.21793716557284576, 0.20949801246111713, 0.0027653069786260907, 0.23237335029085146],
        "invariance": [0.0670853194013379, 0.0005188665695673284, 0.043352985978713385, 0.0024218619238642433, 0.001698293706043394],
        "label_shift": [-0.003372463110508083, 0.005126024335588067, -0.002479664073928679, -0.0011151225132898191, 0.010057200035966687],
        "latent_covariate_shift": [0.0, 0.00014063141592106658, 0.0, 0.00020666290962791746, 3.311761683749912e-05],
        "concept_shift": [0.0033542659700671914, 0.001496810364572906, 0.00302965958586697, 0.019304120888869285, 0.003095011857548748],
        "residual": [0.07909181231891149, 0.13399879973127907, 0.16586207872473493, 0.0012874949401740785, 0.1507563339423245],
        "overall": [-0.03818791445706429, 0.08556385525025115, 0.019204778917127657, -0.009839409169745704, 0.08426552239313298]
      }
    }
  },
  "brfss_blood_pressure": {
    "causal": {
      "metrics": {
        "train": [0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175],
        "validation": [0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545],
        "id_test": [0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787],
        "ood_validation": [0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197],
        "ood_test": [0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039]
      },
      "train_shifts": {
        "informativeness": [0.09965932863113837, 0.09965932863113837, 0.09965932863113837, 0.09965932863113837, 0.09965932863113837],
        "invariance": [0.0692903686143497, 0.0692903686143497, 0.0692903686143497, 0.0692903686143497, 0.0692903686143497],
        "label_shift": [0.01572578048184541, 0.01572578048184541, 0.01572578048184541, 0.01572578048184541, 0.01572578048184541],
        "latent_covariate_shift": [0.0663888171217777, 0.0663888171217777, 0.0663888171217777, 0.0663888171217777, 0.0663888171217777],
        "concept_shift": [0.08139271642511489, 0.08139271642511489, 0.08139271642511489, 0.08139271642511489, 0.08139271642511489],
        "residual": [0.09590285940196513, 0.09590285940196513, 0.09590285940196513, 0.09590285940196513, 0.09590285940196513],
        "overall": [-0.03052777448874751, -0.03052777448874751, -0.03052777448874751, -0.03052777448874751, -0.03052777448874751]
      },
      "test_shifts": {
        "informativeness": [0.07104750201759404, 0.07104750201759404, 0.07104750201759404, 0.07104750201759404, 0.07104750201759404],
        "invariance": [0.0391859029351735, 0.0391859029351735, 0.0391859029351735, 0.0391859029351735, 0.0391859029351735],
        "label_shift": [0.02105310105154427, 0.02105310105154427, 0.02105310105154427, 0.02105310105154427, 0.02105310105154427],
        "latent_covariate_shift": [0.045352403637596087, 0.045352403637596087, 0.045352403637596087, 0.045352403637596087, 0.045352403637596087],
        "concept_shift": [0.07502280913404194, 0.07502280913404194, 0.07502280913404194, 0.07502280913404194, 0.07502280913404194],
        "residual": [0.080297887404611, 0.080297887404611, 0.080297887404611, 0.080297887404611, 0.080297887404611],
        "overall": [-0.03315198907705451, -0.03315198907705451, -0.03315198907705451, -0.03315198907705451, -0.03315198907705451]
      }
    },
    "arguablycausal": {
      "metrics": {
        "train": [0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175],
        "validation": [0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545],
        "id_test": [0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787],
        "ood_validation": [0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197],
        "ood_test": [0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039]
      },
      "train_shifts": {
        "informativeness": [0.09765699089084444, 0.09765699089084444, 0.09765699089084444, 0.09765699089084444, 0.09765699089084444],
        "invariance": [0.07793818476605491, 0.07793818476605491, 0.07793818476605491, 0.07793818476605491, 0.07793818476605491],
        "label_shift": [0.01572578048184541, 0.01572578048184541, 0.01572578048184541, 0.01572578048184541, 0.01572578048184541],
        "latent_covariate_shift": [0.0810877103026729, 0.0810877103026729, 0.0810877103026729, 0.0810877103026729, 0.0810877103026729],
        "concept_shift": [0.13268393481321883, 0.13268393481321883, 0.13268393481321883, 0.13268393481321883, 0.13268393481321883],
        "residual": [0.09644076972020636, 0.09644076972020636, 0.09644076972020636, 0.09644076972020636, 0.09644076972020636],
        "overall": [-0.055688093226739635, -0.055688093226739635, -0.055688093226739635, -0.055688093226739635, -0.055688093226739635]
      },
      "test_shifts": {
        "informativeness": [0.06936658464312632, 0.06936658464312632, 0.06936658464312632, 0.06936658464312632, 0.06936658464312632],
        "invariance": [0.04740045829685339, 0.04740045829685339, 0.04740045829685339, 0.04740045829685339, 0.04740045829685339],
        "label_shift": [0.02105310105154427, 0.02105310105154427, 0.02105310105154427, 0.02105310105154427, 0.02105310105154427],
        "latent_covariate_shift": [0.055227487913560795, 0.055227487913560795, 0.055227487913560795, 0.055227487913560795, 0.055227487913560795],
        "concept_shift": [0.12864109945946633, 0.12864109945946633, 0.12864109945946633, 0.12864109945946633, 0.12864109945946633],
        "residual": [0.07159031959849071, 0.07159031959849071, 0.07159031959849071, 0.07159031959849071, 0.07159031959849071],
        "overall": [-0.05210421935097172, -0.05210421935097172, -0.05210421935097172, -0.05210421935097172, -0.05210421935097172]
      }
    },
    "all": {
      "metrics": {
        "train": [0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175],
        "validation": [0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545],
        "id_test": [0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787],
        "ood_validation": [0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197],
        "ood_test": [0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039]
      },
      "train_shifts": {
        "informativeness": [0.0986593699492623, 0.0986593699492623, 0.0986593699492623, 0.0986593699492623, 0.0986593699492623],
        "invariance": [0.07989107455116866, 0.07989107455116866, 0.07989107455116866, 0.07989107455116866, 0.07989107455116866],
        "label_shift": [0.01572578048184541, 0.01572578048184541, 0.01572578048184541, 0.01572578048184541, 0.01572578048184541],
        "latent_covariate_shift": [0.0806026583173446, 0.0806026583173446, 0.0806026583173446, 0.0806026583173446, 0.0806026583173446],
        "concept_shift": [0.016078243855003775, 0.016078243855003775, 0.016078243855003775, 0.016078243855003775, 0.016078243855003775],
        "residual": [0.09844055941794555, 0.09844055941794555, 0.09844055941794555, 0.09844055941794555, 0.09844055941794555],
        "overall": [0.00039837072782553107, 0.00039837072782553107, 0.00039837072782553107, 0.00039837072782553107, 0.00039837072782553107]
      },
      "test_shifts": {
        "informativeness": [0.07365563705977853, 0.07365563705977853, 0.07365563705977853, 0.07365563705977853, 0.07365563705977853],
        "invariance": [0.05030459553382311, 0.05030459553382311, 0.05030459553382311, 0.05030459553382311, 0.05030459553382311],
        "label_shift": [0.02105310105154427, 0.02105310105154427, 0.02105310105154427, 0.02105310105154427, 0.02105310105154427],
        "latent_covariate_shift": [0.05353167234564843, 0.05353167234564843, 0.05353167234564843, 0.05353167234564843, 0.05353167234564843],
        "concept_shift": [0.01740055705282833, 0.01740055705282833, 0.01740055705282833, 0.01740055705282833, 0.01740055705282833],
        "residual": [0.07587105035350622, 0.07587105035350622, 0.07587105035350622, 0.07587105035350622, 0.07587105035350622],
        "overall": [0.0012243971115429297, 0.0012243971115429297, 0.0012243971115429297, 0.0012243971115429297, 0.0012243971115429297]
      }
    }
  }


  }