{
    "diabetes_readmission": {
      "causal": {
        "metrics": {
          "id_test": [0.5838581758805692, 0.5838581758805692, 0.5838581758805692, 0.5838581758805692, 0.5838581758805692],
          "ood_test": [0.5061607283001098, 0.5061607283001098, 0.5061607283001098, 0.5081227436823105, 0.5061607283001098],
          "ood_validation": [0.4936440677966102, 0.4936440677966102, 0.4936440677966102, 0.4939971751412429, 0.4936440677966102],
          "validation": [0.5781614559029398, 0.5781614559029398, 0.5781614559029398, 0.5783947736817545, 0.5781614559029398],
          "train": [0.5757699486700887, 0.5757699486700887, 0.5757699486700887, 0.5744575361642558, 0.5757991133924405]
        },
        "train_shifts": {
          "informativeness": [0.021123605725829716, 0.04108626127000954, 0.026272263506125798, 0.03702065073615992, 0.028972200704715165],
          "invariance": [0.2585319018127712, 0.3375875585628073, 0.3488047212306245, 0.33420602946797556, 0.33943360571943254],
          "label_shift": [0.003375592508434266, 0.015734076376641568, 0.0038717563188721436, 0.008008014988420619, 0.004948265890470599],
          "latent_covariate_shift": [0.2881135505983801, 0.3405124406787669, 0.3756069134501434, 0.34532853645454653, 0.3574704512692942],
          "concept_shift": [0.2156857101906199, 0.2242811533138635, 0.25588288191494085, 0.2821864401391253, 0.2597548535303114],
          "residual": [0.018741334147903393, 0.0252506890116253, 0.03214711145117827, 0.018645982230390042, 0.03444933465003578],
          "overall": [-0.08898196287036203, -0.08697552515224695, -0.11847931463332737, -0.11315329057629697, -0.12386200499031019]
        },
        "test_shifts": {
          "informativeness": [0.012905055807477596, 0.01597016472836953, 0.012471973897203423, 0.018726426720528024, 0.022730695163134577],
          "invariance": [0.001082217846126711, 0.000481996151642902, 0.0006675566650245518, 0.0013963431151482353, 0.001931171279886951],
          "label_shift": [-0.009544186325330216, 0.0009818828414588172, 0.00993175229857283, 0.014709639655001874, 0.00401437316520963],
          "latent_covariate_shift": [0.0007856382124371672, 0.0016775995018360724, 0.0014301983254039745, 0.001859312795520507, 0.0011756685097965883],
          "concept_shift": [0.06776245021757742, 0.054949858965832064, 0.06755115290624168, 0.06546289058599618, 0.05845476539468897],
          "residual": [0.021327520195050385, 0.018195266243981604, 0.02061370635957119, 0.015026350205090005, 0.020395242082327517],
          "overall": [-0.047224072475871376, -0.028611287902702114, -0.03657011193601248, -0.021445064109872996, -0.025262494418977786]
        }
      },
      "arguablycausal": {
        "metrics": {
          "id_test": [0.6459062281315605, 0.41614182411943085, 0.6468392815488687, 0.6407744343363657, 0.4166083508280849],
          "ood_test": [0.6132475278606184, 0.4938392716998901, 0.6028096060273113, 0.6022602417202951, 0.49556584523622665],
          "ood_validation": [0.6142302259887006, 0.5063559322033898, 0.6004590395480226, 0.5962217514124294, 0.50829802259887],
          "validation": [0.6283247783481102, 0.4218385440970602, 0.640457302846477, 0.6413905739617359, 0.4230051329911339],
          "train": [0.6374533364442371, 0.4242300513299113, 0.6370741950536631, 0.6351784881007932, 0.4269715352309846]
        },
        "train_shifts": {
          "informativeness": [0.0972165501376091, 0.04591813012264994, 0.06243893849172817, 0.07498693002662063, 0.06379721469433905],
          "invariance": [0.34328566100362307, 0.09360768934684091, 0.4046836282493212, 0.3503976808148978, 0.18502248786587847],
          "label_shift": [0.003375592508434266, 0.015734076376641568, 0.0038717563188721436, 0.01694303354363733, 0.010591709630585226],
          "latent_covariate_shift": [0.38090715571913475, 0.09635856144421553, 0.4177813853070975, 0.38118552927081245, 0.22835138476742456],
          "concept_shift": [0.008044734747278199, 0.01601029963438607, 0.0036517581548589236, 0.00714315337978324, -0.0022902266967838214],
          "residual": [0.0694901204951357, 0.02773867851572211, 0.05242416219385244, 0.05406422126071908, 0.06741806608881758],
          "overall": [0.04420260588080728, 0.019416776026742893, 0.01667365390877052, 0.04121657307578591, 0.02448456521997905]
        },
        "test_shifts": {
          "informativeness": [0.08020995337515098, 0.04985022796273721, 0.07772458846052058, 0.08006616490054107, 0.07064538285373939],
          "invariance": [0.002548761238904996, 0.00012022458674073371, 0.006564262436045983, 0.0034508035047186936, 0.0010820212806678848],
          "label_shift": [-0.009544186325330216, 0.0009818828414588172, 0.023396601732772856, 0.0008036909816690989, 0.0012998536855332644],
          "latent_covariate_shift": [-4.80898346978952e-05, -2.40449173489476e-05, 0.0, -4.674648406711088e-05, -0.0001442695040885601],
          "concept_shift": [0.0019716832225485136, 0.0006251678510526161, 0.0012623581607779442, 0.0015809533156415693, 0.0005049432643117222],
          "residual": [0.059286382903726675, 0.03872861072246404, 0.05666434953423528, 0.06007096296521081, 0.068685127048463],
          "overall": [0.013867210160683499, 0.011227839983431444, 0.028845229494259765, 0.017857795773951128, 0.0017445656235089424]
        }
      },
      "all": {
        "metrics": {
          "id_test": [0.6309773734546302, 0.5838581758805692, 0.5868905994868207, 0.5838581758805692, 0.5838581758805692],
          "ood_test": [0.5693768639146131, 0.5061607283001098, 0.5118701930623136, 0.5061607283001098, 0.506298069376864],
          "ood_validation": [0.5653248587570622, 0.4936440677966102, 0.500882768361582, 0.4936440677966102, 0.4939971751412429],
          "validation": [0.6278581427904807, 0.5781614559029398, 0.5795613625758282, 0.5781614559029398, 0.5781614559029398],
          "train": [0.6199545030331312, 0.5757699486700887, 0.5774031731217919, 0.5757699486700887, 0.5757991133924405]
        },
        "train_shifts": {
          "informativeness": [0.06201283368052549, 0.053829439288845704, 0.005947926997509259, 0.03583836851265815, 0.07482439374634237],
          "invariance": [0.46193520125785303, 0.5094900195768708, 0.02666267893195003, 0.5272822557362624, 0.3554454854943362],
          "label_shift": [0.003375592508434266, 8.713826765839446e-05, 0.0013420918373664278, -0.002909466547099919, 0.03783006797584684],
          "latent_covariate_shift": [0.48377302339992667, 0.5496094309545619, 0.0023998647840264013, 0.5802432807454279, 0.3477727163022136],
          "concept_shift": [0.006704820938262567, 0.0006187835962930707, 0.03966235687667005, 0.0056022238530903145, 0.0028123798389551175],
          "residual": [0.057990792722544614, 0.0670498706865583, -0.001543021506712834, 0.038064540023478866, 0.04784026498791966],
          "overall": [0.01327633781410354, 0.006573451626815635, -0.023800591089391535, 0.0199984957936669, 0.040656588230807277]
        },
        "test_shifts": {
          "informativeness": [0.07046958521579033, 0.07505199810501634, 0.014908341494768884, 0.06923008343290488, 0.05045156582434743],
          "invariance": [1.1211992763352213e-15, 0.00010820212806625991, 0.00360533979025336, 3.6067376021979855e-05, 0.008223361733066988],
          "label_shift": [0.003414277603891494, -0.0046583752649079465, -0.0041588179013152555, 0.002935145858394216, 0.0009752909884537679],
          "latent_covariate_shift": [0.0, 0.0, 0.0037743692993055054, 0.0, -0.00021640425613284018],
          "concept_shift": [1.6017132519074588e-16, 1.6017132519074588e-16, -0.004591253425623501, 4.805139755722377e-16, -0.00021640425613300034],
          "residual": [0.06349952800078888, 0.07503347395818111, 0.013945584192006411, 0.06923911134048491, 0.050272215768247495],
          "overall": [0.008677196016946553, -0.0023647645496519543, 0.0012634898194426678, 0.0014405113336058428, -0.0034446853162065916]
        }
      }
    },
    "acsfoodstamps": {
    "causal": {
      "metrics": {
        "id_test": [0.813158162486646, 0.8154219870783944, 0.8126494378592868, 0.8159561479371217, 0.8127639009004426],
        "ood_test": [0.781946888170547, 0.7839109619869881, 0.7820287245795654, 0.7823560702156389, 0.7824992839314211],
        "ood_validation": [0.7913828024304916, 0.7910145461241024, 0.7943288528816056, 0.7928558276560486, 0.7917510587368809],
        "validation": [0.8161954544876442, 0.8178615488318263, 0.8153942030091444, 0.8190443486334211, 0.8163226372620093],
        "train": [0.8134981828818889, 0.8157000276621654, 0.813169098499566, 0.8179368475941865, 0.8133217173435419]
      },
      "train_shifts": {
        "informativeness": [0.06384304382329262, 0.07192309543699653, 0.06673365783605226, 0.08257921732983875, 0.0777868023965362],
        "invariance": [2.3435098884418317, 0.6328110461663716, 2.4051771599351177, 2.227098494547007, 0.5406345787882428],
        "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.001190637798646246, 0.0078008519978626295, -0.00813464147073721],
        "latent_covariate_shift": [2.3966382104382227, 0.7249895841659919, 2.4540364902782543, 2.339943924715138, 0.606047627710961],
        "concept_shift": [0.1303714603959396, 0.10139033809270614, 0.10958772675552624, 0.09421133487944658, 0.09576703437816657],
        "residual": [0.059022031596626875, 0.06869480263512603, 0.05859714743436518, 0.07385319684938024, 0.08313222204903002],
        "overall": [-0.03670358820827889, 0.0013335910726775257, -0.02163236890518469, 0.021943494123731963, -0.02458973311558666]
      },
      "test_shifts": {
        "informativeness": [0.08411203507660056, 0.07302656897977043, 0.07455805367589663, 0.07710788014342712, 0.08478386599604668],
        "invariance": [0.001659238442401184, 0.00011964427079663393, 0.0018346077423837541, 0.00040050359393392886, 0.0001656073980519214],
        "label_shift": [-0.0015958378682764684, 0.010002292596673068, 0.006998374135978972, 0.00554061796022068, 0.005847627141978667],
        "latent_covariate_shift": [7.275690334951393e-05, 0.000306275057459886, 0.0005557534170860983, -0.00021764484805806135, 0.0002434021801272332],
        "concept_shift": [0.15345208376761701, 0.14925239191765172, 0.1300750559584437, 0.1383748675648502, 0.15365136945328708],
        "residual": [0.08219237028190403, 0.07040478397477538, 0.07235916474755222, 0.07200638930489947, 0.08293411300688293],
        "overall": [-0.07639753679277604, -0.06690994926216265, -0.059978879145536776, -0.061624708184783106, -0.0720132207754528]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.824095741974869, 0.8091010835834562, 0.8091010835834562, 0.8336724830849062, 0.8232309101083584],
        "ood_test": [0.7990506976553868, 0.7801260280698883, 0.7801260280698883, 0.8100372355661034, 0.7989074839396048],
        "ood_validation": [0.8059289265328669, 0.7864113422942368, 0.7864113422942368, 0.812741668201068, 0.8059289265328669],
        "validation": [0.8274892848512597, 0.8127615195797881, 0.8127615195797881, 0.8376766250778994, 0.8276419041804978],
        "train": [0.8257983078385674, 0.8099418458613267, 0.8099418458613267, 0.8368949696193114, 0.8254867110321167]
      },
      "train_shifts": {
        "informativeness": [0.02117269565994016, 0.001479371232703219, 0.08313453069761803, 0.07863251784973664, 0.10980379110361875],
        "invariance": [0.8580522203304795, -0.0029959141820019796, 1.4790791126784035, 0.8956808201050436, 0.07539313930957198],
        "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.001190637798646246, 0.0078008519978626295, -0.00813464147073721],
        "latent_covariate_shift": [0.8538935639086318, 0.0065130252636659966, 1.4808960650331178, 0.8860559255476722, 0.0725094008828116],
        "concept_shift": [0.00023983217627564948, 0.009152707885520712, -0.0014251182969250774, -0.0001674388105234345, 0.0004004949526057237],
        "residual": [0.022644303793786, 0.0075896875578553204, 0.07707587793665921, 0.05826375417917621, 0.09618764848729561],
        "overall": [-0.006573883668077745, -0.0032210022277285207, 0.008275006986101521, 0.01954046179606777, 0.007906705191271499]
      },
      "test_shifts": {
        "informativeness": [0.08714593163717108, 0.0035704949473123514, 0.1329946957413029, 0.14078661961236785, 0.12674883651587435],
        "invariance": [0.04526455690789065, 0.0039037661742627482, 0.02802435116926927, 0.045337332923912906, -0.00029922098277898666],
        "label_shift": [-0.0015958378682764684, 0.010002292596673068, 0.006998374135978972, 0.00554061796022068, 0.005847627141978667],
        "latent_covariate_shift": [0.0, 0.002941367292373175, 0.0, 2.2302521665252692e-06, -0.00022024384324612043],
        "concept_shift": [0.0047248262589117155, 0.0034224999751018576, 0.00584291491560062, 0.0036428049782449524, 0.004721227587743867],
        "residual": [0.08067484825990799, -0.007799008963061681, 0.13184347268968027, 0.11162479207355012, 0.10687685134526441],
        "overall": [-0.019321527140276337, 0.014178200780214851, -0.012283222922822828, 0.007443182693932404, 0.02047467351749381]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.8302640280815994, 0.8091010835834562, 0.8327567787556596, 0.8471791219412932, 0.8351096301571959],
        "ood_test": [0.8050247555137281, 0.7801260280698883, 0.8049838373092189, 0.8214534146241663, 0.807745816113589],
        "ood_validation": [0.8072178236052292, 0.7864113422942368, 0.8120051555882895, 0.8193702817160744, 0.8120051555882895],
        "validation": [0.8330853269233215, 0.8127615195797881, 0.834916758874178, 0.8482455136276342, 0.8372569219224948],
        "train": [0.8313832036603086, 0.8099418458613267, 0.833257553837887, 0.8494812549084446, 0.8352718046224432]
      },
      "train_shifts": {
        "informativeness": [0.014781253211056871, 0.14082812486046864, 0.014682759903526152, 0.059418398033560374, 0.15412103747939201],
        "invariance": [0.8264025635251319, 0.026695433554325108, 0.8201705779552623, 0.9606835934483522, 0.05357316362837534],
        "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.001190637798646246, 0.0078008519978626295, -0.00813464147073721],
        "latent_covariate_shift": [0.8242371350361992, 0.04057198100153759, 0.816439949645088, 0.9552156500053214, 0.035695560242997096],
        "concept_shift": [0.0002727961129916701, 0.002708276813675969, 0.00022516921042603537, -0.0008367679586503003, 0.0007656137066501976],
        "residual": [0.016004451398585726, 0.15529852362475008, 0.013980766483708251, 0.04226816163114613, 0.12298171175129174],
        "overall": [-0.005345341723661266, -0.006175065130163249, -0.0006805864411591252, 0.01873507465915529, 0.01775039644671747]
      },
      "test_shifts": {
        "informativeness": [0.08603485629808315, 0.1456722860044603, 0.09431103090456448, 0.15563517262128074, 0.15748778282202366],
        "invariance": [0.03689692567073622, 0.0007697035939892439, 0.037798610071291004, 0.04367759236291392, -0.0003353936858872049],
        "label_shift": [-0.0015958378682764684, 0.010002292596673068, 0.006998374135978972, 0.00554061796022068, 0.005847627141978667],
        "latent_covariate_shift": [0.0, 0.000847887071038638, 0.0, 0.0, 0.0014035425567522678],
        "concept_shift": [0.0027411205776893695, 0.0022984564469819037, 0.0018755035531559264, 0.002127975185311227, 0.008229394625319682],
        "residual": [0.08034571084825001, 0.14914914613214705, 0.07830824024550703, 0.10511714962111181, 0.12367889148566016],
        "overall": [-0.014927796608517896, 0.0004141496856835125, -0.0003350790851765345, 0.03038554820616672, 0.03348747571601274]
      }
    }
  },
  "brfss_diabetes": {
    "causal": {
      "metrics": {
        "id_test": [0.8733539482615582, 0.8733539482615582, 0.8733539482615582, 0.8733539482615582, 0.8733539482615582],
        "ood_test": [0.8256898387489898, 0.8256898387489898, 0.8256898387489898, 0.8256898387489898, 0.8256898387489898],
        "ood_validation": [0.8263613623244179, 0.8263613623244179, 0.8263613623244179, 0.8263613623244179, 0.8263613623244179],
        "validation": [0.8727420826765417, 0.8727420826765417, 0.8727420826765417, 0.8727420826765417, 0.8727420826765417],
        "train": [0.8726770320313149, 0.8726770320313149, 0.8726770320313149, 0.8726770320313149, 0.8726770320313149]
      },
      "train_shifts": {
        "informativeness": [-0.0032507071918100455, 0.027737437860607377, 0.040040895061077254, 0.019870982412809393, -0.0011298057052987235],
        "invariance": [0.0015827659409225665, 0.01360167447203454, 0.01986791781859198, 0.0014248031935607504, 0.0044668066956326125],
        "label_shift": [0.017554929267790703, -0.008925562674817243, 0.011349868047816998, 0.011567414362509557, -0.0019713114816129395],
        "latent_covariate_shift": [0.0028081865844864352, 0.01555658606638229, 0.019422214265618517, 0.000922742320186573, 0.00453719422657335],
        "concept_shift": [0.004191765810051154, 0.04571811968833654, 0.03421818299521315, 0.03638103069111941, 0.007322353817841686],
        "residual": [0.009651880604195572, 0.02918327509141107, 0.04481752221692822, 0.018356518451365638, 0.011695186700234157],
        "overall": [-0.005608295745353908, -0.027790222615206712, -0.01643363640603577, -0.011143374639548263, -0.017436631289789825]
      },
      "test_shifts": {
        "informativeness": [-0.003116574063976402, 0.03956725108139802, 0.04422664980266613, 0.029698836711165487, -0.0035490379901829314],
        "invariance": [0.011216107017698313, 0.1410798855210137, 0.15470140492228882, 0.12990431236554148, 0.014226184127300527],
        "label_shift": [0.015683151311908138, -0.003100292479495139, -0.0014220757085065244, 0.010637533141847347, 0.0127744458173991],
        "latent_covariate_shift": [-0.009238683732665568, 0.14746175830205968, 0.16279278678352113, 0.14524152916849362, 0.006029583794569775],
        "concept_shift": [-0.0013094954450389587, 0.12108731969758282, 0.14076773889462205, 0.09885022142131873, -0.0089241290900317],
        "residual": [0.005572694983730717, 0.04363753116109797, 0.05367362986279784, 0.03291832399745565, -0.0008900452280316332],
        "overall": [-0.010420341044415513, -0.06297314977771594, -0.07649619643107984, -0.03965722302454979, 0.0040919945251987255]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.8727734948908001, 0.8727734948908001, 0.8727734948908001, 0.8727734948908001, 0.8727734948908001],
        "ood_test": [0.8258053731343283, 0.8258053731343283, 0.8258053731343283, 0.8258053731343283, 0.8258053731343283],
        "ood_validation": [0.828748280605227, 0.828748280605227, 0.828748280605227, 0.828748280605227, 0.828748280605227],
        "validation": [0.8745233339386236, 0.8745233339386236, 0.8745233339386236, 0.8745233339386236, 0.8745233339386236],
        "train": [0.8752812802753529, 0.8752812802753529, 0.8752812802753529, 0.8752812802753529, 0.8752812802753529]
      },
      "train_shifts": {
        "informativeness": [0.08000885349830192, 0.044114873813994475, 0.0707067077145009, 0.0764581546836384, -0.0013491566901247586],
        "invariance": [7.213475204540125e-05, 0.0013104479954751988, 0.00026449409082929384, 0.00040876359491785394, 0.002740785566125694],
        "label_shift": [0.004410807874824522, 0.005675449120732449, -0.0015315283616279696, 0.002172577156869811, 0.010111601086375974],
        "latent_covariate_shift": [0.0, -0.0002043817974609291, -2.40449173489476e-05, -2.40449173489476e-05, 0.0002116818303358362],
        "concept_shift": [0.0008656170245337632, 0.005638533118141612, 0.0017793238837633394, 0.0005169657229855554, 0.010817958275530302],
        "residual": [0.08009689267074453, 0.04413848182158166, 0.07063153387297538, 0.0764042103120739, -0.0019142902137008599],
        "overall": [0.0016484888766800654, -0.0007625649027598255, -0.001724521785259267, 0.0006653458323732236, -0.0010525969388959916]
      },
      "test_shifts": {
        "informativeness": [0.06435213836270345, 0.036298896505803833, 0.05780755040853132, 0.08157982431430423, 0.0025197467457688076],
        "invariance": [0.1854144370861993, 0.06569867539975346, 0.15294527456231247, 0.10562949998885787, -0.005141338897074624],
        "label_shift": [0.01689154063470388, 0.0014431166650595772, -0.00018751912282007692, 0.0311690038426584, 0.016949909907470674],
        "latent_covariate_shift": [0.20090899658789363, 0.0717953416394552, 0.16035192066884885, 0.10496569286702524, -0.002520244686860109],
        "concept_shift": [-0.0016885891080264971, 0.0018056772302633348, 0.003812406216677971, 0.005496622838186217, 0.00603429365350768],
        "residual": [0.0791743251857448, 0.04182274713915421, 0.0685136734432259, 0.08577889112160406, -0.004671093943432678],
        "overall": [0.0022151577991710025, -0.0026567977961013955, -0.009002762651175417, 0.00830522013401995, 0.01395919592129024]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.8754312692936262, 0.8727734948908001, 0.8750846030671707, 0.8727734948908001, 0.8727734948908001],
        "ood_test": [0.8304764179104478, 0.8258053731343283, 0.8291725373134329, 0.8258053731343283, 0.8258053731343283],
        "ood_validation": [0.8303817056396149, 0.828748280605227, 0.8302097661623109, 0.828748280605227, 0.828748280605227],
        "validation": [0.8777919012166334, 0.8745233339386236, 0.8770655529326312, 0.8745233339386236, 0.8745233339386236],
        "train": [0.8780762853773463, 0.8752812802753529, 0.8776646179592232, 0.8752812802753529, 0.8752812802753529]
      },
      "train_shifts": {
        "informativeness": [0.12437200229207489, 0.0032156881370866124, 0.11839186484017264, 0.009752377823397027, 0.1221978516123883],
        "invariance": [9.548388861742088e-05, 0.002874006021885033, 0.0012327267284696925, -0.0005506360697804796, 0.002200109937355507],
        "label_shift": [0.004410807874824522, 0.012883342436454523, -0.00045482261578850945, 0.009361792087369564, -0.005396699799542704],
        "latent_covariate_shift": [-2.954055408841677e-06, 0.006274241842374221, -0.000117223031875912, 0.0016965695996482004, -7.213475204428005e-05],
        "concept_shift": [0.0019250761017325455, 0.013627678667676866, 0.0006169974157123858, 0.01758527437566017, 3.60673760223002e-05],
        "residual": [0.12498033528772105, 0.001999471808317509, 0.11810368315497072, 0.004477580336108178, 0.12255973270583315],
        "overall": [0.0005853139188867068, 0.002544166123402527, -0.0009227032107213262, 0.0022866591778578863, -0.0042143870259272465]
      },
      "test_shifts": {
        "informativeness": [0.12922656467449892, 0.0058039176844795065, 0.14443351064046106, -0.006760883890870169, 0.1415164681393514],
        "invariance": [0.05281667968336548, 0.006878247489146877, 0.14126166378341157, -0.009162877278824049, 0.18175137490020474],
        "label_shift": [0.007387840843629615, 0.024372851224442018, 0.01524371127334314, 0.014089815454213556, 0.01953190552363613],
        "latent_covariate_shift": [0.05939594292171596, 0.008472860767711806, 0.15400860448542633, -0.007929418823853989, 0.19716027687045198],
        "concept_shift": [0.003152080093201185, 0.011505398436626202, 0.0010011907488015098, 0.01744280423156949, -0.003405165059889533],
        "residual": [0.13655129585256032, 0.005097396268071055, 0.1465060521954175, -0.002239914365603969, 0.14720068413832857],
        "overall": [-0.0019172191836719366, 0.007937554449598826, 0.011422189058321736, -0.005580734686459137, 0.013488770277909262]
      }
    }
  },
  "acsincome": {
    "causal": {
      "metrics": {
        "id_test": [0.7054222357229648, 0.7063145504252734, 0.7069600546780073, 0.7080105812069664, 0.7056817031186715],
        "ood_test": [0.6688753935529765, 0.668888566874366, 0.6689544334813137, 0.6712070714389219, 0.670653791940562],
        "ood_validation": [0.6681683461766449, 0.6697095435684647, 0.6678126852400711, 0.6671013633669235, 0.6649673977474807],
        "validation": [0.7038951998228017, 0.7057684397050913, 0.7051482454197386, 0.7055406132329209, 0.7048318197639465],
        "train": [0.7035478351394603, 0.7049116264793853, 0.7047281000345694, 0.7056180450794741, 0.7045255880954622]
      },
      "train_shifts": {
        "informativeness": [0.1718679036487681, 0.13024645537614796, 0.19057280265109677, 0.13261173902882842, 0.13303076781051273],
        "invariance": [1.3514355235639695, 0.9132935686573875, 1.3321451959648132, 1.3124863333515475, 1.1048994404142807],
        "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.010263895879720087, 0.005899605919791813],
        "latent_covariate_shift": [1.3293702248688186, 1.0190398404952061, 1.3136450934974317, 1.3146525860322387, 1.150188898393513],
        "concept_shift": [0.19258727200117567, 0.19534999190602015, 0.20296490720268887, 0.206306249967805, 0.1990923066912761],
        "residual": [0.1299219336477541, 0.1204676984275848, 0.12629463053786863, 0.1322669265483376, 0.12753624089479348],
        "overall": [-0.05777361288007825, -0.030981895318700284, -0.039068848721051166, -0.09659323822320609, -0.06845709448040682]
      },
      "test_shifts": {
        "informativeness": [0.1598080233065291, 0.1501260238293464, 0.16608849141724755, 0.1571395051324067, 0.15098129023112053],
        "invariance": [0.005575458153181658, 0.0009645752065005445, 0.010632924350766732, 0.001291428195788422, 0.0004664085862835156],
        "label_shift": [0.003482233702930959, 0.020133433797550723, 0.005815091689467485, 0.001528955556545339, -0.017871635171740674],
        "latent_covariate_shift": [-0.00017586558052376563, 0.0015196109445873639, 5.915124887616732e-05, 0.0010968721199511725, 0.00010388355676364352],
        "concept_shift": [0.10121928966565305, 0.11474775788387552, 0.09806948547113944, 0.11698896223215985, 0.10296927281499257],
        "residual": [0.15806490620797442, 0.1514432331074121, 0.15768527101583488, 0.13917203085038907, 0.15003183741354204],
        "overall": [-0.050001072749659106, -0.0483468534521847, -0.043010863040368594, -0.03985980709370822, -0.059652263690548046]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.8150883454840017, 0.8203536350749291, 0.8163160692588093, 0.8227647833130822, 0.818284224382341],
        "ood_test": [0.8012145802321139, 0.8096323326000184, 0.8057198561473304, 0.8097377191711346, 0.8030851918694261],
        "ood_validation": [0.7991701244813278, 0.8096028452874926, 0.805334914048607, 0.8111440426793124, 0.8008298755186722],
        "validation": [0.8158719108945354, 0.8206815808625764, 0.8168401734012594, 0.8230547732810176, 0.8186374711261589],
        "train": [0.8166855598703607, 0.8225813469100712, 0.8187288736934618, 0.8261007829143209, 0.8194083961766379]
      },
      "train_shifts": {
        "informativeness": [0.013565340222554649, 0.35861529442661777, 0.027388048965512952, 0.021970085365856096, 0.3057018960934735],
        "invariance": [0.45394308822239143, 0.24109340007343164, 0.44309162136842656, 1.0038522366252571, 0.2795166805570272],
        "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.010263895879720087, 0.005899605919791813],
        "latent_covariate_shift": [0.4537992662313899, 0.26602763276976876, 0.4429490094554673, 1.005309459758822, 0.2796626667493288],
        "concept_shift": [0.0009786887888336507, 0.004304794648284048, 0.001276785111187569, 0.0012745869989879445, 0.0021130537780723966],
        "residual": [0.0029716431269568837, 0.144741772271466, 0.0004139229232727601, 0.0069255564035924635, 0.14785580019838682],
        "overall": [0.01763914417275113, 0.22822944894601566, 0.03364991153092262, 0.020267794969412098, 0.1598123650620972]
      },
      "test_shifts": {
        "informativeness": [0.11416685702058206, 0.4113249936679263, 0.059745959481034366, 0.1765522584074429, 0.31909665799238546],
        "invariance": [0.03080623629339345, 0.00043280851226680154, 0.022903699286114174, 0.031451665420131544, 0.009738191526001994],
        "label_shift": [0.003482233702930959, 0.020133433797550723, 0.005815091689467485, 0.001528955556545339, -0.017871635171740674],
        "latent_covariate_shift": [5.77006211246754e-06, 1.8551026968969317e-06, 3.6158752262676373e-07, 5.466974360165078e-07, 0.0],
        "concept_shift": [0.015065342964483672, 0.013354547095162686, 0.01540076956149031, 0.0170538576291752, 0.015016050883919803],
        "residual": [0.05581318955431302, 0.17622071296674038, 0.022195272446580705, 0.06178652815545725, 0.14584360368199883],
        "overall": [0.03716187971985221, 0.23827824734759498, 0.021306179249146483, 0.09127771985432297, 0.15194011551955544]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.8173729242608343, 0.8235178716079384, 0.8175184791413528, 0.8288337889833941, 0.8239228938841636],
        "ood_test": [0.8018600729802005, 0.8117927573079, 0.8088155866738681, 0.8174441121840049, 0.8104754251689479],
        "ood_validation": [0.79407231772377, 0.8054534676941316, 0.7990515708358032, 0.814226437462952, 0.8045050385299348],
        "validation": [0.8186248140999273, 0.824535645350125, 0.8185235578900737, 0.8292757016738918, 0.8244913457583141],
        "train": [0.8187597251216852, 0.8253753788199408, 0.8190247309795012, 0.8316105315701083, 0.8256213991834656]
      },
      "train_shifts": {
        "informativeness": [0.02125126468837057, 0.3541378715974743, 0.016698496458700054, 0.02268183584451694, 0.3646283889650525],
        "invariance": [0.9540701061692738, 0.2065833346052109, 0.7305136559800648, 0.7602658310779109, 0.18285406567204918],
        "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.010263895879720087, 0.005899605919791813],
        "latent_covariate_shift": [0.9564664052223611, 0.23162637839079436, 0.7312410752411839, 0.760713795395868, 0.18911587454957549],
        "concept_shift": [1.559559645934884e-05, -0.0032981612166185785, 0.0005980028194292245, 4.8427586303460916e-05, 0.0008096052084454385],
        "residual": [0.0071880810214863715, 0.1582103324538484, 0.0017944353256004655, 0.00631890210754053, 0.15766679210624343],
        "overall": [0.022860237862269168, 0.2141393494115642, 0.02235425335470033, 0.021694650042663292, 0.21263750165324538]
      },
      "test_shifts": {
        "informativeness": [0.16634100771919003, 0.4132782304154599, 0.15683556796805362, 0.144114917815865, 0.405767998052652],
        "invariance": [0.02813255329733441, 1.1211992763352213e-15, 0.027772795049114608, 0.026979310793370802, 0.0034252875707721482],
        "label_shift": [0.003482233702930959, 0.020133433797550723, 0.005815091689467485, 0.001528955556545339, -0.017871635171740674],
        "latent_covariate_shift": [2.633591064131417e-06, 1.6594730870896867e-06, 3.6158752262676373e-07, 0.0, -2.171332643537948e-05],
        "concept_shift": [0.00908897875760091, 0.007842020322888556, 0.00905291138157877, 0.009263304408375014, 0.009677944208274565],
        "residual": [0.08144801202115953, 0.19528626387155923, 0.05657743183431616, 0.042136075978034274, 0.18095449553811582],
        "overall": [0.06802466331756035, 0.22413850301777472, 0.08475300955688583, 0.0846220120152305, 0.20931521237592482]
      }
    }
  },
  "acsunemployment": {
    "causal": {
      "metrics": {
        "id_test": [0.966176060483996, 0.966176060483996, 0.966176060483996, 0.966176060483996, 0.966176060483996],
        "ood_test": [0.9484875711290806, 0.9484875711290806, 0.9484875711290806, 0.9484875711290806, 0.9484875711290806],
        "ood_validation": [0.9493949394939494, 0.9493949394939494, 0.9493949394939494, 0.9493949394939494, 0.9493949394939494],
        "validation": [0.9665910612032423, 0.9665910612032423, 0.9665910612032423, 0.9665910612032423, 0.9665910612032423],
        "train": [0.9659411858574622, 0.9659411858574622, 0.9659411858574622, 0.9659411858574622, 0.9659411858574622]
      },
      "train_shifts": {
        "informativeness": [0.048411915914121605, 0.005205213231987773, 0.045755384860778965, 0.017546878533588852, 0.0047504548677936315],
        "invariance": [0.20295843908247396, 0.09118494232923813, 0.19260515057613478, 0.17463556085105741, 0.1401452428860144],
        "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.012053198707288836, 0.0023029623296704467],
        "latent_covariate_shift": [0.17843126751743726, 0.08942751650694739, 0.1686812858173309, 0.16455977973897032, 0.13968244297595572],
        "concept_shift": [0.1279842227805221, 0.11582024254792195, 0.1249494833516479, 0.13488457442733803, 0.12980572414654945],
        "residual": [0.005776214031321102, 0.007014476574076057, 0.005934345618193201, 0.002873447161597259, 0.0073466321808556565],
        "overall": [-0.02988105633333686, -0.06024634201518392, -0.031073884814215833, -0.051780147044076553, -0.06657895817653087]
      },
      "test_shifts": {
        "informativeness": [0.05675278920531505, 0.0035600114830030174, 0.05685695467824684, 0.03421058827503249, 0.008465389191330802],
        "invariance": [0.36211163286158515, 0.1836913308667624, 0.3777953878680542, 0.34358915529981165, 0.2878792692284804],
        "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.0007397423303629399, 0.0016138361148074567, 0.0008066292787259027],
        "latent_covariate_shift": [0.3384944394587556, 0.19084355287514573, 0.3483959826995014, 0.33227477907728, 0.29325333317248947],
        "concept_shift": [0.12251417672663083, 0.1317707600674984, 0.124640413539784, 0.1203568444391745, 0.12398020891905122],
        "residual": [0.010463533872941638, 0.009852745119315401, 0.007899545893180688, 0.010619458405314057, 0.009067689380194258],
        "overall": [-0.03247180968673971, -0.06435975164542762, -0.027692629403920796, -0.04143756240373093, -0.05950205803702159]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.9717039010937936, 0.9716977039630651, 0.9716977039630651, 0.9717039010937936, 0.9717039010937936],
        "ood_test": [0.960375524873022, 0.9603510766391012, 0.9603510766391012, 0.960375524873022, 0.960375524873022],
        "ood_validation": [0.961001100110011, 0.9608910891089109, 0.961001100110011, 0.961001100110011, 0.961001100110011],
        "validation": [0.9722614709600654, 0.9722614709600654, 0.9722490766217992, 0.9722614709600654, 0.9722614709600654],
        "train": [0.9713745454770806, 0.9713722215422561, 0.9713706722523732, 0.971378418701788, 0.971378418701788]
      },
      "train_shifts": {
        "informativeness": [0.09721084566798768, 0.03703574862057232, 0.03938262203272573, 0.1039616802202839, 0.05914652536084764],
        "invariance": [0.3016213204957619, 0.18507615768814092, 0.2957021550478427, 0.33390222920851736, 0.2302938416173794],
        "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.012053198707288836, 0.0023029623296704467],
        "latent_covariate_shift": [0.28526159800817613, 0.18617560812357975, 0.2932824157606681, 0.31673330549292744, 0.22731444084894545],
        "concept_shift": [0.00402188058336833, 0.0032357693074180007, 0.00496484004620829, 0.005419870292281694, 0.0027501184236719944],
        "residual": [0.002505895809828025, 0.01763066888864246, 0.0010060837424637494, 0.005544061501207053, 0.018531073047303823],
        "overall": [0.08825308727932465, 0.01868867580795098, 0.03822599862199483, 0.09314982106878546, 0.03890217388232607]
      },
      "test_shifts": {
        "informativeness": [0.09909773969413235, 0.08182754915836019, 0.042202258565511505, 0.11119994274796735, 0.11106309903979804],
        "invariance": [0.32889572204883155, 0.10829146709363861, 0.2857833511657893, 0.3370519638492013, 0.2459270838837291],
        "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.0007397423303629399, 0.0016138361148074567, 0.0008066292787259027],
        "latent_covariate_shift": [0.31133307326691656, 0.10822665165741709, 0.2838835913609002, 0.3188486049335047, 0.24610704340681225],
        "concept_shift": [0.01988210802974708, 0.01991619274380011, 0.02070641562125208, 0.021387409580545177, 0.02099663296556875],
        "residual": [0.01200594044059092, 0.030350826488445316, 0.004530890373759508, 0.009851306060764354, 0.030641152314669937],
        "overall": [0.06267404089332745, 0.04572846960034636, 0.026738151643862878, 0.08236017049648585, 0.07041692464324825]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.9721872772906145, 0.971617141263595, 0.972063334676045, 0.9729433272394881, 0.9715737613484956],
        "ood_test": [0.9609194980777576, 0.9601738269431762, 0.9603021801712599, 0.9615307039257751, 0.9602777319373392],
        "ood_validation": [0.9609460946094609, 0.961001100110011, 0.9608910891089109, 0.9627612761276128, 0.9601210121012101],
        "validation": [0.9727200614759178, 0.9721623162539352, 0.9730609057782404, 0.9736744255224213, 0.9727572444907167],
        "train": [0.9720655287648906, 0.971290109178458, 0.9723606684875987, 0.9735311569941917, 0.9720841202434864]
      },
      "train_shifts": {
        "informativeness": [0.027024873170535327, 0.12311850056815976, 0.02603586171779666, 0.05082723967073804, 0.2229989943736497],
        "invariance": [0.20803658649418624, 0.0761086408010005, 0.20445331310573683, 0.268422783988718, 0.1851891711516039],
        "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.012053198707288836, 0.0023029623296704467],
        "latent_covariate_shift": [0.20867892614861622, 0.07722377708166553, 0.2040287801843673, 0.2687907751516348, 0.18044768202429248],
        "concept_shift": [0.001298425536800725, 0.0023815078023522772, 0.0007477969295277, 0.0009377517765780433, 0.0027730443694765914],
        "residual": [0.0032412147263165244, 0.1013752078674185, 0.001773571425028898, 0.008591872511527718, 0.07744066366466588],
        "overall": [0.027194554459675467, 0.021461862451908356, 0.027217875365743428, 0.047977086206024123, 0.14295254512542505]
      },
      "test_shifts": {
        "informativeness": [0.03494862341423756, 0.17343555567532198, 0.03374674907626997, 0.05743753887157996, 0.2324448131079106],
        "invariance": [0.28946826479380944, 0.11825868439354456, 0.27229175190815447, 0.3184996678649902, 0.22292796984056848],
        "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.0007397423303629399, 0.0016138361148074567, 0.0008066292787259027],
        "latent_covariate_shift": [0.29052581934099003, 0.12302621356306931, 0.27133226710196023, 0.31797564267892314, 0.21609404290317769],
        "concept_shift": [0.012962614942387207, 0.011338843538418247, 0.012511600992700756, 0.011700743404937385, 0.016477048294880135],
        "residual": [0.005953708004288548, 0.12390540364155193, 0.0032154790459841334, 0.0115713632699926, 0.10492316464516674],
        "overall": [0.017347005257962757, 0.050486745869765606, 0.024165598296019816, 0.04056070936348887, 0.11626947548597136]
      }
    }
  },
  "assistments": {
    "causal": {
      "metrics": {
        "id_test": [0.9252230216906883, 0.9248928970686434, 0.7361178845013993, 0.924934162646399, 0.924971676807995],
        "ood_test": [0.45120671563483733, 0.45120671563483733, 0.44123819517313745, 0.45120671563483733, 0.45120671563483733],
        "ood_validation": [0.5518867924528302, 0.5518867924528302, 0.5424528301886793, 0.5518867924528302, 0.5518867924528302],
        "validation": [0.9239925571903393, 0.9236886924814117, 0.7341859051792051, 0.9238987717863494, 0.9237899807177209],
        "train": [0.924134570926685, 0.9237824064044237, 0.7349035838250038, 0.9241336330717655, 0.9239301185542403]
      },
      "train_shifts": {
        "informativeness": [0.2950872389088904, 0.16966882570974398, 0.28073204270386026, 0.2692035763186002, 0.2747725738073597],
        "invariance": [1.801567089607421, 1.5822847294799798, 1.6465590805321855, 1.7486708648577305, 1.7172446640541097],
        "label_shift": [0.02660028896165906, 0.020116183344292597, 0.002728217550262214, 0.0028693142637778875, 0.011104698698886382],
        "latent_covariate_shift": [1.8302954872804247, 1.600634891768931, 1.6691617706047046, 1.776970363690949, 1.7509989580258114],
        "concept_shift": [0.16497451775565242, 0.039364803599831195, 0.15652865617095402, 0.14586010872577868, 0.16671157907509168],
        "residual": [0.09339141505420312, 0.06301232642139874, 0.4520296757553602, 0.10638945839089921, 0.1251728161324338],
        "overall": [0.14687290829419236, 0.10620727030505157, -0.23689650732558615, 0.10546847011330994, 0.0886734644726741]
      },
      "test_shifts": {
        "informativeness": [0.21060237189684203, 0.22671978618517297, 0.1908902293017781, 0.1960904534638523, 0.19837947681244625],
        "invariance": [2.017709468028407, 2.0575245189068503, 1.985133230212082, 2.0058035404989023, 2.0048496891971053],
        "label_shift": [0.03028352221961338, -0.010147600388304819, 0.0581604663676183, 0.06362962438809754, 0.04971835036639412],
        "latent_covariate_shift": [2.057787514975451, 2.0780314770528903, 2.053481215415157, 2.0538974560523613, 2.0445989444702706],
        "concept_shift": [0.01812104838009579, -0.01794576364042863, 0.03852041577884726, -0.006425447526620444, 0.017880166494492908],
        "residual": [0.2483551694633307, 0.29348202325282297, 0.24832901150402345, 0.25997952730233653, 0.26515950641910296],
        "overall": [-0.01163253717320789, -0.05260967636856806, -0.013444764306322382, -0.0048145801043956715, -0.03098631003412347]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.9255794062258502, 0.6952874710203102, 0.9267460966514859, 0.9263597007870471, 0.9249116541494414],
        "ood_test": [0.5241343126967472, 0.43651626442812175, 0.5110178384050367, 0.4947534102833158, 0.45120671563483733],
        "ood_validation": [0.6273584905660378, 0.5424528301886793, 0.589622641509434, 0.5801886792452831, 0.5518867924528302],
        "validation": [0.9246453036021098, 0.6932016836355724, 0.9256244232197655, 0.9252530330199651, 0.9237224552268481],
        "train": [0.9248782898778256, 0.6938775893002008, 0.92566843264748, 0.9253969236482932, 0.9238002256478937]
      },
      "train_shifts": {
        "informativeness": [0.1254692874329971, -0.04124620414986012, 0.14429105357567504, 0.14826293095942691, 0.14263468805844662],
        "invariance": [0.9831466377940461, 0.6200106669394713, 1.0105571651870437, 1.034690165344964, 1.0207648843362622],
        "label_shift": [0.02660028896165906, 0.008994641022265475, 0.008013446810794996, 0.013719680027550923, 0.022026949079901596],
        "latent_covariate_shift": [0.9764258645957277, 0.6187455227861055, 1.0063030433835924, 1.0274203973350169, 1.012869114551103],
        "concept_shift": [0.06502240311529188, -0.08450842155372404, 0.07379347904783272, 0.07421691807814784, 0.06401948051778267],
        "residual": [0.08383207812940957, 0.14254468602604148, 0.05729796259836891, 0.059167880739352634, 0.06542208033983092],
        "overall": [0.019065765627611947, -0.13767193096458974, 0.05197601395706162, 0.055211547189802236, 0.05226845710709553]
      },
      "test_shifts": {
        "informativeness": [0.23493775144500065, 0.39533671523885894, 0.2344893544013695, 0.23539104769193897, 0.22728317700464204],
        "invariance": [1.9289583240815382, 1.953425804466138, 1.8176697243979687, 1.884742699244707, 1.9043866631543336],
        "label_shift": [0.02329921323212632, 0.03554938134553872, 0.03995998694127803, 0.07289301982336613, 0.05781653169929162],
        "latent_covariate_shift": [1.925451003284749, 2.0055204733862966, 1.8303350146310473, 1.901389457421388, 1.9227235470852473],
        "concept_shift": [0.05912436961298669, -0.08738764583345811, 0.11265416402319804, 0.10790537830217627, 0.1201761967238418],
        "residual": [0.26578741857362664, 0.47633126988323476, 0.279573300577518, 0.25462998851522867, 0.3125556134584299],
        "overall": [-0.05051590571745082, 0.006521293405201967, -0.07509838960056914, -0.02842174097435418, -0.10728382700060612]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.9277177134368224, 0.9250316994665486, 0.9272750463299896, 0.9250504565473466, 0.9248328744100898],
        "ood_test": [0.5246589716684156, 0.45120671563483733, 0.49737670514165794, 0.4527806925498426, 0.45120671563483733],
        "ood_validation": [0.5990566037735849, 0.5518867924528302, 0.5754716981132075, 0.5518867924528302, 0.5518867924528302],
        "validation": [0.9267761079807627, 0.9238500033762745, 0.9262021413083439, 0.9238349977116361, 0.9236099127420602],
        "train": [0.926845909498876, 0.9240342204503017, 0.9262386484385184, 0.9239559095645258, 0.9237017508813492]
      },
      "train_shifts": {
        "informativeness": [0.03388800383257744, 0.13701645366248658, 0.11862656258655306, 0.08854318301529236, -0.12111113535858524],
        "invariance": [0.7055535437708127, 0.9190244510800815, 0.7360356133634647, 0.7166805621630118, 0.43622565529682117],
        "label_shift": [0.02660028896165906, 0.008994641022265475, 0.013129028217462604, 0.0211731107553786, 0.012062690606101012],
        "latent_covariate_shift": [0.705358204095572, 0.9094480126703717, 0.7275009625398156, 0.7129568017959902, 0.4380624430082341],
        "concept_shift": [-0.07171042726853061, -0.0002460207643562972, -0.009822704359131029, -0.019800143698283396, -0.16536788803556604],
        "residual": [0.00841933579411013, 0.05259003265877668, 0.03705564629925568, 0.03469927005072719, -0.07603355019501336],
        "overall": [0.07452635631594186, 0.08425853269216585, 0.08877945716376964, 0.07246866000788538, 0.044556098012968115]
      },
      "test_shifts": {
        "informativeness": [0.17320595807102926, 0.21161017449031994, 0.20161576775082055, 0.18799142154565174, 0.03086749123413199],
        "invariance": [1.7480416252697746, 1.8941280085272698, 1.8345941327009399, 1.8307153581160722, 1.668783259093727],
        "label_shift": [0.02329921323212632, 0.08065473411469921, 0.04682927533503343, 0.051937242309833785, 0.04867987076511506],
        "latent_covariate_shift": [1.7320660176731688, 1.8865950822564637, 1.835725505969248, 1.8211146576312998, 1.638627635455749],
        "concept_shift": [-0.01754799581913684, -0.004697998778225648, -0.008865441198630116, -0.00913894287756465, -0.062067677519881785],
        "residual": [0.18986599839529394, 0.26424015910309273, 0.2288949454139233, 0.235546222765144, 0.06709860838947591],
        "overall": [-0.004224239596935991, -0.013720081301713427, 0.001133867237883196, -0.021817058868179223, 0.004064845168165479]
      }
    }
  },
  "acspubcov": {
    "causal": {
      "metrics": {
        "id_test": [0.7762120044250792, 0.7762120044250792, 0.7762120044250792, 0.7759084791386271, 0.7762120044250792],
        "ood_test": [0.36373806819362814, 0.3637295094494649, 0.3637344001604153, 0.3692743529895082, 0.36497908609729823],
        "ood_validation": [0.3601500946344469, 0.3601500946344469, 0.3601721026453629, 0.3659602095162639, 0.3616246313658172],
        "validation": [0.7770881882499536, 0.7770881882499536, 0.7770881882499536, 0.776842571902688, 0.7770881882499536],
        "train": [0.7760952951251907, 0.7760952951251907, 0.7760952951251907, 0.7756761998567737, 0.7760955447352373]
      },
      "train_shifts": {
        "informativeness": [0.022481936513937657, 0.032128509116110975, 0.025253458643589428, 0.03295853574992024, 0.023238136931499394],
        "invariance": [0.0010435427186230954, 0.0020030455241855233, 0.0012123020093198246, 0.0012525082987172378, 0.0016453462395537074],
        "label_shift": [0.016856964365221407, 0.014266508443450773, 0.010231313700030983, 0.014340910522279886, 0.0010940161339568542],
        "latent_covariate_shift": [-0.0007961755945367298, 0.0013622763871742587, 0.0019285951370480523, 0.001212145479443743, 0.0008496471970806619],
        "concept_shift": [0.017397349788036538, 0.019276258946981144, 0.026030721611703077, 0.0273478390154345, 0.03996448840132267],
        "residual": [0.024546288197159188, 0.025559877916422304, 0.02605221394598297, 0.022953899786860684, 0.017959340433344184],
        "overall": [-0.0032544035512090085, 0.0037433713794178536, -0.008340312694365477, 0.0034809903068455, -0.014554289156764221]
      },
      "test_shifts": {
        "informativeness": [0.05372996987496215, 0.046660490358907895, 0.05579306672307077, 0.05308609884924334, 0.04750729805098804],
        "invariance": [-0.00015842030562807012, 0.0006407340060707073, 0.0013555380610761557, 0.0009409745407953138, 0.000490468779722736],
        "label_shift": [-0.003372463110508083, 0.0056231408750471255, -0.004425513714821594, 0.013358719622242665, 0.0014782845574131001],
        "latent_covariate_shift": [0.0005333523056212189, 0.0011764739903047379, 0.0013870150071194753, 0.0009439688264168433, -0.00029020913313400495],
        "concept_shift": [0.11229525542346866, 0.14621646767277854, 0.11943459602371427, 0.13010098868981607, 0.142246377800197],
        "residual": [0.05256220420674637, 0.04711601683660617, 0.05861422880398117, 0.0634160445749854, 0.052380795227598455],
        "overall": [-0.05632020729314795, -0.07048431988444696, -0.06473547847715667, -0.06869958311671799, -0.07564788275443074]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.7872008179207719, 0.7997172422331473, 0.7906254617777796, 0.7999648549668319, 0.7970514115922697],
        "ood_test": [0.5295233879911038, 0.6312734066369393, 0.5703669378158329, 0.6123439099033229, 0.5935330129102542],
        "ood_validation": [0.5286324222016814, 0.6314978652229412, 0.568653990052379, 0.6141445486156961, 0.5936991064747568],
        "validation": [0.7879871640497543, 0.8010986838558172, 0.7914497554819372, 0.8009748772417484, 0.7978317867490979],
        "train": [0.7868499935975023, 0.7999992012478505, 0.790600384549238, 0.800103538247373, 0.7967475311694305]
      },
      "train_shifts": {
        "informativeness": [0.10434172190656288, 0.11686709771254929, 0.10305807688406163, 0.06558631349568658, 0.1143694772317869],
        "invariance": [0.018210270520053293, 0.0012546161253972415, 0.015216652584329029, 0.053830613071464736, 0.0007216761601944693],
        "label_shift": [0.016856964365221407, 0.014266508443450773, 0.010231313700030983, 0.014340910522279886, 0.0010940161339568542],
        "latent_covariate_shift": [0.0001214037341690418, 9.266030738507814e-05, 0.00020380920217192842, -3.860634227398225e-05, -0.00012495880056184554],
        "concept_shift": [0.06280451391199049, 0.0612474266512518, 0.0626920085571089, 0.05638781498845819, 0.05762699622411795],
        "residual": [0.10501860778671046, 0.08301722079652406, 0.09092065963478273, 0.055796459485994085, 0.08284261308857657],
        "overall": [-0.03269509404647425, 0.009778439903118635, -0.02159935187033861, -0.03816820793026601, 0.002837056617751618]
      },
      "test_shifts": {
        "informativeness": [0.2178020924678375, 0.20873247813743342, 0.21582637386916997, 0.14138726113076402, 0.20634797734005225],
        "invariance": [0.028243390112120115, 0.0021640425613346486, 0.022694813249826876, 0.057999780159956243, 0.0005739110089949735],
        "label_shift": [-0.003372463110508083, 0.0056231408750471255, -0.004425513714821594, 0.013358719622242665, 0.0014782845574131001],
        "latent_covariate_shift": [1.0367668448506073e-05, 2.7385515821148096e-06, 1.0616635824606632e-05, 9.851336638289288e-07, 2.4924047597511518e-05],
        "concept_shift": [0.015728982683292137, 0.012922940828763942, 0.017081509284125912, 0.013388209979449997, 0.012995213815753926],
        "residual": [0.2168621730287751, 0.11898950222283763, 0.17905053070734803, 0.09290610215741539, 0.12633816787241567],
        "overall": [-0.022727314679673538, 0.08501242393286113, 0.0146802333553471, 0.019467016281598762, 0.07397685135776746]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.7762120044250792, 0.8066384175150065, 0.7888302694585668, 0.8085993506156371, 0.8027664732358591],
        "ood_test": [0.3637295094494649, 0.6514451439519634, 0.4348734589675465, 0.635554001396298, 0.6246061449337736],
        "ood_validation": [0.3601500946344469, 0.650699854747128, 0.43297460275540295, 0.635756415335182, 0.6253246181610106],
        "validation": [0.7770881882499536, 0.8075466121917565, 0.7894828278229405, 0.8095135398507531, 0.8040780301169573],
        "train": [0.7760952951251907, 0.806943103137124, 0.7887999472823581, 0.8093660678604849, 0.8032798260916882]
      },
      "train_shifts": {
        "informativeness": [0.08278633818599189, 0.15386071379351168, 0.06992707656848417, 0.002170898531065705, 0.14159719775999619],
        "invariance": [0.06629183712884826, 0.016013914953867173, 0.0767513761752945, 0.004111680866532773, 0.01698880034098671],
        "label_shift": [0.016856964365221407, 0.014266508443450773, 0.010231313700030983, 0.014340910522279886, 0.0010940161339568542],
        "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, -0.00014296113730723886],
        "concept_shift": [0.002596851073600649, 0.002668985825644929, 0.0036788723542670924, 0.003137861713933871, 0.0031358224670168452],
        "residual": [0.08185726986944304, 0.10622069030803197, 0.06606567599786448, 0.0016611467129033777, 0.11200239776957636],
        "overall": [-0.0250867936020649, 0.04543182731744905, -0.03123806684414561, 0.004055435789068949, 0.020008016084742883]
      },
      "test_shifts": {
        "informativeness": [0.1413406810468876, 0.21570228107467715, 0.12019235026595028, 0.0007158410090273746, 0.2206519323352521],
        "invariance": [0.05954723781269142, 0.010503706064044811, 0.0733971102052265, 0.0010459539046444634, 0.010421358718748447],
        "label_shift": [-0.003372463110508083, 0.0056231408750471255, -0.004425513714821594, 0.013358719622242665, 0.0014782845574131001],
        "latent_covariate_shift": [0.0, -4.272618348960599e-05, 0.0, 0.0, -0.0002645932154001317],
        "concept_shift": [0.002019773057244807, 0.0022215567945783323, 0.003967411362445173, 0.0020558404332672673, 0.006495778132843432],
        "residual": [0.14029549469234767, 0.12718757844308762, 0.11999435325824034, 0.000501790113418165, 0.16030256458258577],
        "overall": [-0.031424550635682225, 0.08494227854805672, -0.040697020633536696, 0.005342513537774677, 0.0524976449978769]
      }
    }
  },
  "brfss_blood_pressure": {
    "causal": {
      "metrics": {
        "id_test": [0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787],
        "ood_test": [0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039],
        "ood_validation": [0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197],
        "validation": [0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545],
        "train": [0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175]
      },
      "train_shifts": {
        "informativeness": [0.10500304144276773, 0.09430098215284434, 0.18923051820221856, 0.3309559329614426, 0.09502800530120528],
        "invariance": [0.06914424136512179, 0.054724994706783256, 0.15612168466488935, 0.2836982363574245, 0.06129984823319716],
        "label_shift": [0.01572578048184541, 0.008211379500363864, 0.0112941417497322, 0.010374680490893433, 0.009249445547397478],
        "latent_covariate_shift": [0.0651181686508618, 0.04956122718613834, 0.16661469125271064, 0.3189019192589373, 0.06479103626360397],
        "concept_shift": [0.08580927663630009, 0.07964670845097789, 0.06866522845415705, 0.06485865648836785, 0.0702960533467498],
        "residual": [0.10073837538573467, 0.0891482704374276, 0.20490414501027576, 0.34120337220399616, 0.10751779116484424],
        "overall": [-0.03279011837732426, -0.033146836520212726, -0.039112666866358975, -0.0198875857905344, -0.04126749574811171]
      },
      "test_shifts": {
        "informativeness": [0.07211583183758163, 0.0692838591307992, 0.16021320841965825, 0.2753215326348832, 0.07135438027535694],
        "invariance": [0.04041303011200097, 0.028533069304893455, 0.13501825802538242, 0.24187678607222748, 0.049548684306098996],
        "label_shift": [0.02105310105154427, 0.013225881376363912, 0.01408512517399938, 0.021910057144686475, 0.04092514965315884],
        "latent_covariate_shift": [0.04690607995310796, 0.04731910963076007, 0.14784076963407097, 0.2731934135543494, 0.05607533303692873],
        "concept_shift": [0.08214690919459713, 0.08970215785636998, 0.08908435893038096, 0.08609900821123709, 0.11327885353113872],
        "residual": [0.08284371695429918, 0.06283147603282546, 0.18737164060533035, 0.3132108289072826, 0.08529624666696198],
        "overall": [-0.03802826426769047, -0.022392734979095996, -0.05824679325951862, -0.05432545806461375, -0.046855393965180105]
      }
    },
    "arguablycausal": {
      "metrics": {
        "id_test": [0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787],
        "ood_test": [0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039],
        "ood_validation": [0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197],
        "validation": [0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545],
        "train": [0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175]
      },
      "train_shifts": {
        "informativeness": [0.10264874625797453, 0.11199137854434577, 0.0877481692518773, 0.10050509838757557, -0.005802809465974606],
        "invariance": [0.085598189377328, 0.08545728109264214, 0.04814065644414719, 0.07575268530344402, 0.0026044088795300568],
        "label_shift": [0.01572578048184541, -0.0008104149368126157, 0.0049205434726238275, 0.017000894207686173, 0.011398482574945381],
        "latent_covariate_shift": [0.08108494491500799, 0.06888306809722614, 0.05023662028899148, 0.08046333707874564, -0.00390807345779779],
        "concept_shift": [0.13584277551833154, 0.12907390690076792, 0.15915930133092604, 0.1484941971343243, 0.004637412459141314],
        "residual": [0.09286424934798851, 0.0966922249821946, 0.08057236067563711, 0.10067130692461926, -0.0018924817071443324],
        "overall": [-0.05253062283941705, -0.0579301138543471, -0.06889558843048878, -0.06355753411271195, -0.0037860338695921633]
      },
      "test_shifts": {
        "informativeness": [0.088473217562582, 0.08935724992686368, 0.07622325238264821, 0.08261287178845028, -0.006317462147432825],
        "invariance": [0.0670503934456645, 0.05822749259112841, 0.0475672747896483, 0.05337623097937207, 0.008164729594555801],
        "label_shift": [0.02338099646990692, 0.030666571022639973, 0.015336765161332633, 0.010559339578347192, 0.008388096020157757],
        "latent_covariate_shift": [0.06474711951761543, 0.050143461550361534, 0.05031246763843325, 0.05395977275614133, 0.0035209279975373783],
        "concept_shift": [0.13396917139529205, 0.11827551938579962, 0.14555165276333648, 0.14755500771439617, 0.03235457929557603],
        "residual": [0.08837761227654588, 0.07910327273612397, 0.08260188594510473, 0.08624811855774898, 0.015055894260508214],
        "overall": [-0.05635011914068097, -0.03759251251122355, -0.07011348093906597, -0.07184130994893857, -0.035678498844159384]
      }
    },
    "all": {
      "metrics": {
        "id_test": [0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787, 0.5980334171225787],
        "ood_test": [0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039, 0.4157073938244039],
        "ood_validation": [0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197, 0.4164859002169197],
        "validation": [0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545, 0.5977967542789545],
        "train": [0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175, 0.5987865681504175]
      },
      "train_shifts": {
        "informativeness": [0.10536870180776113, -0.004329677862359069, 0.0029439205994273515, 0.10409453536868639, 0.09457303364820008],
        "invariance": [0.08355828349228442, 0.0019304852241900895, 0.0034327365095360774, 0.07405463343613135, 0.06364602219541633],
        "label_shift": [0.01572578048184541, -0.0008104149368126157, 0.018520977507375518, 0.009984346588189993, 0.01771183757947461],
        "latent_covariate_shift": [0.08145625388415952, -0.0002945532714180931, 0.007695550337498453, 0.07639471836586013, 0.05962384342613505],
        "concept_shift": [0.021672945000593503, 0.011961441859362787, 0.004638218550109795, 0.015987349672972207, 0.02066300165556128],
        "residual": [0.09903654408977484, -0.0006364504787409042, 0.006246125258599191, 0.10047872767678721, 0.09069006258082078],
        "overall": [0.0023075606545497895, -0.011191675029509957, 0.00577058173344221, 0.0017843486143724469, 0.00039629964469532764]
      },
      "test_shifts": {
        "informativeness": [0.08513788804278219, -0.0014449100771723369, -0.0006988392126490716, 0.07446162323394266, 0.07118553381909445],
        "invariance": [0.05793842488894905, 0.005948546364966386, -8.195201065849072e-05, 0.04444127337748899, 0.048433980805903526],
        "label_shift": [0.02338099646990692, 0.032872081558980644, 0.006125859055219596, 0.018319849352237984, 0.016569556207142698],
        "latent_covariate_shift": [0.05959542808648237, 0.0008066622959790213, 0.007371452015472859, 0.05408147359903369, 0.048569410922523044],
        "concept_shift": [0.01741941012400651, 0.020383777881350665, 0.02489856291308646, 0.011593450054722263, 0.022959937818610138],
        "residual": [0.0877868020113899, -0.0035583715220396193, 0.0007973829265491145, 0.07818998196079381, 0.07031306970628333],
        "overall": [0.001160380803109165, 0.00578667124918859, -0.007155872055065943, 0.004454941032679072, -0.0022550116346128357]
      }
    }
  }
  }