{
    "diabetes_readmission": {
      "causal": {
        "metrics": {
          "train": [0.5079131075749035, 0.4473398950700256, 0.5623726314876643, 0.4473398950700256, 0.5623726314876643],
          "validation": [0.5, 0.4540363975734951, 0.5730284647690154, 0.4540363975734951, 0.5730284647690154],
          "id_test": [0.5068812689526475, 0.43946815955213436, 0.5798926988570096, 0.43946815955213436, 0.5798926988570096],
          "ood_validation": [0.5192443502824858, 0.4758121468926554, 0.490819209039548, 0.4758121468926554, 0.490819209039548],
          "ood_test": [0.5088879296813688, 0.4747292418772563, 0.5026094804583268, 0.4747292418772563, 0.5026094804583268]
        },
        "train_shifts": {
          "informativeness": [0.013930184584516773, 0.03321147750125085, 0.03909932838908589, 0.03321147750125085, 0.03909932838908589],
          "invariance": [0.3379085839667757, 0.36492551011180785, 0.28445717501327966, 0.36492551011180785, 0.28445717501327966],
          "label_shift": [0.003375592508434266, -0.0031805683642138712, -0.01792304390607593, -0.0031805683642138712, -0.01792304390607593],
          "latent_covariate_shift": [0.35914969827271015, 0.36777776243143034, 0.3083676258327805, 0.36777776243143034, 0.3083676258327805],
          "concept_shift": [0.28054265584890864, 0.26027281484790976, 0.21959813806112338, 0.26027281484790976, 0.21959813806112338],
          "residual": [0.019475988393152, 0.02006133857385319, 0.0301937077922332, 0.02006133857385319, 0.0301937077922332],
          "overall": [-0.1335087783259052, -0.1171504265188529, -0.09789974497699655, -0.1171504265188529, -0.09789974497699655]
        },
        "test_shifts": {
          "informativeness": [0.015592921296414214, 0.01693333411297499, 0.008724273671343485, 0.01693333411297499, 0.008724273671343485],
          "invariance": [0.0014041605909918154, 0.0014809578782016186, 0.0011515141093306777, 0.0014809578782016186, 0.0011515141093306777],
          "label_shift": [-0.006770410690669257, -0.004868900844769146, 0.0057945710351309035, -0.004868900844769146, 0.0057945710351309035],
          "latent_covariate_shift": [0.0010381955149893422, 0.001085353373759695, 0.0011324596206238784, 0.001085353373759695, 0.0011324596206238784],
          "concept_shift": [0.06294521400084924, 0.04892636945092059, 0.05554990411509256, 0.04892636945092059, 0.05554990411509256],
          "residual": [0.024947030640622314, 0.023401810050028428, 0.004193013574069032, 0.023401810050028428, 0.004193013574069032],
          "overall": [-0.04439490422796859, -0.03356391333711927, -0.020355933687059773, -0.03356391333711927, -0.020355933687059773]
        }
      },
      "arguablycausal": {
        "metrics": {
          "train": [0.5638468542687421, 0.5638468542687421, 0.5638468542687421, 0.5638468542687421, 0.5638468542687421],
          "validation": [0.5781614559029398, 0.5781614559029398, 0.5781614559029398, 0.5781614559029398, 0.5781614559029398],
          "id_test": [0.5838581758805692, 0.5838581758805692, 0.5838581758805692, 0.5838581758805692, 0.5838581758805692],
          "ood_validation": [0.4936440677966102, 0.4936440677966102, 0.4936440677966102, 0.4936440677966102, 0.4936440677966102],
          "ood_test": [0.5061607283001098, 0.5061607283001098, 0.5061607283001098, 0.5061607283001098, 0.5061607283001098]
        },
        "train_shifts": {
          "informativeness": [0.04871542390217662, 0.04491268823165321, 0.05948771138433977, 0.04491268823165321, 0.05948771138433977],
          "invariance": [0.2729895033457268, 0.33013643354665473, 0.4235834299567149, 0.33013643354665473, 0.4235834299567149],
          "label_shift": [0.003375592508434266, 8.713826765839446e-05, 0.0013420918373664278, 8.713826765839446e-05, 0.0013420918373664278],
          "latent_covariate_shift": [0.3136090818548045, 0.3640465855742524, 0.4430178715833664, 0.3640465855742524, 0.4430178715833664],
          "concept_shift": [0.0036410820265144308, 0.007866757213481273, 0.001154015420276528, 0.007866757213481273, 0.001154015420276528],
          "residual": [0.04326503318756341, 0.05860343417689499, 0.044032063626140386, 0.05860343417689499, 0.044032063626140386],
          "overall": [0.025627435210111994, -0.0006254794043543954, 0.025266906780070097, -0.0006254794043543954, 0.025266906780070097]
        },
        "test_shifts": {
          "informativeness": [0.07805450992107658, 0.05460145329068601, 0.06691442593790269, 0.05460145329068601, 0.06691442593790269],
          "invariance": [1.1211992763352213e-15, 0.00021640425613396138, 0.0060593191717334596, 0.00021640425613396138, 0.0060593191717334596],
          "label_shift": [0.003414277603891494, -0.0046583752649079465, 0.010913871092375347, -0.0046583752649079465, 0.010913871092375347],
          "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
          "concept_shift": [0.001550897168956346, 0.0014426950408896054, 0.001406627664867145, 0.0014426950408896054, 0.001406627664867145],
          "residual": [0.07812320968492817, 0.05452717006071516, 0.0669212475610432, 0.05452717006071516, 0.0669212475610432],
          "overall": [0.0008629904536154309, -0.00308445405099491, 0.0017171405047468474, -0.00308445405099491, 0.0017171405047468474]
        }
      },
      "all": {
        "metrics": {
          "train": [0.5638468542687421, 0.43615314573125785, 0.5638468542687421, 0.43615314573125785, 0.5638468542687421],
          "validation": [0.5781614559029398, 0.4218385440970602, 0.5781614559029398, 0.4218385440970602, 0.5781614559029398],
          "id_test": [0.5838581758805692, 0.41614182411943085, 0.5838581758805692, 0.41614182411943085, 0.5838581758805692],
          "ood_validation": [0.4936440677966102, 0.5063559322033898, 0.4936440677966102, 0.5063559322033898, 0.4936440677966102],
          "ood_test": [0.5061607283001098, 0.4938392716998901, 0.5061607283001098, 0.4938392716998901, 0.5061607283001098]
        },
        "train_shifts": {
          "informativeness": [-0.4619406094689947, 0.051998730151658526, 0.07350357743784808, 0.051998730151658526, 0.07350357743784808],
          "invariance": [-0.46133146087185006, 0.602660336312918, 0.6128094009403374, 0.602660336312918, 0.6128094009403374],
          "label_shift": [0.003375592508434266, -0.0031805683642138712, 0.012625311974978784, -0.0031805683642138712, 0.012625311974978784],
          "latent_covariate_shift": [-0.46115651870477525, 0.6497068984393063, 0.6393610117126749, 0.6497068984393063, 0.6393610117126749],
          "concept_shift": [-0.46194060946899496, 0.007644168931590054, 0.009250977908297138, 0.007644168931590054, 0.009250977908297138],
          "residual": [-0.4619406094689947, 0.06058081790038836, 0.0634234765196076, 0.06058081790038836, 0.0634234765196076],
          "overall": [0.232745572072252, 0.009528824666562304, 0.02504307333775005, 0.009528824666562304, 0.02504307333775005]
        },
        "test_shifts": {
          "informativeness": [-0.2652154383500879, 0.05973237562282615, 0.06329749302068381, 0.05973237562282615, 0.06329749302068381],
          "invariance": [-0.2652154383500879, 0.00010820212806625991, 0.001671121755696599, 0.00010820212806625991, 0.001671121755696599],
          "label_shift": [-0.006770410690669257, -0.0002060885658113468, 0.002463625364271657, -0.0002060885658113468, 0.002463625364271657],
          "latent_covariate_shift": [-0.26519139343274006, 0.0, -2.40449173489476e-05, 0.0, -2.40449173489476e-05],
          "concept_shift": [-0.26519139343273923, 1.6017132519074588e-16, -2.40449173478264e-05, 1.6017132519074588e-16, -2.40449173478264e-05],
          "residual": [-0.26519139343273895, 0.05973826664366071, 0.06340933726029968, 0.05973826664366071, 0.06340933726029968],
          "overall": [0.12919846891235998, -0.00016303636777344893, 0.00028440756467110195, -0.00016303636777344893, 0.00028440756467110195]
        }
      }
    },
    "acsfoodstamps": {
      "causal": {
        "metrics": {
          "id_test": [0.8091010835834562, 0.8091010835834562, 0.6951467670549931, 0.8091010835834562, 0.6951467670549931],
          "ood_test": [0.7801260280698883, 0.7801260280698883, 0.7017267482302877, 0.7801260280698883, 0.7017267482302877]
        },
        "train_shifts": {
          "informativeness": [0.05732887540601271, 0.050276062348176866, 0.06883879866172397, 0.050276062348176866, 0.06883879866172397],
          "invariance": [1.6781201158594878, 1.8639149009114988, 2.4556711590083413, 1.8639149009114988, 2.4556711590083413],
          "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.001190637798646246, 0.005422396634699895, 0.001190637798646246],
          "latent_covariate_shift": [1.8007867615717126, 1.877841022681453, 2.519716471057496, 1.877841022681453, 2.519716471057496],
          "concept_shift": [0.08983085806457751, 0.0848035179529891, 0.10348171557771527, 0.0848035179529891, 0.10348171557771527],
          "residual": [0.06743711036933829, 0.04708262726551119, 0.06712328871096565, 0.04708262726551119, 0.06712328871096565],
          "overall": [0.0034066276253277156, -0.029534064691501903, -0.017407372914198846, -0.029534064691501903, -0.017407372914198846]
        },
        "test_shifts": {
          "informativeness": [0.07727173787441585, 0.07378275338019707, 0.08255162345880881, 0.07378275338019707, 0.08255162345880881],
          "invariance": [-0.00010805314682271558, 0.021219087360934134, 0.0002839701225443713, 0.021219087360934134, 0.0002839701225443713],
          "label_shift": [-0.0015958378682764684, 0.010002292596673068, 0.011090974624432072, 0.010002292596673068, 0.011090974624432072],
          "latent_covariate_shift": [7.274127973615755e-05, 0.0002341986584484944, 0.00036263691248764453, 0.0002341986584484944, 0.00036263691248764453],
          "concept_shift": [0.13145098439406064, 0.11708029250582784, 0.1140340964613749, 0.11708029250582784, 0.1140340964613749],
          "residual": [0.07692034380242023, 0.07187896215962583, 0.0732074247287731, 0.07187896215962583, 0.0732074247287731],
          "overall": [-0.06608161984589349, -0.06212765308524897, -0.042088028793464065, -0.06212765308524897, -0.042088028793464065]
        }
      },
      "arguablycausal": {
        "metrics": {
          "id_test": [0.6111181767309355, 0.8091010835834562, 0.8091010835834562, 0.8091010835834562, 0.8091010835834562],
          "ood_test": [0.5340439461516429, 0.7801260280698883, 0.7801260280698883, 0.7801260280698883, 0.7801260280698883]
        },
        "train_shifts": {
          "informativeness": [0.10065412446304692, 0.03371058911706126, 0.1081019168851599, 0.03371058911706126, 0.1081019168851599],
          "invariance": [0.701087573916279, 0.27888678691138813, 1.6021787146787332, 0.27888678691138813, 1.6021787146787332],
          "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.001190637798646246, 0.005422396634699895, 0.001190637798646246],
          "latent_covariate_shift": [0.724533541799033, 0.27881492098207394, 1.6384306205999497, 0.27881492098207394, 1.6384306205999497],
          "concept_shift": [-0.008297580610515347, 0.00031012558694969806, -0.007794337827341806, 0.00031012558694969806, -0.007794337827341806],
          "residual": [0.06542748472048526, 0.0036441821017543802, 0.10142310899222817, 0.0036441821017543802, 0.10142310899222817],
          "overall": [0.04819538275402603, 0.032586609574524895, 0.029297248666533965, 0.032586609574524895, 0.029297248666533965]
        },
        "test_shifts": {
          "informativeness": [0.11452408312644688, 0.032828443915379174, 0.1507484783886109, 0.032828443915379174, 0.1507484783886109],
          "invariance": [0.003390333346089972, 0.03336232282055881, 0.013453131256288824, 0.03336232282055881, 0.013453131256288824],
          "label_shift": [-0.0015958378682764684, 0.010002292596673068, 0.011090974624432072, 0.010002292596673068, 0.011090974624432072],
          "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
          "concept_shift": [0.0025607836975778684, 0.0029935922098451506, 0.003570670226200352, 0.0029935922098451506, 0.003570670226200352],
          "residual": [0.08790034583243295, 0.03201362657558727, 0.15111706355095797, 0.03201362657558727, 0.15111706355095797],
          "overall": [0.022850259838041773, -0.01236199387707354, -0.003334998591375593, -0.01236199387707354, -0.003334998591375593]
        }
      },
      "all": {
        "metrics": {
          "id_test": [0.5585542046090451, 0.7571730172457649, 0.8091010835834562, 0.7571730172457649, 0.8091010835834562],
          "ood_test": [0.531220590040509, 0.726850525798928, 0.7801260280698883, 0.726850525798928, 0.7801260280698883]
        },
        "train_shifts": {
          "informativeness": [0.1723731121869125, 0.04265987099684749, 0.11565962085710584, 0.04265987099684749, 0.11565962085710584],
          "invariance": [0.8143854928666312, 0.2824245031894009, 1.3750120403565513, 0.2824245031894009, 1.3750120403565513],
          "label_shift": [-0.0058060624703405814, 0.005422396634699895, 0.001190637798646246, 0.005422396634699895, 0.001190637798646246],
          "latent_covariate_shift": [0.8156029210387113, 0.28379632692876455, 1.3827082403360735, 0.28379632692876455, 1.3827082403360735],
          "concept_shift": [0.0002324422251369921, 0.0002969547292499887, -0.00412979087478136, 0.0002969547292499887, -0.00412979087478136],
          "residual": [0.12353716932668146, 0.0008521011770960732, 0.11441005757624045, 0.0008521011770960732, 0.11441005757624045],
          "overall": [0.04642540459853231, 0.045056402642158204, 0.007757877607340188, 0.045056402642158204, 0.007757877607340188]
        },
        "test_shifts": {
          "informativeness": [0.1552877718073536, 0.020235373929582547, 0.17211991746967345, 0.020235373929582547, 0.17211991746967345],
          "invariance": [0.006095386547756881, 0.019151776667802323, 0.02189289724549009, 0.019151776667802323, 0.02189289724549009],
          "label_shift": [-0.0015958378682764684, 0.010002292596673068, 0.011090974624432072, 0.010002292596673068, 0.011090974624432072],
          "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
          "concept_shift": [0.002019773057244807, 0.0013705602888448448, 0.002452581569511448, 0.0013705602888448448, 0.002452581569511448],
          "residual": [0.12465327121361029, 0.019010548894220262, 0.17277161105488661, 0.019010548894220262, 0.17277161105488661],
          "overall": [0.025779001857104203, -0.004035197144624764, -0.007278945680497889, -0.004035197144624764, -0.007278945680497889]
        }
      }
    },
    "brfss_diabetes": {
      "causal": {
        "metrics": {
          "id_test": [0.12664605173844182, 0.12664605173844182, 0.12664605173844182, 0.12664605173844182, 0.12664605173844182],
          "ood_test": [0.17431016125101023, 0.17431016125101023, 0.17431016125101023, 0.17431016125101023, 0.17431016125101023]
        },
        "train_shifts": {
          "informativeness": [0.02354657067396884, 0.022367769406653804, 0.07169175808095796, 0.022367769406653804, 0.07169175808095796],
          "invariance": [0.012196486929886313, 0.0040971731411587695, 0.04954660207449435, 0.0040971731411587695, 0.04954660207449435],
          "label_shift": [0.017554929267790703, 0.001478059644822891, 0.00657745033322343, 0.001478059644822891, 0.00657745033322343],
          "latent_covariate_shift": [0.011276027368508839, 0.004958570337723529, 0.051895569533422344, 0.004958570337723529, 0.051895569533422344],
          "concept_shift": [0.033605629811160914, 0.02887036744938839, 0.034130754230371874, 0.02887036744938839, 0.034130754230371874],
          "residual": [0.03216389081809633, 0.02394375440947617, 0.07034143901182324, 0.02394375440947617, 0.07034143901182324],
          "overall": [-0.017102900196501333, -0.014841440306822731, -0.011251849149975512, -0.014841440306822731, -0.011251849149975512]
        },
        "test_shifts": {
          "informativeness": [0.039143785658839976, 0.03255283946227202, 0.06147007106061617, 0.03255283946227202, 0.06147007106061617],
          "invariance": [0.14951427863986042, 0.15583693290959025, 0.17502842233166105, 0.15583693290959025, 0.17502842233166105],
          "label_shift": [0.010747443489363856, 0.01593201273239112, 0.010718407245671586, 0.01593201273239112, 0.010718407245671586],
          "latent_covariate_shift": [0.1446519961730612, 0.15764776562170915, 0.17819478356361576, 0.15764776562170915, 0.17819478356361576],
          "concept_shift": [0.12685483259389213, 0.12212709709483932, 0.11024334808785942, 0.12212709709483932, 0.11024334808785942],
          "residual": [0.045824190938921684, 0.03590073759163419, 0.07225631295131182, 0.03590073759163419, 0.07225631295131182],
          "overall": [-0.06716524106574545, -0.05554002395452682, -0.05896553169581221, -0.05554002395452682, -0.05896553169581221]
        }
      },
      "arguablycausal": {
        "metrics": {
          "id_test": [0.8727734948908001, 0.8727734948908001, 0.12722650510919986, 0.8727734948908001, 0.12722650510919986],
          "ood_test": [0.8258053731343283, 0.8258053731343283, 0.17419462686567164, 0.8258053731343283, 0.17419462686567164]
        },
        "train_shifts": {
          "informativeness": [0.08224894938551885, 0.01764419016055629, 0.06008873435999195, 0.01764419016055629, 0.06008873435999195],
          "invariance": [0.0017673014250898266, 1.1211992763352213e-15, 1.1211992763352213e-15, 1.1211992763352213e-15, 1.1211992763352213e-15],
          "label_shift": [0.004410807874824522, 0.012883342436454523, -0.00045482261578850945, 0.012883342436454523, -0.00045482261578850945],
          "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
          "concept_shift": [0.0007934822724894832, 0.0018394361771341067, 0.00032460638420038143, 0.0018394361771341067, 0.00032460638420038143],
          "residual": [0.0821324870508175, 0.01757542579986298, 0.06010676804800366, 0.01757542579986298, 0.06010676804800366],
          "overall": [0.0010414744233239737, 0.005590717490352958, -0.00040774818800672075, 0.005590717490352958, -0.00040774818800672075]
        },
        "test_shifts": {
          "informativeness": [0.0898286775516017, 0.006099043088104391, 0.058157076603544106, 0.006099043088104391, 0.058157076603544106],
          "invariance": [0.16475931940695682, 0.0478643312308402, 0.08868670464052147, 0.0478643312308402, 0.08868670464052147],
          "label_shift": [0.007387840843629615, 0.024372851224442018, 0.01524371127334314, 0.024372851224442018, 0.01524371127334314],
          "latent_covariate_shift": [0.17518670761619357, 0.05352893637706086, 0.0915256490372874, 0.05352893637706086, 0.0915256490372874],
          "concept_shift": [-0.0015362667178287245, 0.0023248635494135575, 0.004830498729457658, 0.0023248635494135575, 0.004830498729457658],
          "residual": [0.09661096626640425, 0.013053111104004575, 0.06424880690364047, 0.013053111104004575, 0.06424880690364047],
          "overall": [0.002893459170544996, 0.006902228394724378, 0.0005343481702293346, 0.006902228394724378, 0.0005343481702293346]
        }
      },
      "all": {
        "metrics": {
          "id_test": [0.12722650510919986, 0.5098964953695296, 0.5581408785512654, 0.5098964953695296, 0.5581408785512654],
          "ood_test": [0.17419462686567164, 0.5282722388059702, 0.5840429850746268, 0.5282722388059702, 0.5840429850746268]
        },
        "train_shifts": {
          "informativeness": [0.000942072697340449, 0.11283029686393628, 0.11102615601016383, 0.11283029686393628, 0.11102615601016383],
          "invariance": [-0.0015018360640900908, 0.0038712316930535474, 0.0003606737602225215, 0.0038712316930535474, 0.0003606737602225215],
          "label_shift": [0.004410807874824522, 0.012883342436454523, -0.009360219372641473, 0.012883342436454523, -0.009360219372641473],
          "latent_covariate_shift": [0.0004947900184779186, -2.40449173489476e-05, 0.0, -2.40449173489476e-05, 0.0],
          "concept_shift": [0.029478215497132292, 0.00015629196276383477, 4.805139755722377e-16, 0.00015629196276383477, 4.805139755722377e-16],
          "residual": [0.002952841064648804, 0.03626650823325748, 0.037073910179898924, 0.03626650823325748, 0.037073910179898924],
          "overall": [-0.013546159137178236, 0.08097967556232291, 0.06909179926383266, 0.08097967556232291, 0.06909179926383266]
        },
        "test_shifts": {
          "informativeness": [0.008609881310117421, 0.13947258225894016, 0.13583491211854937, 0.13947258225894016, 0.13583491211854937],
          "invariance": [0.008604334496450972, 0.22604244551710817, 0.08566860472704088, 0.22604244551710817, 0.08566860472704088],
          "label_shift": [0.007387840843629615, -0.000524659736159124, 0.005067784101228259, -0.000524659736159124, 0.005067784101228259],
          "latent_covariate_shift": [-0.006556722226224264, 0.23061154192062902, 0.09068405718751302, 0.23061154192062902, 0.09068405718751302],
          "concept_shift": [0.013328886364832879, 0.0007443443753332662, 0.002386104089147606, 0.0007443443753332662, 0.002386104089147606],
          "residual": [0.0023932871145931063, 0.045781254784853204, 0.038281228338136686, 0.045781254784853204, 0.038281228338136686],
          "overall": [-0.0043344569264149365, 0.09534137362010117, 0.10140225001668907, 0.09534137362010117, 0.10140225001668907]
        }
      }
    },
    "acsincome": {
      "causal": {
        "metrics": {
          "id_test": [0.6791780579181855, 0.6791780579181855, 0.658635834345889, 0.6791780579181855, 0.658635834345889],
          "ood_test": [0.6020339608225422, 0.6020339608225422, 0.6082912884825651, 0.6020339608225422, 0.6082912884825651]
        },
        "train_shifts": {
          "informativeness": [0.12500385740003178, 0.12561945244546843, 0.12123362309296784, 0.12561945244546843, 0.12123362309296784],
          "invariance": [1.3038020785666047, 1.3296067303311159, 1.329068953986324, 1.3296067303311159, 1.329068953986324],
          "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.008082415533674643, 0.014770968001511706],
          "latent_covariate_shift": [1.304108738702556, 1.3307038806109013, 1.3253996131263508, 1.3307038806109013, 1.3253996131263508],
          "concept_shift": [0.17816080285524416, 0.16478564617601132, 0.1927434377098879, 0.16478564617601132, 0.1927434377098879],
          "residual": [0.1249635995972246, 0.12389763107466752, 0.12752306441313804, 0.12389763107466752, 0.12752306441313804],
          "overall": [-0.0812801110897683, -0.07608121881047465, -0.09711034660434492, -0.07608121881047465, -0.09711034660434492]
        },
        "test_shifts": {
          "informativeness": [0.15820211027877856, 0.1454573984638979, 0.1529027417128521, 0.1454573984638979, 0.1529027417128521],
          "invariance": [-8.707364635417043e-05, 0.0017556553548063376, 0.0004614030633047049, 0.0017556553548063376, 0.0004614030633047049],
          "label_shift": [0.003482233702930959, 0.020133433797550723, -0.00486302279645367, 0.020133433797550723, -0.00486302279645367],
          "latent_covariate_shift": [-0.0001397787235796288, 0.0015907503189019022, 0.0005518212315750971, 0.0015907503189019022, 0.0005518212315750971],
          "concept_shift": [0.09750434993536301, 0.09071897507161308, 0.09419391288946513, 0.09071897507161308, 0.09419391288946513],
          "residual": [0.15838466277363522, 0.1500128985464705, 0.14958546000405912, 0.1500128985464705, 0.14958546000405912],
          "overall": [-0.04721996314968541, -0.039930723237556004, -0.04616597705003124, -0.039930723237556004, -0.04616597705003124]
        }
      },
      "arguablycausal": {
        "metrics": {
          "id_test": [0.5708915552855407, 0.6791780579181855, 0.6774693701903605, 0.6791780579181855, 0.6774693701903605],
          "ood_test": [0.6186059991305608, 0.6020339608225422, 0.6207664238384424, 0.6020339608225422, 0.6207664238384424]
        },
        "train_shifts": {
          "informativeness": [0.27110541193703036, 0.11958914811544608, 0.2916846229837679, 0.11958914811544608, 0.2916846229837679],
          "invariance": [1.364327723668212, 0.7683681028132827, 2.090059048025014, 0.7683681028132827, 2.090059048025014],
          "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.008082415533674643, 0.014770968001511706],
          "latent_covariate_shift": [1.4370490461854457, 0.7900244198962948, 2.1374629655797497, 0.7900244198962948, 2.1374629655797497],
          "concept_shift": [-0.005170456404964975, 0.002805216185491728, -0.003929925107246675, 0.002805216185491728, -0.003929925107246675],
          "residual": [0.2760274256450834, 0.10383543257203348, 0.29584029176965165, 0.10383543257203348, 0.29584029176965165],
          "overall": [0.041630578220117176, 0.029220473759010074, 0.028896736545863444, 0.029220473759010074, 0.028896736545863444]
        },
        "test_shifts": {
          "informativeness": [0.3689829985567462, 0.18614718364572866, 0.39657137379915847, 0.18614718364572866, 0.39657137379915847],
          "invariance": [0.0006899773148386143, 0.02017368565509672, 0.006244275564072994, 0.02017368565509672, 0.006244275564072994],
          "label_shift": [0.003482233702930959, 0.020133433797550723, -0.00486302279645367, 0.020133433797550723, -0.00486302279645367],
          "latent_covariate_shift": [5.773702524787593e-06, -2.2186186871482004e-05, 9.475786904363412e-07, -2.2186186871482004e-05, 9.475786904363412e-07],
          "concept_shift": [0.0171572507737726, 0.015566679491192188, 0.01416846754739791, 0.015566679491192188, 0.01416846754739791],
          "residual": [0.3554011423443423, 0.1858311132524078, 0.39314558082360085, 0.1858311132524078, 0.39314558082360085],
          "overall": [0.006402245870826162, -0.007498488374483969, -0.009211616189059468, -0.007498488374483969, -0.009211616189059468]
        }
      },
      "all": {
        "metrics": {
          "id_test": [0.42864646618063995, 0.627354191980559, 0.6791780579181855, 0.627354191980559, 0.6791780579181855],
          "ood_test": [0.47758559365572845, 0.6199101579481234, 0.6020339608225422, 0.6199101579481234, 0.6020339608225422]
        },
        "train_shifts": {
          "informativeness": [0.2958793972547656, 0.061310342148671364, 0.21987994190022486, 0.061310342148671364, 0.21987994190022486],
          "invariance": [1.2212127791469642, 0.4465126000453322, 1.6820653190968748, 0.4465126000453322, 1.6820653190968748],
          "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.008082415533674643, 0.014770968001511706],
          "latent_covariate_shift": [1.2751721775151483, 0.44721814163527185, 1.7168400321565553, 0.44721814163527185, 1.7168400321565553],
          "concept_shift": [0.000984952328216191, -0.0006768882587575906, -0.0035823203783161605, -0.0006768882587575906, -0.0035823203783161605],
          "residual": [0.2781202101990372, 0.06577765047595019, 0.23618064175760686, 0.06577765047595019, 0.23618064175760686],
          "overall": [0.0518531125427833, 0.0002651143639071235, 0.010263300862372232, 0.0002651143639071235, 0.010263300862372232]
        },
        "test_shifts": {
          "informativeness": [0.3790472062658341, 0.1323368089470532, 0.3610685658173993, 0.1323368089470532, 0.3610685658173993],
          "invariance": [0.0032821312180222706, 0.035562432757913195, 0.016015305051173215, 0.035562432757913195, 0.016015305051173215],
          "label_shift": [0.003482233702930959, 0.020133433797550723, -0.00486302279645367, 0.020133433797550723, -0.00486302279645367],
          "latent_covariate_shift": [2.633591064131417e-06, 1.4391203746147608e-06, 9.475786904363412e-07, 1.4391203746147608e-06, 9.475786904363412e-07],
          "concept_shift": [0.010820212806667796, 0.009242866228628794, 0.008223361733067949, 0.009242866228628794, 0.008223361733067949],
          "residual": [0.3594496414376615, 0.1286975002100983, 0.3609127022570839, 0.1286975002100983, 0.3609127022570839],
          "overall": [0.014288826462825144, -0.00869590429735341, -0.014394507440686766, -0.00869590429735341, -0.014394507440686766]
        }
      }
    },
    "acsunemployment": {
      "causal": {
        "metrics": {
          "id_test": [0.9653394478356521, 0.9194249062683977, 0.6644129767917454, 0.9194249062683977, 0.6644129767917454],
          "ood_test": [0.9470817976786402, 0.9071517196276534, 0.7523027180324061, 0.9071517196276534, 0.7523027180324061]
        },
        "train_shifts": {
          "informativeness": [0.01714001685009849, 0.037713695022730066, 0.013068826972631977, 0.037713695022730066, 0.013068826972631977],
          "invariance": [0.14957878447704895, 0.17229539605979968, 0.16496559607077887, 0.17229539605979968, 0.16496559607077887],
          "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.0007035110240214094, 0.007083499996848578],
          "latent_covariate_shift": [0.14352149527321403, 0.1600782637027731, 0.1587627833033177, 0.1600782637027731, 0.1587627833033177],
          "concept_shift": [0.13002531644270512, 0.12216229254056127, 0.12366711144168625, 0.12216229254056127, 0.12366711144168625],
          "residual": [0.006673157448798285, 0.004493769314627629, 0.006118396941673351, 0.004493769314627629, 0.006118396941673351],
          "overall": [-0.05383550446532778, -0.03361803122868079, -0.0544427820751908, -0.03361803122868079, -0.0544427820751908]
        },
        "test_shifts": {
          "informativeness": [0.025069298918221957, 0.05315613879407997, 0.023483156954193767, 0.05315613879407997, 0.023483156954193767],
          "invariance": [0.3066970487898585, 0.3176209635469152, 0.32393831686521446, 0.3176209635469152, 0.32393831686521446],
          "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.003640261983926621, 0.008484502040884608, 0.003640261983926621],
          "latent_covariate_shift": [0.3059235319232671, 0.2978882244222823, 0.31926452433286107, 0.2978882244222823, 0.31926452433286107],
          "concept_shift": [0.11611848743314968, 0.10661458024120518, 0.11659422483496208, 0.10661458024120518, 0.11659422483496208],
          "residual": [0.014333990122148001, 0.01398244049722256, 0.01460243973230221, 0.01398244049722256, 0.01460243973230221],
          "overall": [-0.05340607330817951, -0.019757710365619345, -0.04993316046980287, -0.019757710365619345, -0.04993316046980287]
        }
      },
      "arguablycausal": {
        "metrics": {
          "id_test": [0.9400675487249404, 0.966176060483996, 0.6978093142874849, 0.966176060483996, 0.6978093142874849],
          "ood_test": [0.9439096393274291, 0.9484875711290806, 0.6628771904089579, 0.9484875711290806, 0.6628771904089579]
        },
        "train_shifts": {
          "informativeness": [0.03265488120196461, 0.07480241340821882, 0.11983221842024154, 0.07480241340821882, 0.11983221842024154],
          "invariance": [0.24986762026949993, 0.22655490114612015, 0.3742158489653212, 0.22655490114612015, 0.3742158489653212],
          "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.0007035110240214094, 0.007083499996848578],
          "latent_covariate_shift": [0.24386430478187718, 0.2151734612629179, 0.3499292673906292, 0.2151734612629179, 0.3499292673906292],
          "concept_shift": [0.0065254377221020425, 0.003731295253774717, 0.004605365980239403, 0.003731295253774717, 0.004605365980239403],
          "residual": [0.018028623272397182, 0.0013903885870546718, 0.021788147452812864, 0.0013903885870546718, 0.021788147452812864],
          "overall": [0.012100820281347069, 0.06620741276468636, 0.08713984718838727, 0.06620741276468636, 0.08713984718838727]
        },
        "test_shifts": {
          "informativeness": [0.07647361500102687, 0.07255125394236314, 0.12197771371884751, 0.07255125394236314, 0.12197771371884751],
          "invariance": [0.29060457054633915, 0.2590871516051648, 0.35670045984395055, 0.2590871516051648, 0.35670045984395055],
          "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.003640261983926621, 0.008484502040884608, 0.003640261983926621],
          "latent_covariate_shift": [0.2836909878678193, 0.24811825105716012, 0.3288594539336704, 0.24811825105716012, 0.3288594539336704],
          "concept_shift": [0.024492474682711842, 0.02031644681368458, 0.01962015162226058, 0.02031644681368458, 0.01962015162226058],
          "residual": [0.05084715224538667, 0.007888006195677791, 0.03233076757410429, 0.007888006195677791, 0.03233076757410429],
          "overall": [0.0042280541206414154, 0.053262825086283015, 0.06773649837043616, 0.053262825086283015, 0.06773649837043616]
        }
      },
      "all": {
        "metrics": {
          "id_test": [0.9659405695163139, 0.966176060483996, 0.9610324419793635, 0.966176060483996, 0.9610324419793635],
          "ood_test": [0.9484814590706004, 0.9484875711290806, 0.9429683823214821, 0.9484875711290806, 0.9429683823214821]
        },
        "train_shifts": {
          "informativeness": [0.1132707824731602, 0.027432696817748972, 0.05487263802309532, 0.027432696817748972, 0.05487263802309532],
          "invariance": [0.29413763589366293, 0.19565820318866953, 0.30675011127252955, 0.19565820318866953, 0.30675011127252955],
          "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.0007035110240214094, 0.007083499996848578],
          "latent_covariate_shift": [0.2874026797431802, 0.19664241788185866, 0.3091248499334819, 0.19664241788185866, 0.3091248499334819],
          "concept_shift": [0.0032021789322119742, 0.001143904714802591, 0.0007886732890188608, 0.001143904714802591, 0.0007886732890188608],
          "residual": [0.09603254459992448, 0.0038378624563284833, 0.012576580527545707, 0.0038378624563284833, 0.012576580527545707],
          "overall": [0.0160086092885304, 0.023866744862624464, 0.04663084017994064, 0.023866744862624464, 0.04663084017994064]
        },
        "test_shifts": {
          "informativeness": [0.19446389048911247, 0.040357854190449086, 0.054469176256161496, 0.040357854190449086, 0.054469176256161496],
          "invariance": [0.2878756694262006, 0.2488889537049776, 0.3086514231468793, 0.2488889537049776, 0.3086514231468793],
          "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.003640261983926621, 0.008484502040884608, 0.003640261983926621],
          "latent_covariate_shift": [0.28260513325047026, 0.24774605686852805, 0.307206719197589, 0.24774605686852805, 0.307206719197589],
          "concept_shift": [0.018395707272851232, 0.012985272452791342, 0.013086016893206098, 0.012985272452791342, 0.013086016893206098],
          "residual": [0.16774712098126854, 0.0047852517406643934, 0.013604420256200253, 0.0047852517406643934, 0.013604420256200253],
          "overall": [0.009188267829170205, 0.03275076882560655, 0.03541952657067634, 0.03275076882560655, 0.03541952657067634]
        }
      }
    },
      "assistments": {
        "causal": {
          "metrics": {
            "id_test": [
              0.3047125289796898,
              0.46022748587591816,
              0.30466751198577463,
              0.46022748587591816,
              0.30466751198577463
            ],
            "ood_test": [
              0.5634837355718783,
              0.46432318992654775,
              0.5634837355718783,
              0.46432318992654775,
              0.5634837355718783
            ]
          },
          "train_shifts": {
            "informativeness": [
              0.3477475549710781,
              0.2739737555535773,
              0.3149098038667958,
              0.2739737555535773,
              0.3149098038667958
            ],
            "invariance": [
              1.9144494688580846,
              1.9720525874713033,
              1.8911568957776015,
              1.9720525874713033,
              1.8911568957776015
            ],
            "label_shift": [
              0.02660028896165906,
              0.008994641022265475,
              0.008013446810794996,
              0.008994641022265475,
              0.008013446810794996
            ],
            "latent_covariate_shift": [
              2.0045857476678646,
              1.9774349630672277,
              1.986014993779788,
              1.9774349630672277,
              1.986014993779788
            ],
            "concept_shift": [
              0.16181195720700559,
              0.17412268972031658,
              0.1423357729565479,
              0.17412268972031658,
              0.1423357729565479
            ],
            "residual": [
              0.5761952005315738,
              0.5238034017468945,
              0.5591630664196235,
              0.5238034017468945,
              0.5591630664196235
            ],
            "overall": [
              -0.250985340278279,
              -0.32970248274438063,
              -0.2639853766246109,
              -0.32970248274438063,
              -0.2639853766246109
            ]
          },
          "test_shifts": {
            "informativeness": [
              0.21781217405978429,
              0.18624227464361254,
              0.20282546245345226,
              0.18624227464361254,
              0.20282546245345226
            ],
            "invariance": [
              1.9987402241026107,
              2.046647290101274,
              1.9878062143463457,
              2.046647290101274,
              1.9878062143463457
            ],
            "label_shift": [
              0.02329921323212632,
              0.03554938134553872,
              0.06326781654055122,
              0.03554938134553872,
              0.06326781654055122
            ],
            "latent_covariate_shift": [
              2.0771206869481396,
              2.084118720400334,
              2.086779496560173,
              2.084118720400334,
              2.086779496560173
            ],
            "concept_shift": [
              -0.0028710877608915455,
              0.038960356180363025,
              -0.003582677533538154,
              0.038960356180363025,
              -0.003582677533538154
            ],
            "residual": [
              0.24058438232172763,
              0.24521265351425556,
              0.24366774759139717,
              0.24521265351425556,
              0.24366774759139717
            ],
            "overall": [
              0.029503173657330017,
              -0.04194015113852517,
              0.042069603006013284,
              -0.04194015113852517,
              0.042069603006013284
            ]
          }
        },
        "arguablycausal": {
          "metrics": {
            "id_test": [
              0.30509142201180944,
              0.3058979764861235,
              0.29472250774667436,
              0.3058979764861235,
              0.29472250774667436
            ],
            "ood_test": [
              0.5634837355718783,
              0.5640083945435467,
              0.5634837355718783,
              0.5640083945435467,
              0.5634837355718783
            ]
          },
          "train_shifts": {
            "informativeness": [
              0.15662804093638533,
              0.2289817506680302,
              0.20355589299611926,
              0.2289817506680302,
              0.20355589299611926
            ],
            "invariance": [
              1.2675231192461105,
              1.375209296826757,
              1.4210914832000885,
              1.375209296826757,
              1.4210914832000885
            ],
            "label_shift": [
              0.02660028896165906,
              0.024927097951032234,
              0.006967999709964291,
              0.024927097951032234,
              0.006967999709964291
            ],
            "latent_covariate_shift": [
              1.25412656822083,
              1.3748992854921058,
              1.4029616976026564,
              1.3748992854921058,
              1.4029616976026564
            ],
            "concept_shift": [
              0.08074731032449696,
              0.07807860859632762,
              0.07896226522662711,
              0.07807860859632762,
              0.07896226522662711
            ],
            "residual": [
              0.3117439011082059,
              0.4655417894996592,
              0.4169234221074725,
              0.4655417894996592,
              0.4169234221074725
            ],
            "overall": [
              -0.1888876463658797,
              -0.26329079982160236,
              -0.25842955466840073,
              -0.26329079982160236,
              -0.25842955466840073
            ]
          },
          "test_shifts": {
            "informativeness": [
              0.24751267693904722,
              0.2872978449612156,
              0.25706239217561927,
              0.2872978449612156,
              0.25706239217561927
            ],
            "invariance": [
              1.9795946941566949,
              1.9350682199363367,
              1.9597128102329002,
              1.9350682199363367,
              1.9597128102329002
            ],
            "label_shift": [
              0.05048711684579724,
              0.0839318025912957,
              0.0331774435527358,
              0.0839318025912957,
              0.0331774435527358
            ],
            "latent_covariate_shift": [
              1.9793231601033827,
              1.9978593053437341,
              2.007259335804655,
              1.9978593053437341,
              2.007259335804655
            ],
            "concept_shift": [
              0.09807045308453846,
              0.15003910647215613,
              0.1308626356734855,
              0.15003910647215613,
              0.1308626356734855
            ],
            "residual": [
              0.2939593625403367,
              0.3335722066489113,
              0.3386980269132226,
              0.3335722066489113,
              0.3386980269132226
            ],
            "overall": [
              -0.0703741207473162,
              -0.04793247092442726,
              -0.10670496801210064,
              -0.04793247092442726,
              -0.10670496801210064
            ]
          }
        },
        "all": {
          "metrics": {
            "id_test": [
              0.3047125289796898,
              0.3047125289796898,
              0.3047125289796898,
              0.3047125289796898,
              0.3047125289796898
            ],
            "ood_test": [
              0.5634837355718783,
              0.5634837355718783,
              0.5634837355718783,
              0.5634837355718783,
              0.5634837355718783
            ]
          },
          "train_shifts": {
            "informativeness": [
              0.20298482702156553,
              0.09777179421574336,
              0.20193023228963042,
              0.09777179421574336,
              0.20193023228963042
            ],
            "invariance": [
              1.3460694000212008,
              0.871746913595717,
              1.046746350599576,
              0.871746913595717,
              1.046746350599576
            ],
            "label_shift": [
              0.02660028896165906,
              0.024927097951032234,
              0.013114977580103217,
              0.024927097951032234,
              0.013114977580103217
            ],
            "latent_covariate_shift": [
              1.3313711595788307,
              0.8690918028401441,
              0.9934335515860903,
              0.8690918028401441,
              0.9934335515860903
            ],
            "concept_shift": [
              0.0012617581823473995,
              -0.018506962449172593,
              0.005522342059034534,
              -0.018506962449172593,
              0.005522342059034534
            ],
            "residual": [
              0.4140790489433416,
              0.1822935310822091,
              0.3689160150955572,
              0.1822935310822091,
              0.3689160150955572
            ],
            "overall": [
              -0.20577407675330528,
              -0.06413226204414982,
              -0.18984586455213528,
              -0.06413226204414982,
              -0.18984586455213528
            ]
          },
          "test_shifts": {
            "informativeness": [
              0.2651928812802467,
              0.18517303416424816,
              0.25588443114332854,
              0.18517303416424816,
              0.25588443114332854
            ],
            "invariance": [
              1.9603554465139543,
              1.8813088296584357,
              1.8578006603489827,
              1.8813088296584357,
              1.8578006603489827
            ],
            "label_shift": [
              0.05048711684579724,
              0.04979416579420589,
              0.019753473660892567,
              0.04979416579420589,
              0.019753473660892567
            ],
            "latent_covariate_shift": [
              2.010199697393739,
              1.8751833503274224,
              1.906874711861358,
              1.8751833503274224,
              1.906874711861358
            ],
            "concept_shift": [
              -0.00825898371561863,
              -0.013712919809778113,
              0.0021946614864112347,
              -0.013712919809778113,
              0.0021946614864112347
            ],
            "residual": [
              0.3185335635624641,
              0.24111504895787508,
              0.29232971614206776,
              0.24111504895787508,
              0.29232971614206776
            ],
            "overall": [
              0.0009544934383828307,
              -0.027251211657141616,
              -0.0031288531553108068,
              -0.027251211657141616,
              -0.0031288531553108068
            ]
          }
        }
      },
      "acspubcov": {
    "causal": {
      "metrics": {
        "validation": [0.6814720812182741, 0.6814720812182741, 0.6814720812182741, 0.6814720812182741, 0.6814720812182741],
        "id_test": [0.685116099035135, 0.685116099035135, 0.685116099035135, 0.685116099035135, 0.685116099035135],
        "ood_test": [0.6850482906934039, 0.6850482906934039, 0.6850482906934039, 0.6850482906934039, 0.6850482906934039],
        "ood_validation": [0.6814574179263887, 0.6814574179263887, 0.6814574179263887, 0.6814574179263887, 0.6814574179263887]
      },
      "train_shifts": {
        "informativeness": [0.3512071681633836, 0.3512071681633836, 0.3512071681633836, 0.3512071681633836, 0.3512071681633836],
        "invariance": [1.3962339375325514, 1.3962339375325514, 1.3962339375325514, 1.3962339375325514, 1.3962339375325514],
        "label_shift": [0.02836924313860048, 0.02836924313860048, 0.02836924313860048, 0.02836924313860048, 0.02836924313860048],
        "latent_covariate_shift": [1.2594095746506825, 1.2594095746506825, 1.2594095746506825, 1.2594095746506825, 1.2594095746506825],
        "concept_shift": [0.1096492649532102, 0.1096492649532102, 0.1096492649532102, 0.1096492649532102, 0.1096492649532102],
        "residual": [0.3292063208060031, 0.3292063208060031, 0.3292063208060031, 0.3292063208060031, 0.3292063208060031],
        "overall": [-0.10230158264102857, -0.10230158264102857, -0.10230158264102857, -0.10230158264102857, -0.10230158264102857]
      },
      "test_shifts": {
        "informativeness": [0.22849770843957356, 0.22849770843957356, 0.22849770843957356, 0.22849770843957356, 0.22849770843957356],
        "invariance": [1.2396706928473946, 1.2396706928473946, 1.2396706928473946, 1.2396706928473946, 1.2396706928473946],
        "label_shift": [0.030289891968151145, 0.030289891968151145, 0.030289891968151145, 0.030289891968151145, 0.030289891968151145],
        "latent_covariate_shift": [1.1589305883873098, 1.1589305883873098, 1.1589305883873098, 1.1589305883873098, 1.1589305883873098],
        "concept_shift": [0.004261634126956977, 0.004261634126956977, 0.004261634126956977, 0.004261634126956977, 0.004261634126956977],
        "residual": [0.3076551238323726, 0.3076551238323726, 0.3076551238323726, 0.3076551238323726, 0.3076551238323726],
        "overall": [0.005222213967701306, 0.005222213967701306, 0.005222213967701306, 0.005222213967701306, 0.005222213967701306]
      }
    },
    "arguablycausal": {
      "metrics": {
        "validation": [0.6802066155407075, 0.6802066155407075, 0.6802066155407075, 0.6802066155407075, 0.6802066155407075],
        "id_test": [0.6857855361594744, 0.6857855361594744, 0.6857855361594744, 0.6857855361594744, 0.6857855361594744],
        "ood_test": [0.6842794309715738, 0.6842794309715738, 0.6842794309715738, 0.6842794309715738, 0.6842794309715738],
        "ood_validation": [0.6800148992911919, 0.6800148992911919, 0.6800148992911919, 0.6800148992911919, 0.6800148992911919]
      },
      "train_shifts": {
        "informativeness": [0.2476313386971401, 0.2476313386971401, 0.2476313386971401, 0.2476313386971401, 0.2476313386971401],
        "invariance": [0.9921186242759441, 0.9921186242759441, 0.9921186242759441, 0.9921186242759441, 0.9921186242759441],
        "label_shift": [0.02836924313860048, 0.02836924313860048, 0.02836924313860048, 0.02836924313860048, 0.02836924313860048],
        "latent_covariate_shift": [0.9055705481649417, 0.9055705481649417, 0.9055705481649417, 0.9055705481649417, 0.9055705481649417],
        "concept_shift": [0.05299550626940616, 0.05299550626940616, 0.05299550626940616, 0.05299550626940616, 0.05299550626940616],
        "residual": [0.2658812252632061, 0.2658812252632061, 0.2658812252632061, 0.2658812252632061, 0.2658812252632061],
        "overall": [-0.10274902520667416, -0.10274902520667416, -0.10274902520667416, -0.10274902520667416, -0.10274902520667416]
      },
      "test_shifts": {
        "informativeness": [0.2426534080809536, 0.2426534080809536, 0.2426534080809536, 0.2426534080809536, 0.2426534080809536],
        "invariance": [1.1471576907186354, 1.1471576907186354, 1.1471576907186354, 1.1471576907186354, 1.1471576907186354],
        "label_shift": [0.030289891968151145, 0.030289891968151145, 0.030289891968151145, 0.030289891968151145, 0.030289891968151145],
        "latent_covariate_shift": [1.0596018003142504, 1.0596018003142504, 1.0596018003142504, 1.0596018003142504, 1.0596018003142504],
        "concept_shift": [0.02322402162236996, 0.02322402162236996, 0.02322402162236996, 0.02322402162236996, 0.02322402162236996],
        "residual": [0.28438726730593884, 0.28438726730593884, 0.28438726730593884, 0.28438726730593884, 0.28438726730593884],
        "overall": [-0.006696220326524621, -0.006696220326524621, -0.006696220326524621, -0.006696220326524621, -0.006696220326524621]
      }
    },
    "all": {
      "metrics": {
        "validation": [0.6793130904545156, 0.6793130904545156, 0.6793130904545156, 0.6793130904545156, 0.6793130904545156],
        "id_test": [0.6853378732804337, 0.6853378732804337, 0.6853378732804337, 0.6853378732804337, 0.6853378732804337],
        "ood_test": [0.6839750581162325, 0.6839750581162325, 0.6839750581162325, 0.6839750581162325, 0.6839750581162325],
        "ood_validation": [0.6788236994219653, 0.6788236994219653, 0.6788236994219653, 0.6788236994219653, 0.6788236994219653]
      },
      "train_shifts": {
        "informativeness": [0.20116929223691935, 0.20116929223691935, 0.20116929223691935, 0.20116929223691935, 0.20116929223691935],
        "invariance": [0.8890003433594196, 0.8890003433594196, 0.8890003433594196, 0.8890003433594196, 0.8890003433594196],
        "label_shift": [0.02836924313860048, 0.02836924313860048, 0.02836924313860048, 0.02836924313860048, 0.02836924313860048],
        "latent_covariate_shift": [0.8324892012919761, 0.8324892012919761, 0.8324892012919761, 0.8324892012919761, 0.8324892012919761],
        "concept_shift": [0.024236562206843336, 0.024236562206843336, 0.024236562206843336, 0.024236562206843336, 0.024236562206843336],
        "residual": [0.2494918656320058, 0.2494918656320058, 0.2494918656320058, 0.2494918656320058, 0.2494918656320058],
        "overall": [-0.09544966493344757, -0.09544966493344757, -0.09544966493344757, -0.09544966493344757, -0.09544966493344757]
      },
      "test_shifts": {
        "informativeness": [0.18754249445863644, 0.18754249445863644, 0.18754249445863644, 0.18754249445863644, 0.18754249445863644],
        "invariance": [0.9941899388886764, 0.9941899388886764, 0.9941899388886764, 0.9941899388886764, 0.9941899388886764],
        "label_shift": [0.030289891968151145, 0.030289891968151145, 0.030289891968151145, 0.030289891968151145, 0.030289891968151145],
        "latent_covariate_shift": [0.9197082831754094, 0.9197082831754094, 0.9197082831754094, 0.9197082831754094, 0.9197082831754094],
        "concept_shift": [0.016979150128981714, 0.016979150128981714, 0.016979150128981714, 0.016979150128981714, 0.016979150128981714],
        "residual": [0.2505122947702172, 0.2505122947702172, 0.2505122947702172, 0.2505122947702172, 0.2505122947702172],
        "overall": [-0.020427193822916447, -0.020427193822916447, -0.020427193822916447, -0.020427193822916447, -0.020427193822916447]
      }
    }
  },
  "brfss_blood_pressure": {
    "causal": {
      "metrics": {
        "validation": [0.7493734335839599, 0.7493734335839599, 0.7493734335839599, 0.7493734335839599, 0.7493734335839599],
        "id_test": [0.7503730912599221, 0.7503730912599221, 0.7503730912599221, 0.7503730912599221, 0.7503730912599221],
        "ood_test": [0.7498598537719793, 0.7498598537719793, 0.7498598537719793, 0.7498598537719793, 0.7498598537719793],
        "ood_validation": [0.7489997398753895, 0.7489997398753895, 0.7489997398753895, 0.7489997398753895, 0.7489997398753895]
      },
      "train_shifts": {
        "informativeness": [0.1641760535432209, 0.1641760535432209, 0.1641760535432209, 0.1641760535432209, 0.1641760535432209],
        "invariance": [1.3278301343781435, 1.3278301343781435, 1.3278301343781435, 1.3278301343781435, 1.3278301343781435],
        "label_shift": [0.027993229505231065, 0.027993229505231065, 0.027993229505231065, 0.027993229505231065, 0.027993229505231065],
        "latent_covariate_shift": [1.3264447184189118, 1.3264447184189118, 1.3264447184189118, 1.3264447184189118, 1.3264447184189118],
        "concept_shift": [0.09578601742809785, 0.09578601742809785, 0.09578601742809785, 0.09578601742809785, 0.09578601742809785],
        "residual": [0.4148134728981174, 0.4148134728981174, 0.4148134728981174, 0.4148134728981174, 0.4148134728981174],
        "overall": [-0.08998321849195616, -0.08998321849195616, -0.08998321849195616, -0.08998321849195616, -0.08998321849195616]
      },
      "test_shifts": {
        "informativeness": [0.1299830407898302, 0.1299830407898302, 0.1299830407898302, 0.1299830407898302, 0.1299830407898302],
        "invariance": [1.1950286450495532, 1.1950286450495532, 1.1950286450495532, 1.1950286450495532, 1.1950286450495532],
        "label_shift": [0.031100519120253824, 0.031100519120253824, 0.031100519120253824, 0.031100519120253824, 0.031100519120253824],
        "latent_covariate_shift": [1.189296277219332, 1.189296277219332, 1.189296277219332, 1.189296277219332, 1.189296277219332],
        "concept_shift": [0.0015738315888219747, 0.0015738315888219747, 0.0015738315888219747, 0.0015738315888219747, 0.0015738315888219747],
        "residual": [0.41224283299104965, 0.41224283299104965, 0.41224283299104965, 0.41224283299104965, 0.41224283299104965],
        "overall": [0.008090582723124375, 0.008090582723124375, 0.008090582723124375, 0.008090582723124375, 0.008090582723124375]
      }
    },
    "arguablycausal": {
      "metrics": {
        "validation": [0.7489242158808933, 0.7489242158808933, 0.7489242158808933, 0.7489242158808933, 0.7489242158808933],
        "id_test": [0.7503881217279026, 0.7503881217279026, 0.7503881217279026, 0.7503881217279026, 0.7503881217279026],
        "ood_test": [0.7498999147079402, 0.7498999147079402, 0.7498999147079402, 0.7498999147079402, 0.7498999147079402],
        "ood_validation": [0.7488404680820567, 0.7488404680820567, 0.7488404680820567, 0.7488404680820567, 0.7488404680820567]
      },
      "train_shifts": {
        "informativeness": [0.13550436937143624, 0.13550436937143624, 0.13550436937143624, 0.13550436937143624, 0.13550436937143624],
        "invariance": [0.956140039847465, 0.956140039847465, 0.956140039847465, 0.956140039847465, 0.956140039847465],
        "label_shift": [0.027993229505231065, 0.027993229505231065, 0.027993229505231065, 0.027993229505231065, 0.027993229505231065],
        "latent_covariate_shift": [0.9304327640875396, 0.9304327640875396, 0.9304327640875396, 0.9304327640875396, 0.9304327640875396],
        "concept_shift": [0.06539410357958615, 0.06539410357958615, 0.06539410357958615, 0.06539410357958615, 0.06539410357958615],
        "residual": [0.3497339308704121, 0.3497339308704121, 0.3497339308704121, 0.3497339308704121, 0.3497339308704121],
        "overall": [-0.0815113928288727, -0.0815113928288727, -0.0815113928288727, -0.0815113928288727, -0.0815113928288727]
      },
      "test_shifts": {
        "informativeness": [0.13609301528030463, 0.13609301528030463, 0.13609301528030463, 0.13609301528030463, 0.13609301528030463],
        "invariance": [1.0462720152146495, 1.0462720152146495, 1.0462720152146495, 1.0462720152146495, 1.0462720152146495],
        "label_shift": [0.031100519120253824, 0.031100519120253824, 0.031100519120253824, 0.031100519120253824, 0.031100519120253824],
        "latent_covariate_shift": [1.0383703281423715, 1.0383703281423715, 1.0383703281423715, 1.0383703281423715, 1.0383703281423715],
        "concept_shift": [0.012362082148670564, 0.012362082148670564, 0.012362082148670564, 0.012362082148670564, 0.012362082148670564],
        "residual": [0.3646324437759646, 0.3646324437759646, 0.3646324437759646, 0.3646324437759646, 0.3646324437759646],
        "overall": [-0.005946702145320398, -0.005946702145320398, -0.005946702145320398, -0.005946702145320398, -0.005946702145320398]
      }
    },
    "all": {
      "metrics": {
        "validation": [0.7476539677617253, 0.7476539677617253, 0.7476539677617253, 0.7476539677617253, 0.7476539677617253],
        "id_test": [0.7503722060429334, 0.7503722060429334, 0.7503722060429334, 0.7503722060429334, 0.7503722060429334],
        "ood_test": [0.7487445951271746, 0.7487445951271746, 0.7487445951271746, 0.7487445951271746, 0.7487445951271746],
        "ood_validation": [0.7480900953367972, 0.7480900953367972, 0.7480900953367972, 0.7480900953367972, 0.7480900953367972]
      },
      "train_shifts": {
        "informativeness": [0.10576064480122164, 0.10576064480122164, 0.10576064480122164, 0.10576064480122164, 0.10576064480122164],
        "invariance": [0.8370178023620557, 0.8370178023620557, 0.8370178023620557, 0.8370178023620557, 0.8370178023620557],
        "label_shift": [0.027993229505231065, 0.027993229505231065, 0.027993229505231065, 0.027993229505231065, 0.027993229505231065],
        "latent_covariate_shift": [0.8205252160272875, 0.8205252160272875, 0.8205252160272875, 0.8205252160272875, 0.8205252160272875],
        "concept_shift": [0.002216165793953676, 0.002216165793953676, 0.002216165793953676, 0.002216165793953676, 0.002216165793953676],
        "residual": [0.30393934872655286, 0.30393934872655286, 0.30393934872655286, 0.30393934872655286, 0.30393934872655286],
        "overall": [-0.0873484910512147, -0.0873484910512147, -0.0873484910512147, -0.0873484910512147, -0.0873484910512147]
      },
      "test_shifts": {
        "informativeness": [0.10411273236979987, 0.10411273236979987, 0.10411273236979987, 0.10411273236979987, 0.10411273236979987],
        "invariance": [0.9424914562038748, 0.9424914562038748, 0.9424914562038748, 0.9424914562038748, 0.9424914562038748],
        "label_shift": [0.031100519120253824, 0.031100519120253824, 0.031100519120253824, 0.031100519120253824, 0.031100519120253824],
        "latent_covariate_shift": [0.9143909369628503, 0.9143909369628503, 0.9143909369628503, 0.9143909369628503, 0.9143909369628503],
        "concept_shift": [-0.0029943851859650673, -0.0029943851859650673, -0.0029943851859650673, -0.0029943851859650673, -0.0029943851859650673],
        "residual": [0.31284682159008324, 0.31284682159008324, 0.31284682159008324, 0.31284682159008324, 0.31284682159008324],
        "overall": [-0.026152563796889986, -0.026152563796889986, -0.026152563796889986, -0.026152563796889986, -0.026152563796889986]
      }
    }
  }
    }
    