{
    "diabetes_readmission": {
      "causal": {
        "metrics": {
          "train": [0.5479047355455861, 0.4525924357539953, 0.5488108962812548, 0.4525924357539953, 0.5488108962812548],
          "validation": [0.5781614559029398, 0.4225384974335044, 0.5783947736817545, 0.4225384974335044, 0.5783947736817545],
          "id_test": [0.5838581758805692, 0.4166083508280849, 0.5850244926522044, 0.4166083508280849, 0.5850244926522044],
          "ood_validation": [0.4936440677966102, 0.506002824858757, 0.4936440677966102, 0.506002824858757, 0.4936440677966102],
          "ood_test": [0.5061607283001098, 0.49446711662219434, 0.5061999686077538, 0.49446711662219434, 0.5061999686077538]
        },
        "train_shifts": {
          "informativeness": [0.01375947357098106, 0.035491102037690216, 0.03265328316917298, 0.035491102037690216, 0.03265328316917298],
          "invariance": [0.25697157586807007, 0.32591953091199216, 0.34614762095793283, 0.32591953091199216, 0.34614762095793283],
          "label_shift": [0.003375592508434266, -0.0031805683642138712, -0.01792304390607593, -0.0031805683642138712, -0.01792304390607593],
          "latent_covariate_shift": [0.2882694048348382, 0.3550506031229789, 0.36529891301655454, 0.3550506031229789, 0.36529891301655454],
          "concept_shift": [0.20493252076789212, 0.2772927896165331, 0.2971695935932198, 0.2772927896165331, 0.2971695935932198],
          "residual": [0.01904462461654597, 0.022224518251825545, 0.031681721022627146, 0.022224518251825545, 0.031681721022627146],
          "overall": [-0.09041470069190977, -0.11240455909901544, -0.14699911057379117, -0.11240455909901544, -0.14699911057379117]
        },
        "test_shifts": {
          "informativeness": [0.015054588603336232, 0.01601138908318828, 0.010012582551369342, 0.01601138908318828, 0.010012582551369342],
          "invariance": [0.0017650721130085315, 0.0014809652572510034, 0.0006100753565161459, 0.0014809652572510034, 0.0006100753565161459],
          "label_shift": [-0.006770410690669257, -0.004868900844769146, 0.0057945710351309035, -0.004868900844769146, 0.0057945710351309035],
          "latent_covariate_shift": [0.0010384260463486353, 0.0010853686169059295, 0.0011801685080679001, 0.0010853686169059295, 0.0011801685080679001],
          "concept_shift": [0.05919420689453771, 0.052965915565410526, 0.056018780003380376, 0.052965915565410526, 0.056018780003380376],
          "residual": [0.02190662457964358, 0.026726177933536408, 0.005964249046477158, 0.026726177933536408, 0.005964249046477158],
          "overall": [-0.04019766780224078, -0.0398299953756105, -0.020778724403456676, -0.0398299953756105, -0.020778724403456676]
        }
      },
      "arguablycausal": {
        "metrics": {
          "train": [0.5479047355455861, 0.5479047355455861, 0.4520735847076334, 0.5479047355455861, 0.4520735847076334],
          "validation": [0.5781614559029398, 0.5781614559029398, 0.4218385440970602, 0.5781614559029398, 0.4218385440970602],
          "id_test": [0.5838581758805692, 0.5838581758805692, 0.41614182411943085, 0.5838581758805692, 0.41614182411943085],
          "ood_validation": [0.4936440677966102, 0.4936440677966102, 0.5063559322033898, 0.4936440677966102, 0.5063559322033898],
          "ood_test": [0.5061607283001098, 0.5061607283001098, 0.4938000313922461, 0.5061607283001098, 0.4938000313922461]
        },
        "train_shifts": {
          "informativeness": [0.07518415869311407, 0.06069208677293379, 0.054711498601276345, 0.06069208677293379, 0.054711498601276345],
          "invariance": [0.11054204095254547, 0.18685149770482265, 0.05613576846637255, 0.18685149770482265, 0.05613576846637255],
          "label_shift": [0.003375592508434266, -0.0031805683642138712, 0.03056067027352713, -0.0031805683642138712, 0.03056067027352713],
          "latent_covariate_shift": [0.09374602674260973, 0.13860522497359762, 0.05298069455385805, 0.13860522497359762, 0.05298069455385805],
          "concept_shift": [0.024938386645107755, 0.006832666789477041, 0.01652569401720646, 0.006832666789477041, 0.01652569401720646],
          "residual": [0.0593472802812215, 0.03404763592959773, 0.036613766797790354, 0.03404763592959773, 0.036613766797790354],
          "overall": [-0.0033425257614120504, -0.0024853030991219133, 0.023537682975389065, -0.0024853030991219133, 0.023537682975389065]
        },
        "test_shifts": {
          "informativeness": [0.04660420759994022, 0.04350626553399571, 0.05001421011114664, 0.04350626553399571, 0.05001421011114664],
          "invariance": [0.0009617966939257095, 0.012215436242634607, 0.0013224704541496726, 0.012215436242634607, 0.0013224704541496726],
          "label_shift": [-0.006770410690669257, 0.0007466110447008205, 0.0008123026729152539, 0.0007466110447008205, 0.0008123026729152539],
          "latent_covariate_shift": [-4.80898346978952e-05, -4.80898346978952e-05, -4.80898346978952e-05, -4.80898346978952e-05, -4.80898346978952e-05],
          "concept_shift": [0.0005650555576821692, 0.001039942675307547, 0.0010699988219927702, 0.001039942675307547, 0.0010699988219927702],
          "residual": [0.04659546963508248, 0.04339344325386599, 0.05017567227623434, 0.04339344325386599, 0.05017567227623434],
          "overall": [-0.004163938423629783, -0.006165606573839889, -0.0009755903840502414, -0.006165606573839889, -0.0009755903840502414]
        }
      },
      "all": {
        "metrics": {
          "train": [0.5479047355455861, 0.5499936176446393, 0.5479047355455861, 0.5479047355455861, 0.5499936176446393],
          "validation": [0.5781614559029398, 0.5781614559029398, 0.579794680354643, 0.5781614559029398, 0.579794680354643],
          "id_test": [0.5838581758805692, 0.5857242827151854, 0.5857242827151854, 0.5838581758805692, 0.5857242827151854],
          "ood_validation": [0.4936440677966102, 0.4936440677966102, 0.4978813559322034, 0.4936440677966102, 0.4978813559322034],
          "ood_test": [0.5061607283001098, 0.5083974258358186, 0.5083974258358186, 0.5061607283001098, 0.5083974258358186]
        },
        "train_shifts": {
          "informativeness": [0.047310823329308666, 0.03916069171615847, -0.03494281200815709, 0.03916069171615847, -0.03494281200815709],
          "invariance": [0.45246196583376563, 0.23183736155103668, 0.03406036487489026, 0.23183736155103668, 0.03406036487489026],
          "label_shift": [0.003375592508434266, -0.0031805683642138712, -0.01792304390607593, -0.0031805683642138712, -0.01792304390607593],
          "latent_covariate_shift": [0.5112834211657711, 0.27543050585667334, 0.035071165436601395, 0.27543050585667334, 0.035071165436601395],
          "concept_shift": [-0.0049067178741159425, 0.0026920325007886658, -0.05160094229133961, 0.0026920325007886658, -0.05160094229133961],
          "residual": [0.05962285635834849, 0.023405030807815384, -0.051600942291340886, 0.023405030807815384, -0.051600942291340886],
          "overall": [0.02123984982823801, 0.03461593262866013, 0.0340024797566712, 0.03461593262866013, 0.0340024797566712]
        },
        "test_shifts": {
          "informativeness": [0.058871362498228615, 0.04496839263859891, -0.0178894185070239, 0.04496839263859891, -0.0178894185070239],
          "invariance": [0.00034865130154804766, 0.001971683222548193, -0.0178894185070239, 0.001971683222548193, -0.0178894185070239],
          "label_shift": [-0.006770410690669257, -0.004868900844769146, 0.0011850967860879177, -0.004868900844769146, 0.0011850967860879177],
          "latent_covariate_shift": [-4.80898346978952e-05, -4.80898346978952e-05, -0.01788941850702502, -4.80898346978952e-05, -0.01788941850702502],
          "concept_shift": [-4.808983469549263e-05, 0.0001322470454152075, -0.01788941850702278, 0.0001322470454152075, -0.01788941850702278],
          "residual": [0.05880695649570663, 0.04489025695499836, -0.0178894185070239, 0.04489025695499836, -0.0178894185070239],
          "overall": [-0.003495124993587867, -0.0034323247901146686, 0.009537257646554788, -0.0034323247901146686, 0.009537257646554788]
        }
      }
    },
    "acsfoodstamps": {
    "causal": {
      "metrics": {
        "train": [0.785849, 0.785849, 0.786141, 0.785849, 0.786141],
        "validation": [0.812762, 0.812762, 0.813105, 0.812762, 0.813105],
        "id_test": [0.809101, 0.809101, 0.809241, 0.809101, 0.809241],
        "ood_validation": [0.786411, 0.786411, 0.787148, 0.786411, 0.787148],
        "ood_test": [0.780126, 0.780126, 0.780801, 0.780126, 0.780801]
      },
      "train_shifts": {
        "informativeness": [0.076533, 0.065045, 0.071325, 0.065045, 0.071325],
        "invariance": [2.528118, 2.592678, 2.476122, 2.592678, 2.476122],
        "label_shift": [-0.005806, 0.005422, 0.001191, 0.005422, 0.001191],
        "latent_covariate_shift": [2.594300, 2.646860, 2.539826, 2.646860, 2.539826],
        "concept_shift": [0.110395, 0.109945, 0.104911, 0.109945, 0.104911],
        "residual": [0.079931, 0.073532, 0.076407, 0.073532, 0.076407],
        "overall": [-0.028407, -0.033658, -0.025090, -0.033658, -0.025090]
      },
      "test_shifts": {
        "informativeness": [0.080683, 0.084979, 0.087740, 0.084979, 0.087740],
        "invariance": [-0.000144, 0.000120, 0.000284, 0.000120, 0.000284],
        "label_shift": [-0.001596, 0.010002, 0.011091, 0.010002, 0.011091],
        "latent_covariate_shift": [0.000073, 0.000378, 0.000399, 0.000378, 0.000399],
        "concept_shift": [0.125247, 0.140813, 0.121897, 0.140813, 0.121897],
        "residual": [0.079624, 0.085612, 0.086230, 0.085612, 0.086230],
        "overall": [-0.062254, -0.065909, -0.053835, -0.065909, -0.053835]
      }
    },
    "arguablycausal": {
      "metrics": {
        "train": [0.783240, 0.681444, 0.782331, 0.681444, 0.782331],
        "validation": [0.807890, 0.664581, 0.819617, 0.664581, 0.819617],
        "id_test": [0.804192, 0.660986, 0.817177, 0.660986, 0.817177],
        "ood_validation": [0.779967, 0.650525, 0.798196, 0.650525, 0.798196],
        "ood_test": [0.774111, 0.645914, 0.788330, 0.645914, 0.788330]
      },
      "train_shifts": {
        "informativeness": [0.126082, 0.115856, 0.125655, 0.115856, 0.125655],
        "invariance": [1.606555, 1.720180, 1.478130, 1.720180, 1.478130],
        "label_shift": [-0.005806, 0.005422, 0.001191, 0.005422, 0.001191],
        "latent_covariate_shift": [1.721376, 1.823983, 1.604355, 1.823983, 1.604355],
        "concept_shift": [-0.011666, -0.007941, -0.012872, -0.007941, -0.012872],
        "residual": [0.120814, 0.085709, 0.132596, 0.085709, 0.132596],
        "overall": [0.065609, 0.088730, 0.063203, 0.088730, 0.063203]
      },
      "test_shifts": {
        "informativeness": [0.167381, 0.149783, 0.172557, 0.149783, 0.172557],
        "invariance": [0.000036, 0.000433, 0.000000, 0.000433, 0.000000],
        "label_shift": [-0.001596, 0.010002, 0.011091, 0.010002, 0.011091],
        "latent_covariate_shift": [0.000000, 0.000000, 0.000000, 0.000000, 0.000000],
        "concept_shift": [0.004040, 0.004581, 0.003751, 0.004581, 0.003751],
        "residual": [0.152033, 0.119911, 0.167038, 0.119911, 0.167038],
        "overall": [0.012512, 0.032366, 0.009189, 0.032366, 0.009189]
      }
    },
    "all": {
      "metrics": {
        "train": [0.820821, 0.800366, 0.821908, 0.800366, 0.821908],
        "validation": [0.814402, 0.815038, 0.819922, 0.815038, 0.819922],
        "id_test": [0.810551, 0.810729, 0.815765, 0.810729, 0.815765],
        "ood_validation": [0.788068, 0.789357, 0.795618, 0.789357, 0.795618],
        "ood_test": [0.780924, 0.782745, 0.789905, 0.782745, 0.789905]
      },
      "train_shifts": {
        "informativeness": [0.181982, 0.150014, 0.172458, 0.150014, 0.172458],
        "invariance": [1.655553, 1.478344, 1.545839, 1.478344, 1.545839],
        "label_shift": [-0.005806, 0.005422, 0.001191, 0.005422, 0.001191],
        "latent_covariate_shift": [1.729954, 1.565130, 1.648662, 1.565130, 1.648662],
        "concept_shift": [-0.007182, -0.008780, -0.009319, -0.008780, -0.009319],
        "residual": [0.179717, 0.151953, 0.181199, 0.151953, 0.181199],
        "overall": [0.040153, 0.048556, 0.047925, 0.048556, 0.047925]
      },
      "test_shifts": {
        "informativeness": [0.199005, 0.185916, 0.203150, 0.185916, 0.203150],
        "invariance": [0.000902, 0.001118, 0.000000, 0.001118, 0.000000],
        "label_shift": [-0.001596, 0.010002, 0.011091, 0.010002, 0.011091],
        "latent_covariate_shift": [0.000000, 0.000000, 0.000000, 0.000000, 0.000000],
        "concept_shift": [0.002525, 0.002380, 0.002417, 0.002380, 0.002417],
        "residual": [0.198998, 0.186464, 0.203134, 0.186464, 0.203134],
        "overall": [-0.002504, 0.002704, 0.004353, 0.002704, 0.004353]
      }
    }
  },
  "brfss_diabetes": {
    "causal": {
      "metrics": {
        "train": [0.1273229679686852, 0.1273229679686852, 0.8726770320313149, 0.1273229679686852, 0.8726770320313149],
        "validation": [0.1272579173234582, 0.1272579173234582, 0.8727420826765417, 0.1272579173234582, 0.8727420826765417],
        "id_test": [0.12664605173844182, 0.12664605173844182, 0.8733539482615582, 0.12664605173844182, 0.8733539482615582],
        "ood_validation": [0.17363863767558207, 0.17363863767558207, 0.8263613623244179, 0.17363863767558207, 0.8263613623244179],
        "ood_test": [0.17431016125101023, 0.17431016125101023, 0.8256898387489898, 0.17431016125101023, 0.8256898387489898]
      },
      "train_shifts": {
        "informativeness": [0.40575382110614866, 0.02745115455114848, 0.024779113994668537, 0.02745115455114848, 0.024779113994668537],
        "invariance": [0.3927679358234868, 0.010187023168985045, 0.006885943663801567, 0.010187023168985045, 0.006885943663801567],
        "label_shift": [0.017554929267790703, -0.008925562674817243, -2.2532771176831046e-05, -0.008925562674817243, -2.2532771176831046e-05],
        "latent_covariate_shift": [0.4022993597633462, 0.013060146813211002, 0.006466809980712902, 0.013060146813211002, 0.006466809980712902],
        "concept_shift": [0.043655480461925696, 0.033669894344752246, 0.032326023453650994, 0.033669894344752246, 0.032326023453650994],
        "residual": [0.4192639872428213, 0.02643943711704958, 0.019251087151020873, 0.02643943711704958, 0.019251087151020873],
        "overall": [-0.021794729763810472, -0.01884944925357287, -0.01085581811031058, -0.01884944925357287, -0.01085581811031058]
      },
      "test_shifts": {
        "informativeness": [0.320603532232479, 0.04044141428870524, 0.03184344558914692, 0.04044141428870524, 0.03184344558914692],
        "invariance": [0.43611074916140063, 0.15719965891915008, 0.1336726584843891, 0.15719965891915008, 0.1336726584843891],
        "label_shift": [0.015683151311908138, 0.013249473317606253, -0.0021312183477133926, 0.013249473317606253, -0.0021312183477133926],
        "latent_covariate_shift": [0.45180675716950647, 0.15019635816955557, 0.1432861943562174, 0.15019635816955557, 0.1432861943562174],
        "concept_shift": [0.06514086895678033, 0.12779367786309556, 0.10128778051197597, 0.12779367786309556, 0.10128778051197597],
        "residual": [0.40313456637273315, 0.04616205199177709, 0.034573977931033874, 0.04616205199177709, 0.034573977931033874],
        "overall": [-0.09941188895863728, -0.06649439035061375, -0.049633263835817495, -0.06649439035061375, -0.049633263835817495]
      }
    },
    "arguablycausal": {
      "metrics": {
        "train": [0.12471871972464711, 0.8752812802753529, 0.12471871972464711, 0.8752812802753529, 0.12471871972464711],
        "validation": [0.12547666606137642, 0.8745233339386236, 0.12547666606137642, 0.8745233339386236, 0.12547666606137642],
        "id_test": [0.12722650510919986, 0.8727734948908001, 0.12722650510919986, 0.8727734948908001, 0.12722650510919986],
        "ood_validation": [0.17125171939477304, 0.828748280605227, 0.17125171939477304, 0.828748280605227, 0.17125171939477304],
        "ood_test": [0.17419462686567164, 0.8258053731343283, 0.17419462686567164, 0.8258053731343283, 0.17419462686567164]
      },
      "train_shifts": {
        "informativeness": [0.026461787317131037, 0.043871307148236435, 0.052634299937629456, 0.043871307148236435, 0.052634299937629456],
        "invariance": [0.035562432757913195, 0.003943366445097828, 0.0001442695040896813, 0.003943366445097828, 0.0001442695040896813],
        "label_shift": [0.004410807874824522, 0.0011844314582365686, 0.001173587585282219, 0.0011844314582365686, 0.001173587585282219],
        "latent_covariate_shift": [0.0, -2.40449173489476e-05, 0.0, -2.40449173489476e-05, 0.0],
        "concept_shift": [0.0009377517765780433, 0.0018153912597857998, 0.0011180886566893842, 0.0018153912597857998, 0.0011180886566893842],
        "residual": [0.02717140576457989, 0.044138654773566315, 0.052694306946315016, 0.044138654773566315, 0.052694306946315016],
        "overall": [-0.016754306777282214, -0.00256653320732788, -0.00010439229643398329, -0.00256653320732788, -0.00010439229643398329]
      },
      "test_shifts": {
        "informativeness": [0.06514471041357092, 0.057386465539023684, 0.04673395619923277, 0.057386465539023684, 0.04673395619923277],
        "invariance": [0.16507371067407675, 0.0888578277247766, 0.10574602576988394, 0.0888578277247766, 0.10574602576988394],
        "label_shift": [0.004553317822596618, 0.010314087944422293, 0.0193389075900948, 0.010314087944422293, 0.0193389075900948],
        "latent_covariate_shift": [0.1295642828104366, 0.07527696813166225, 0.11315061509582909, 0.07527696813166225, 0.11315061509582909],
        "concept_shift": [-0.0005191601160111734, 0.007095888976907921, 0.004624210408192308, 0.007095888976907921, 0.004624210408192308],
        "residual": [0.02207390707522259, 0.05126719121285245, 0.05045090149804097, 0.05126719121285245, 0.05045090149804097],
        "overall": [0.02785232837583216, 0.0009379440133712447, 0.007342697955115621, 0.0009379440133712447, 0.007342697955115621]
      }
    },
    "all": {
      "metrics": {
        "train": [0.8752812802753529, 0.8752812802753529, 0.12471871972464711, 0.8752812802753529, 0.12471871972464711],
        "validation": [0.8745233339386236, 0.8745233339386236, 0.12547666606137642, 0.8745233339386236, 0.12547666606137642],
        "id_test": [0.8727734948908001, 0.8727734948908001, 0.12722650510919986, 0.8727734948908001, 0.12722650510919986],
        "ood_validation": [0.828748280605227, 0.828748280605227, 0.17125171939477304, 0.828748280605227, 0.17125171939477304],
        "ood_test": [0.8258053731343283, 0.8258053731343283, 0.17419462686567164, 0.8258053731343283, 0.17419462686567164]
      },
      "train_shifts": {
        "informativeness": [0.11857388342037983, 0.0782615977706043, 0.07467029656351223, 0.0782615977706043, 0.07467029656351223],
        "invariance": [0.0023443794414440672, 0.009617966939259818, 1.1211992763352213e-15, 0.009617966939259818, 1.1211992763352213e-15],
        "label_shift": [0.004410807874824522, 0.012883342436454523, -0.009360219372641473, 0.012883342436454523, -0.009360219372641473],
        "latent_covariate_shift": [0.0, -4.80898346978952e-05, 0.0, -4.80898346978952e-05, 0.0],
        "concept_shift": [0.0008656170245334429, 0.001358537830171172, 0.000577078016355682, 0.001358537830171172, 0.000577078016355682],
        "residual": [0.11850281204325457, 0.07721584269230339, 0.0746330774758595, 0.07721584269230339, 0.0746330774758595],
        "overall": [0.0006714770815487853, 0.00197512899446374, -0.004931429606846394, 0.00197512899446374, -0.004931429606846394]
      },
      "test_shifts": {
        "informativeness": [0.14316948135513846, 0.10112053380817108, 0.07125854162270867, 0.10112053380817108, 0.07125854162270867],
        "invariance": [0.12804395470360333, 0.10272798637906318, 0.10379585305333613, 0.10272798637906318, 0.10379585305333613],
        "label_shift": [0.007387840843629615, -0.000524659736159124, 0.005067784101228259, -0.000524659736159124, 0.005067784101228259],
        "latent_covariate_shift": [0.12419069720293814, 0.08666505158490595, 0.12118709271372759, 0.08666505158490595, 0.12118709271372759],
        "concept_shift": [0.005522824641078829, 0.0022993454534924037, -0.006455778193615094, 0.0022993454534924037, -0.006455778193615094],
        "residual": [0.1398038649520535, 0.09338806989222179, 0.08892889348463454, 0.09338806989222179, 0.08892889348463454],
        "overall": [0.002371495754027758, -0.0017110060759550766, -0.003212950884308466, -0.0017110060759550766, -0.003212950884308466]
      }
    }
  },
  "acsincome": {
    "causal": {
      "metrics": {
        "train": [0.9131455399061033, 0.9131455399061033, 0.9131455399061033, 0.9131455399061033, 0.9131455399061033],
        "validation": [0.6764864095180837, 0.6764864095180837, 0.6764864095180837, 0.6764864095180837, 0.6764864095180837],
        "id_test": [0.6791780579181855, 0.6791780579181855, 0.6791780579181855, 0.6791780579181855, 0.6791780579181855],
        "ood_validation": [0.5981031416716064, 0.5981031416716064, 0.5981031416716064, 0.5981031416716064, 0.5981031416716064],
        "ood_test": [0.6020339608225422, 0.6020339608225422, 0.6020339608225422, 0.6020339608225422, 0.6020339608225422]
      },
      "train_shifts": {
        "informativeness": [0.12579463333273697, 0.12364556568342625, 0.1269498404169275, 0.12364556568342625, 0.1269498404169275],
        "invariance": [1.3337261572827095, 1.337711312715413, 1.3422003330340904, 1.337711312715413, 1.3422003330340904],
        "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.008082415533674643, 0.014770968001511706],
        "latent_covariate_shift": [1.3216001730144318, 1.3252713057847, 1.3291327530961932, 1.3252713057847, 1.3291327530961932],
        "concept_shift": [0.20655779509164718, 0.19712802326525564, 0.20374525544095967, 0.19712802326525564, 0.20374525544095967],
        "residual": [0.12616826657625665, 0.1235216372874669, 0.13298143302379292, 0.1235216372874669, 0.13298143302379292],
        "overall": [-0.10210882045641115, -0.10061887893518759, -0.10705252629553799, -0.10061887893518759, -0.10705252629553799]
      },
      "test_shifts": {
        "informativeness": [0.15856739683350887, 0.14524187916219156, 0.1574026901425328, 0.14524187916219156, 0.1574026901425328],
        "invariance": [-0.0001592053123352428, 0.0009621915834681319, 0.0004613998977529533, 0.0009621915834681319, 0.0004613998977529533],
        "label_shift": [0.003482233702930959, 0.020133433797550723, -0.00486302279645367, 0.020133433797550723, -0.00486302279645367],
        "latent_covariate_shift": [-0.00017583857124067455, 0.0015546754655172178, 0.000515739079339451, 0.0015546754655172178, 0.000515739079339451],
        "concept_shift": [0.10839669749407493, 0.10334255667939156, 0.09902694127644407, 0.10334255667939156, 0.09902694127644407],
        "residual": [0.15717172423172263, 0.1501063647916234, 0.15185414777776787, 0.1501063647916234, 0.15185414777776787],
        "overall": [-0.051069875923238445, -0.0461728051293277, -0.0463692700808907, -0.0461728051293277, -0.0463692700808907]
      }
    },
    "arguablycausal": {
      "metrics": {
        "train": [0.9131455399061033, 0.8446561723280862, 0.9244683789008561, 0.8446561723280862, 0.9244683789008561],
        "validation": [0.6764864095180837, 0.7169002942758599, 0.8057336328829542, 0.7169002942758599, 0.8057336328829542],
        "id_test": [0.6791780579181855, 0.7146238355609559, 0.8052602268124747, 0.7146238355609559, 0.8052602268124747],
        "ood_validation": [0.5981031416716064, 0.7370480142264375, 0.7826911677534084, 0.7370480142264375, 0.7826911677534084],
        "ood_test": [0.6020339608225422, 0.7394712228794246, 0.782692890358446, 0.7394712228794246, 0.782692890358446]
      },
      "train_shifts": {
        "informativeness": [0.3355880146130698, 0.3009767423485443, 0.3316969553716261, 0.3009767423485443, 0.3316969553716261],
        "invariance": [1.4579962929889225, 2.0581670323286354, 1.7407196212349312, 2.0581670323286354, 1.7407196212349312],
        "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.008082415533674643, 0.014770968001511706],
        "latent_covariate_shift": [1.557239796069236, 2.13843334230836, 1.8455585670930894, 2.13843334230836, 1.8455585670930894],
        "concept_shift": [-0.011581724871820505, -0.01075819831156686, -0.012477373881422369, -0.01075819831156686, -0.012477373881422369],
        "residual": [0.33370179118414783, 0.17835130970653681, 0.3419745318359259, 0.17835130970653681, 0.3419745318359259],
        "overall": [0.06490553987205988, 0.17217889455449056, 0.0557660674062464, 0.17217889455449056, 0.0557660674062464]
      },
      "test_shifts": {
        "informativeness": [0.42308300719035963, 0.3892030864518937, 0.41587637699631774, 0.3892030864518937, 0.41587637699631774],
        "invariance": [0.002204807107771058, 0.00003606737602197985, 0.000004619512231236604, 0.00003606737602197985, 0.000004619512231236604],
        "label_shift": [0.003482233702930959, 0.020133433797550723, -0.00486302279645367, 0.020133433797550723, -0.00486302279645367],
        "latent_covariate_shift": [0.000005773702524787593, 0.0000018551026968969317, 0.0000009475786904363412, 0.0000018551026968969317, 0.0000009475786904363412],
        "concept_shift": [0.01755399191001646, 0.016059600296829277, 0.01654891436486428, 0.016059600296829277, 0.01654891436486428],
        "residual": [0.4231075873358167, 0.22684706298582313, 0.41526328660946915, 0.22684706298582313, 0.41526328660946915],
        "overall": [-0.008159975951622989, 0.16437583407976875, -0.01007668047257032, 0.16437583407976875, -0.01007668047257032]
      }
    },
    "all": {
      "metrics": {
        "train": [0.9131455399061033, 0.3696492681579674, 0.9230875448771058, 0.3696492681579674, 0.9230875448771058],
        "validation": [0.6764864095180837, 0.5037939436129482, 0.809176344017973, 0.5037939436129482, 0.809176344017973],
        "id_test": [0.6791780579181855, 0.5003227521263669, 0.8071904110976104, 0.5003227521263669, 0.8071904110976104],
        "ood_validation": [0.5981031416716064, 0.5754593953764078, 0.78814463544754, 0.5754593953764078, 0.78814463544754],
        "ood_test": [0.6020339608225422, 0.5744753724756623, 0.7914268024396991, 0.5744753724756623, 0.7914268024396991]
      },
      "train_shifts": {
        "informativeness": [0.34351870471470214, 0.3497944864337984, 0.3526851511294667, 0.3497944864337984, 0.3526851511294667],
        "invariance": [1.46223191761976, 1.675794398585982, 1.3904180005776663, 1.675794398585982, 1.3904180005776663],
        "label_shift": [0.015213404934141922, 0.008082415533674643, 0.014770968001511706, 0.008082415533674643, 0.014770968001511706],
        "latent_covariate_shift": [1.5574767044078366, 1.7447494736151816, 1.4767653694600733, 1.7447494736151816, 1.4767653694600733],
        "concept_shift": [-0.011490337808313586, -0.006301414710408688, -0.006855860793184234, -0.006301414710408688, -0.006855860793184234],
        "residual": [0.34226673438721006, 0.22880199494750902, 0.3614754995714818, 0.22880199494750902, 0.3614754995714818],
        "overall": [0.0622262350927581, 0.16266194412293083, 0.04519675039653637, 0.16266194412293083, 0.04519675039653637]
      },
      "test_shifts": {
        "informativeness": [0.4294231450395157, 0.4156867582306524, 0.4210868177568113, 0.4156867582306524, 0.4210868177568113],
        "invariance": [0.0015508971689569865, 0.004039546114488492, 0.0002899291054842836, 0.004039546114488492, 0.0002899291054842836],
        "label_shift": [0.003482233702930959, 0.020133433797550723, -0.00486302279645367, 0.020133433797550723, -0.00486302279645367],
        "latent_covariate_shift": [0.000002633591064131417, 0.0000014391203746147608, 0.0000009475786904363412, 0.0000014391203746147608, 0.0000009475786904363412],
        "concept_shift": [0.009305383013734072, 0.009062529348517452, 0.008259429109089767, 0.009062529348517452, 0.008259429109089767],
        "residual": [0.4293900768726635, 0.25827912206245923, 0.42133521328361373, 0.25827912206245923, 0.42133521328361373],
        "overall": [-0.00365263827749579, 0.16092403489565282, -0.0069541122429711, 0.16092403489565282, -0.0069541122429711]
      }
    }
  },
  "acsunemployment": {
    "causal": {
      "metrics": {
        "train": [0.98139558291883, 0.98139558291883, 0.9690988852448016, 0.98139558291883, 0.9690988852448016],
        "validation": [0.9665910612032423, 0.966572469695843, 0.9309201556728887, 0.966572469695843, 0.9309201556728887],
        "id_test": [0.966176060483996, 0.9661450748303535, 0.9293465125646826, 0.9661450748303535, 0.9293465125646826],
        "ood_validation": [0.9493949394939494, 0.9492849284928493, 0.8666666666666667, 0.9492849284928493, 0.8666666666666667],
        "ood_test": [0.9484875711290806, 0.9484264505442788, 0.866433186032724, 0.9484264505442788, 0.866433186032724]
      },
      "train_shifts": {
        "informativeness": [0.015725522941875583, 0.008765538687453462, 0.005643444891074857, 0.008765538687453462, 0.005643444891074857],
        "invariance": [0.1747961217476823, 0.15957690174775752, 0.15658313693386453, 0.15957690174775752, 0.15658313693386453],
        "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.0007035110240214094, 0.007083499996848578],
        "latent_covariate_shift": [0.16824331839092618, 0.15721454988156303, 0.15757420263085342, 0.15721454988156303, 0.15757420263085342],
        "concept_shift": [0.13361584376648178, 0.138132849398075, 0.12482892110618976, 0.138132849398075, 0.12482892110618976],
        "residual": [0.00684873534924653, 0.005599962484409691, 0.0078875492601309, 0.005599962484409691, 0.0078875492601309],
        "overall": [-0.057468597012347855, -0.06673026891708027, -0.06062128207523218, -0.06673026891708027, -0.06062128207523218]
      },
      "test_shifts": {
        "informativeness": [0.02027614312265445, 0.010565180196816236, 0.012813071374761774, 0.010565180196816236, 0.012813071374761774],
        "invariance": [0.3470847789106694, 0.3176207229931287, 0.3159405558971419, 0.3176207229931287, 0.3159405558971419],
        "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.003640261983926621, 0.008484502040884608, 0.003640261983926621],
        "latent_covariate_shift": [0.3432189369848049, 0.32044140799455334, 0.3198155990598044, 0.32044140799455334, 0.3198155990598044],
        "concept_shift": [0.12394314309714136, 0.12234604909905641, 0.11132294014333233, 0.12234604909905641, 0.11132294014333233],
        "residual": [0.01164210395447066, 0.012416118510945769, 0.01638547810925837, 0.012416118510945769, 0.01638547810925837],
        "overall": [-0.060965833297702096, -0.05737136934250311, -0.055476224232868174, -0.05737136934250311, -0.055476224232868174]
      }
    },
    "arguablycausal": {
      "metrics": {
        "train": [0.9835345037284325, 0.9813871949940866, 0.9814039708435736, 0.9813871949940866, 0.9814039708435736],
        "validation": [0.9722428794526661, 0.9665910612032423, 0.9552378473513299, 0.9665910612032423, 0.9552378473513299],
        "id_test": [0.9716977039630651, 0.966176060483996, 0.9545626374988381, 0.966176060483996, 0.9545626374988381],
        "ood_validation": [0.9609460946094609, 0.9493949394939494, 0.935093509350935, 0.9493949394939494, 0.935093509350935],
        "ood_test": [0.9602960681127797, 0.9484875711290806, 0.9343137075135535, 0.9484875711290806, 0.9343137075135535]
      },
      "train_shifts": {
        "informativeness": [0.06559145351517552, 0.03825087025692918, 0.025071387428834697, 0.03825087025692918, 0.025071387428834697],
        "invariance": [0.3073129741089418, 0.30965875005698096, 0.33179380527027463, 0.30965875005698096, 0.33179380527027463],
        "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.0007035110240214094, 0.007083499996848578],
        "latent_covariate_shift": [0.2836419323866442, 0.297095215641924, 0.33179674610576904, 0.297095215641924, 0.33179674610576904],
        "concept_shift": [0.005658873459536464, 0.006325228095988427, 0.003448440427205571, 0.006325228095988427, 0.003448440427205571],
        "residual": [0.009026125253369325, 0.022578115529542288, 0.013109219612805412, 0.022578115529542288, 0.013109219612805412],
        "overall": [0.0456393096275312, 0.006580128983874896, 0.013781168018597991, 0.006580128983874896, 0.013781168018597991]
      },
      "test_shifts": {
        "informativeness": [0.1054311825032758, 0.08025948002276079, 0.06899665979311806, 0.08025948002276079, 0.06899665979311806],
        "invariance": [0.3785545094539948, 0.3550978809516055, 0.3473676902393294, 0.3550978809516055, 0.3473676902393294],
        "label_shift": [-0.011390759908765893, 0.008484502040884608, 0.003640261983926621, 0.008484502040884608, 0.003640261983926621],
        "latent_covariate_shift": [0.3473820365716773, 0.3289218946748798, 0.34144993556993924, 0.3289218946748798, 0.34144993556993924],
        "concept_shift": [0.01982085819898444, 0.02520859256537849, 0.022884481113125712, 0.02520859256537849, 0.022884481113125712],
        "residual": [0.03248332813419533, 0.0563711638466109, 0.036924959168997185, 0.0563711638466109, 0.036924959168997185],
        "overall": [0.04175580887404655, 0.0024382777755401, 0.019490713724826247, 0.0024382777755401, 0.019490713724826247]
      }
    },
    "all": {
      "metrics": {
        "train": [0.9699021820917983, 0.9855243828155792, 0.9589379769966677, 0.9855243828155792, 0.9589379769966677],
        "validation": [0.9486998339158672, 0.9709662626112392, 0.9256959420936516, 0.9709662626112392, 0.9256959420936516],
        "id_test": [0.946382424937254, 0.9703095466798872, 0.9241966969293217, 0.9703095466798872, 0.9241966969293217],
        "ood_validation": [0.9283828382838284, 0.9585258525852586, 0.9043454345434544, 0.9585258525852586, 0.9043454345434544],
        "ood_test": [0.929387388378532, 0.9568366430130003, 0.9051164041537549, 0.9568366430130003, 0.9051164041537549]
      },
      "train_shifts": {
        "informativeness": [0.1085308576880384, 0.0955796655942448, 0.11190111761146801, 0.0955796655942448, 0.11190111761146801],
        "invariance": [0.2601564557620158, 0.27798675446250054, 0.2782482767860748, 0.27798675446250054, 0.2782482767860748],
        "label_shift": [0.007477877913284072, 0.0007035110240214094, 0.007083499996848578, 0.0007035110240214094, 0.007083499996848578],
        "latent_covariate_shift": [0.25147843695151395, 0.272725018806357, 0.2780035159370324, 0.272725018806357, 0.2780035159370324],
        "concept_shift": [0.0020398865181416215, 0.0018392340248462812, 0.0021411038280017966, 0.0018392340248462812, 0.0021411038280017966],
        "residual": [0.03736013805250659, 0.09391849668996678, 0.030722430835124406, 0.09391849668996678, 0.030722430835124406],
        "overall": [0.06955070592785212, -0.0015375604242061774, 0.08352750443624579, -0.0015375604242061774, 0.08352750443624579]
      },
      "test_shifts": {
        "informativeness": [0.16698445833296013, 0.1440573630401641, 0.1511676957435368, 0.1440573630401641, 0.1511676957435368],
        "invariance": [0.38883003077055917, 0.36325925825290295, 0.3613080807954454, 0.36325925825290295, 0.3613080807954454],
        "label_shift": [-0.011390759908765893, 0.008484502040884608, -0.00486302279645367, 0.008484502040884608, -0.00486302279645367],
        "latent_covariate_shift": [0.3797228173875563, 0.359224208330951, 0.3597218241641173, 0.359224208330951, 0.3597218241641173],
        "concept_shift": [0.014567337538648053, 0.00982708561559586, 0.017298688675405016, 0.00982708561559586, 0.017298688675405016],
        "residual": [0.07270640588625986, 0.12832331145930068, 0.04047769772257647, 0.12832331145930068, 0.04047769772257647],
        "overall": [0.07674539703149187, 0.01304523483253181, 0.10306765635955709, 0.01304523483253181, 0.10306765635955709]
      }
    }
  },
"assistments": {
    "causal": {
      "metrics": {
        "validation": [0.6903318502734782, 0.6903318502734782, 0.6903318502734782, 0.6903318502734782, 0.6903318502734782],
        "id_test":    [0.6924589032359716, 0.6924589032359716, 0.6924589032359716, 0.6924589032359716, 0.6924589032359716],
        "ood_test":   [0.4386149003147954, 0.4386149003147954, 0.4386149003147954, 0.4386149003147954, 0.4386149003147954],
        "ood_validation": [0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793]
      },
      "train_shifts": {
        "informativeness": [0.29752463194003365, 0.3553477840563324, 0.2911844422036177, 0.3553477840563324, 0.2911844422036177],
        "invariance":      [1.6437501646568717, 1.957399749582271, 1.8275305412541945, 1.957399749582271, 1.8275305412541945],
        "label_shift":     [0.02660028896165906, 0.008994641022265475, 0.013129028217462604, 0.008994641022265475, 0.013129028217462604],
        "latent_covariate_shift": [1.6688786547341359, 2.047567040446003, 1.852928118612994, 2.047567040446003, 1.852928118612994],
        "concept_shift":   [0.15965798338772882, 0.16260343980916117, 0.15603614402584115, 0.16260343980916117, 0.15603614402584115],
        "residual":        [0.5117066946708639, 0.586863716271995, 0.5306902177380958, 0.586863716271995, 0.5306902177380958],
        "overall":         [-0.26814666490523315, -0.2632366861772445, -0.29826054475926755, -0.2632366861772445, -0.29826054475926755]
      },
      "test_shifts": {
        "informativeness": [0.21545644824381074, 0.19609509360041494, 0.21605653440213798, 0.19609509360041494, 0.21605653440213798],
        "invariance":      [1.986209660154473, 1.9995634896675698, 2.0646882185629853, 1.9995634896675698, 2.0646882185629853],
        "label_shift":     [0.02329921323212632, 0.08065473411469921, 0.0465449048506624, 0.08065473411469921, 0.0465449048506624],
        "latent_covariate_shift": [2.059326869771794, 2.096115239819585, 2.1121253261182114, 2.096115239819585, 2.1121253261182114],
        "concept_shift":   [-0.005568024005660109, 0.03470317125743043, 0.043747390815670785, 0.03470317125743043, 0.043747390815670785],
        "residual":        [0.24185188030162227, 0.2439664553539039, 0.2701493074980709, 0.2439664553539039, 0.2701493074980709],
        "overall":         [0.02459679136974227, 0.023380294751152914, -0.02897546230082415, 0.023380294751152914, -0.02897546230082415]
      }
    },
    "arguablycausal": {
      "metrics": {
        "validation": [0.6903318502734782, 0.6903318502734782, 0.6903318502734782, 0.6903318502734782, 0.6903318502734782],
        "id_test":    [0.6924589032359716, 0.6924589032359716, 0.6924589032359716, 0.6924589032359716, 0.6924589032359716],
        "ood_test":   [0.4386149003147954, 0.4386149003147954, 0.4386149003147954, 0.4386149003147954, 0.4386149003147954],
        "ood_validation": [0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793]
      },
      "train_shifts": {
        "informativeness": [0.18588379626408955, 0.2350340418394394, 0.14488033008747667, 0.2350340418394394, 0.14488033008747667],
        "invariance":      [1.1973652576025677, 1.1823641483307479, 1.089007042502183, 1.1823641483307479, 1.089007042502183],
        "label_shift":     [0.02660028896165906, 0.008994641022265475, 0.010584968025361248, 0.008994641022265475, 0.010584968025361248],
        "latent_covariate_shift": [1.1956458954827212, 1.1885640276185678, 1.083583344017349, 1.1885640276185678, 1.083583344017349],
        "concept_shift":   [0.07240003686741989, 0.08107944620342356, 0.07318055231289436, 0.08107944620342356, 0.07318055231289436],
        "residual":        [0.44343826172450074, 0.4295326470592411, 0.2642993869562642, 0.4295326470592411, 0.2642993869562642],
        "overall":         [-0.28131402047321485, -0.22744106816647075, -0.15342869825497102, -0.22744106816647075, -0.15342869825497102]
      },
      "test_shifts": {
        "informativeness": [0.26486323608218265, 0.24951189863891673, 0.2592214532376226, 0.24951189863891673, 0.2592214532376226],
        "invariance":      [1.8519618610912916, 1.7807290671474658, 1.9877039154544751, 1.7807290671474658, 1.9877039154544751],
        "label_shift":     [0.02329921323212632, 0.05429385611444123, 0.030913719696912156, 0.05429385611444123, 0.030913719696912156],
        "latent_covariate_shift": [1.9229455238719215, 1.8818818879431667, 1.9854767112331344, 1.8818818879431667, 1.9854767112331344],
        "concept_shift":   [0.07359380164542259, 0.15071423983409465, 0.13132523433210555, 0.15071423983409465, 0.13132523433210555],
        "residual":        [0.2898129078142183, 0.27708092962776554, 0.29513904524198403, 0.27708092962776554, 0.29513904524198403],
        "overall":         [-0.014605134548368814, -0.025202812450825007, -0.08723695143262844, -0.025202812450825007, -0.08723695143262844]
      }
    },
    "all": {
      "metrics": {
        "validation": [0.6903318502734782, 0.6903318502734782, 0.6903318502734782, 0.6903318502734782, 0.6903318502734782],
        "id_test":    [0.6924589032359716, 0.6924589032359716, 0.6924589032359716, 0.6924589032359716, 0.6924589032359716],
        "ood_test":   [0.4386149003147954, 0.4386149003147954, 0.4386149003147954, 0.4386149003147954, 0.4386149003147954],
        "ood_validation": [0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793, 0.5424528301886793]
      },
      "train_shifts": {
        "informativeness": [0.1363449890952756, 0.2005686497499293, 0.2385108808338345, 0.2005686497499293, 0.2385108808338345],
        "invariance":      [0.9892023212571058, 1.2940814071600504, 0.9080668224576939, 1.2940814071600504, 0.9080668224576939],
        "label_shift":     [0.02660028896165906, 0.020116183344292597, 0.002728217550262214, 0.020116183344292597, 0.002728217550262214],
        "latent_covariate_shift": [0.9740990496125573, 1.2799446408773651, 0.9762513226866322, 1.2799446408773651, 0.9762513226866322],
        "concept_shift":   [-0.0004293680125118433, 0.0037943652515505474, -0.00467639458049566, 0.0037943652515505474, -0.00467639458049566],
        "residual":        [0.2600943465110196, 0.39133258735302656, 0.42453101256259823, 0.39133258735302656, 0.42453101256259823],
        "overall":         [-0.11778616475093276, -0.1896714116980689, -0.1482255755489157, -0.1896714116980689, -0.1482255755489157]
      },
      "test_shifts": {
        "informativeness": [0.21884674942957716, 0.2687075390869349, 0.2651669368755747, 0.2687075390869349, 0.2651669368755747],
        "invariance":      [1.8858090387472959, 1.9666337592956984, 1.6031932488451592, 1.9666337592956984, 1.6031932488451592],
        "label_shift":     [0.03028352221961338, -0.010147600388304819, 0.07740818412505449, -0.010147600388304819, 0.07740818412505449],
        "latent_covariate_shift": [1.8957597716279628, 2.0113115872747995, 1.7518201266162785, 2.0113115872747995, 1.7518201266162785],
        "concept_shift":   [-0.0056838686949808965, -0.009882415643874333, 0.015816551633726566, -0.009882415643874333, 0.015816551633726566],
        "residual":        [0.2669985108652552, 0.32267374604911, 0.31102880982280784, 0.32267374604911, 0.31102880982280784],
        "overall":         [-0.025192699538047453, -0.0317598853448397, 0.05924738218399045, -0.0317598853448397, 0.05924738218399045]
      }
    }
  },


  "acspubcov": {
    "causal": {
      "metrics": {
        "validation": [0.22317939378690485, 0.7968553120026518, 0.23668230224389503, 0.7968553120026518, 0.23668230224389503],
        "id_test":    [0.2240495864467972, 0.7957414603560032, 0.23726491766876606, 0.7957414603560032, 0.23726491766876606],
        "ood_test":   [0.6364000943907213, 0.6260379005645104, 0.6414864337791624, 0.6260379005645104, 0.6414864337791624],
        "ood_validation":[0.6400039614419649, 0.6252035741009727, 0.644823715832563, 0.6252035741009727, 0.644823715832563]
      },
      "train_shifts": {
        "informativeness": [0.023017683453396054, 0.030459984649773814, 0.028093306627841243, 0.030459984649773814, 0.028093306627841243],
        "invariance":      [0.0027628300983049427, 0.0019110082547603177, 0.0011701157499796767, 0.0019110082547603177, 0.0011701157499796767],
        "label_shift":     [0.016856964365221407, 0.014266508443450773, 0.010231313700030983, 0.014266508443450773, 0.010231313700030983],
        "latent_covariate_shift": [-0.0009042637826179954, 0.0013162056276792152, 0.0017594654557178426, 0.0013162056276792152, 0.0017594654557178426],
        "concept_shift":   [0.016351395883393197, 0.014633993893116353, 0.03096975191482735, 0.014633993893116353, 0.03096975191482735],
        "residual":        [0.024652737716312184, 0.009035799136396329, 0.03750791645848293, 0.009035799136396329, 0.03750791645848293],
        "overall":         [-0.0032158169624634907, 0.020943041475004143, -0.019489154085170785, 0.020943041475004143, -0.019489154085170785]
      },
      "test_shifts": {
        "informativeness": [0.05076439280003649, 0.05076439280003649, 0.05147799598092579, 0.05076439280003649, 0.05147799598092579],
        "invariance":      [0.0020417057191240732, 0.0020417057191240732, 0.0006171836420215138, 0.0020417057191240732, 0.0006171836420215138],
        "label_shift":     [-0.003372463110508083, -0.003372463110508083, 0.0020792925334653205, -0.003372463110508083, 0.0020792925334653205],
        "latent_covariate_shift": [0.0006055064083605201, 0.0006055064083605201, 0.0007011778968059959, 0.0006055064083605201, 0.0007011778968059959],
        "concept_shift":   [0.11503637600115771, 0.11503637600115771, 0.10957829765184879, 0.11503637600115771, 0.10957829765184879],
        "residual":        [0.04947606461206469, 0.04947606461206469, 0.05342370169920815, 0.04947606461206469, 0.05342370169920815],
        "overall":         [-0.058634191023242875, -0.058634191023242875, -0.055653211150081844, -0.058634191023242875, -0.055653211150081844]
      }
    },
    "arguablycausal": {
      "metrics": {
        "validation": [0.22317939378690485, 0.7968553120026518, 0.23668230224389503, 0.7968553120026518, 0.23668230224389503],
        "id_test":    [0.2240495864467972, 0.7957414603560032, 0.23726491766876606, 0.7957414603560032, 0.23726491766876606],
        "ood_test":   [0.6364000943907213, 0.6260379005645104, 0.6414864337791624, 0.6260379005645104, 0.6414864337791624],
        "ood_validation":[0.6400039614419649, 0.6252035741009727, 0.644823715832563, 0.6252035741009727, 0.644823715832563]
      },
      "train_shifts": {
        "informativeness": [0.0565234693950674, 0.11052938862476298, 0.07988558801221685, 0.11052938862476298, 0.07988558801221685],
        "invariance":      [0.05254642201393969, 0.0010742839226774922, 0.05075102475487279, 0.0010742839226774922, 0.05075102475487279],
        "label_shift":     [0.016856964365221407, 0.014266508443450773, 0.010231313700030983, 0.014266508443450773, 0.010231313700030983],
        "latent_covariate_shift": [0.0001214037528411742, 9.266030738507814e-05, -7.391093825237327e-06, 9.266030738507814e-05, -7.391093825237327e-06],
        "concept_shift":   [0.06085687560678981, 0.06186057204363043, 0.05753961433740358, 0.06186057204363043, 0.05753961433740358],
        "residual":        [0.05559000590834069, 0.09724023329871864, 0.0768182301536331, 0.09724023329871864, 0.0768182301536331],
        "overall":         [-0.047279001264606754, -0.010998688281691704, -0.045966000384451554, -0.010998688281691704, -0.045966000384451554]
      },
      "test_shifts": {
        "informativeness": [0.11827759277693504, 0.23061023514970622, 0.17344218434108827, 0.23061023514970622, 0.17344218434108827],
        "invariance":      [0.05352662070369538, 0.0009377517765793247, 0.05201109222089802, 0.0009377517765793247, 0.05201109222089802],
        "label_shift":     [-0.003372463110508083, 0.0056231408750471255, 0.0020792925334653205, 0.0056231408750471255, 0.0020792925334653205],
        "latent_covariate_shift": [1.0367668448506073e-05, 2.7385515821148096e-06, 1.696431733668995e-06, 2.7385515821148096e-06, 1.696431733668995e-06],
        "concept_shift":   [0.014358422394447934, 0.013500018845118502, 0.015401971807357086, 0.013500018845118502, 0.015401971807357086],
        "residual":        [0.11775250807571001, 0.20533989919692291, 0.15902406055491689, 0.20533989919692291, 0.15902406055491689],
        "overall":         [-0.03509848456887642, 0.020864390355249007, -0.01824791374535667, 0.020864390355249007, -0.01824791374535667]
      }
    },
    "all": {
      "metrics": {
        "validation": [0.22292978367789512, 0.7770881882499536, 0.36646358388197636, 0.7770881882499536, 0.36646358388197636],
        "id_test":    [0.22379797995934358, 0.7762120044250792, 0.36602154230783057, 0.7762120044250792, 0.36602154230783057],
        "ood_test":   [0.6362729359060103, 0.3637295094494649, 0.6741527148947825, 0.3637295094494649, 0.6741527148947825],
        "ood_validation":[0.6398499053655531, 0.3601500946344469, 0.6759650512786655, 0.3601500946344469, 0.6759650512786655]
      },
      "train_shifts": {
        "informativeness": [0.0004082341229237691, 0.10511546886599923, 0.002846350261034337, 0.10511546886599923, 0.002846350261034337],
        "invariance":      [0.0016230319210012666, 0.048186014365690394, 0.004292017746644754, 0.048186014365690394, 0.004292017746644754],
        "label_shift":     [0.016856964365221407, 0.014266508443450773, 0.010231313700030983, 0.014266508443450773, 0.010231313700030983],
        "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
        "concept_shift":   [0.0033903333460893314, 0.002452581569511448, 0.0036788723542670924, 0.002452581569511448, 0.0036788723542670924],
        "residual":        [0.00043771008517291864, 0.10416617551914374, 0.0033848338107061284, 0.10416617551914374, 0.0033848338107061284],
        "overall":         [0.005892323586816255, -0.017236750399020048, 0.0005917282498877768, -0.017236750399020048, 0.0005917282498877768]
      },
      "test_shifts": {
        "informativeness": [0.0006144318762230631, 0.20331645429689008, 0.0032630611056699206, 0.20331645429689008, 0.0032630611056699206],
        "invariance":      [1.1211992763352213e-15, 0.04079220228113503, 0.003570670226199391, 0.04079220228113503, 0.003570670226199391],
        "label_shift":     [-0.003372463110508083, 0.0056231408750471255, 0.0020792925334653205, 0.0056231408750471255, 0.0020792925334653205],
        "latent_covariate_shift": [0.0, 0.0, 0.0, 0.0, 0.0],
        "concept_shift":   [0.00288539008177825, 0.003390333346089652, 0.0020919078092890868, 0.003390333346089652, 0.0020919078092890868],
        "residual":        [0.0005727134080964691, 0.20295400219217888, 0.00227861638209272, 0.20295400219217888, 0.00227861638209272],
        "overall":         [-0.003087208128017133, -0.018917245271377586, -0.0008071980274343784, -0.018917245271377586, -0.0008071980274343784]
      }
    }
  },



  "brfss_blood_pressure": {
    "causal": {
      "metrics": {
        "train": [0.37695933355255945, 0.37695933355255945, 0.37695933355255945, 0.37695933355255945, 0.37695933355255945],
        "validation": [0.40220324572104543, 0.40220324572104543, 0.40220324572104543, 0.40220324572104543, 0.40220324572104543],
        "id_test": [0.40196658287742126, 0.40196658287742126, 0.40196658287742126, 0.40196658287742126, 0.40196658287742126],
        "ood_validation": [0.5835140997830802, 0.5835140997830802, 0.5835140997830802, 0.5835140997830802, 0.5835140997830802],
        "ood_test": [0.5842926061755961, 0.5842926061755961, 0.5842926061755961, 0.5842926061755961, 0.5842926061755961]
      },
      "train_shifts": {
        "informativeness": [0.10209533758950476, 0.10098889277799034, 0.11039654645255713, 0.10098889277799034, 0.11039654645255713],
        "invariance": [0.0705711973638247, 0.06534166469530568, 0.07157909541127701, 0.06534166469530568, 0.07157909541127701],
        "label_shift": [0.01572578048184541, 0.008211379500363864, 0.0112941417497322, 0.008211379500363864, 0.0112941417497322],
        "latent_covariate_shift": [0.06739636134760768, 0.05817369476045172, 0.07853093616436259, 0.05817369476045172, 0.07853093616436259],
        "concept_shift": [0.07064893933016522, 0.07236043283238824, 0.07339466359951155, 0.07236043283238824, 0.07339466359951155],
        "residual": [0.09716295416044868, 0.09299730148574259, 0.09903199045672066, 0.09299730148574259, 0.09903199045672066],
        "overall": [-0.024116614003212328, -0.02766692034119142, -0.01620978455251043, -0.02766692034119142, -0.01620978455251043]
      },
      "test_shifts": {
        "informativeness": [0.06802254386081065, 0.07442549178130371, 0.08757165224437427, 0.07442549178130371, 0.08757165224437427],
        "invariance": [0.03989767921750146, 0.030668202738024716, 0.05395037478719507, 0.030668202738024716, 0.05395037478719507],
        "label_shift": [0.02105310105154427, 0.013225881376363912, 0.014592304614744202, 0.013225881376363912, 0.014592304614744202],
        "latent_covariate_shift": [0.04530902835198197, 0.052030146309756005, 0.05473184140704238, 0.052030146309756005, 0.05473184140704238],
        "concept_shift": [0.06432191445791458, 0.0761113395797976, 0.07292304325624296, 0.0761113395797976, 0.07292304325624296],
        "residual": [0.0799075367413597, 0.06725298083195509, 0.09980038390310167, 0.06725298083195509, 0.09980038390310167],
        "overall": [-0.03081372501649393, -0.013589246366502578, -0.04100336766955312, -0.013589246366502578, -0.04100336766955312]
      }
    },
    "arguablycausal": {
      "metrics": {
        "train": [0.6230406664474405, 0.37695933355255945, 0.6230406664474405, 0.37695933355255945, 0.6230406664474405],
        "validation": [0.5977967542789545, 0.40220324572104543, 0.5977967542789545, 0.40220324572104543, 0.5977967542789545],
        "id_test": [0.5980334171225787, 0.40196658287742126, 0.5980334171225787, 0.40196658287742126, 0.5980334171225787],
        "ood_validation": [0.4164859002169197, 0.5835140997830802, 0.4164859002169197, 0.5835140997830802, 0.4164859002169197],
        "ood_test": [0.4157073938244039, 0.5842926061755961, 0.4157073938244039, 0.5842926061755961, 0.4157073938244039]
      },
      "train_shifts": {
        "informativeness": [0.09548139296380295, -0.007132494954065974, 0.08915048790072619, -0.007132494954065974, 0.08915048790072619],
        "invariance": [0.07974691101304347, -0.004530948471274605, 0.04611788693744185, -0.004530948471274605, 0.04611788693744185],
        "label_shift": [0.01572578048184541, -0.0008104149368126157, 0.022030101976591086, -0.0008104149368126157, 0.022030101976591086],
        "latent_covariate_shift": [0.07455477332008317, 0.0039258784941260585, 0.04839733477025502, 0.0039258784941260585, 0.04839733477025502],
        "concept_shift": [0.1226859870320291, 0.005829848336937636, 0.12288650108449932, 0.005829848336937636, 0.12288650108449932],
        "residual": [0.0921815433925679, 0.014966238950947635, 0.08461768988215632, 0.014966238950947635, 0.08461768988215632],
        "overall": [-0.05277632255033694, -0.021190452059188403, -0.04475567761897766, -0.021190452059188403, -0.04475567761897766]
      },
      "test_shifts": {
        "informativeness": [0.07952641743238671, -0.00033138862242324186, 0.06569051521470501, -0.00033138862242324186, 0.06569051521470501],
        "invariance": [0.06014170240500904, 0.004327718990908224, 0.035095559479942535, 0.004327718990908224, 0.035095559479942535],
        "label_shift": [0.02338099646990692, 0.01509751562984458, 0.0196391862539724, 0.01509751562984458, 0.0196391862539724],
        "latent_covariate_shift": [0.05952025178162438, -0.0039806990542786864, 0.04542282994958311, -0.0039806990542786864, 0.04542282994958311],
        "concept_shift": [0.11651657145389789, 0.017277395267454185, 0.1058659934099131, 0.017277395267454185, 0.1058659934099131],
        "residual": [0.0839015430884463, 0.005981774075746209, 0.07620010935589058, 0.005981774075746209, 0.07620010935589058],
        "overall": [-0.051253638459747404, -0.011557311539567709, -0.04845936248433563, -0.011557311539567709, -0.04845936248433563]
      }
    },
    "all": {
      "metrics": {
        "train": [0.37695933355255945, 0.37695933355255945, 0.37695933355255945, 0.37695933355255945, 0.37695933355255945],
        "validation": [0.40220324572104543, 0.40220324572104543, 0.40220324572104543, 0.40220324572104543, 0.40220324572104543],
        "id_test": [0.40196658287742126, 0.40196658287742126, 0.40196658287742126, 0.40196658287742126, 0.40196658287742126],
        "ood_validation": [0.5835140997830802, 0.5835140997830802, 0.5835140997830802, 0.5835140997830802, 0.5835140997830802],
        "ood_test": [0.5842926061755961, 0.5842926061755961, 0.5842926061755961, 0.5842926061755961, 0.5842926061755961]
      },
      "train_shifts": {
        "informativeness": [0.07436460027693002, 0.08229337072580914, 0.09539781627870154, 0.08229337072580914, 0.09539781627870154],
        "invariance": [0.030099235822969774, 0.04813988871604857, 0.05046040317002305, 0.04813988871604857, 0.05046040317002305],
        "label_shift": [0.01572578048184541, -0.0008104149368126157, 0.022030101976591086, -0.0008104149368126157, 0.022030101976591086],
        "latent_covariate_shift": [0.03267684123648923, 0.0496659599731287, 0.05027986243259644, 0.0496659599731287, 0.05027986243259644],
        "concept_shift": [0.011428222458809919, 0.015593456886188585, 0.015423813995263314, 0.015593456886188585, 0.015423813995263314],
        "residual": [0.07560862753906634, 0.08036024859708799, 0.0909571240080725, 0.08036024859708799, 0.0909571240080725],
        "overall": [0.002193554456141153, -0.005505778154239374, 0.0076535658925796085, -0.005505778154239374, 0.0076535658925796085]
      },
      "test_shifts": {
        "informativeness": [0.06863761646819104, 0.06654694588323387, 0.06943546097754033, 0.06654694588323387, 0.06943546097754033],
        "invariance": [0.029240837037353067, 0.03629818144677289, 0.04109199012973489, 0.03629818144677289, 0.04109199012973489],
        "label_shift": [0.02338099646990692, 0.01509751562984458, 0.0196391862539724, 0.01509751562984458, 0.0196391862539724],
        "latent_covariate_shift": [0.031646541190456116, 0.03933317172401004, 0.05141865148533185, 0.03933317172401004, 0.05141865148533185],
        "concept_shift": [0.016250873196803677, 0.018058597528077227, 0.014365586980060385, 0.018058597528077227, 0.014365586980060385],
        "residual": [0.07488423604674103, 0.06852353396483629, 0.0807290217607535, 0.06852353396483629, 0.0807290217607535],
        "overall": [-0.00147870586544685, -0.0019396338921001677, -0.0034934304684586803, -0.0019396338921001677, -0.0034934304684586803]
      }
    }
  }
  }
  