{
    "ade_corpus_v2_classification":{
        "pred":0.3759129893,
        "depvar":0.6359832473,
        "abs_diff":0.260070258,
        "coeff_avg_confidence":-0.047565332,
        "pval_avg_confidence":0.7394542602,
        "intercept":0.4142414807,
        "pval_intercept":0.0004710088
    },
    "anli":{
        "pred":0.4098334706,
        "depvar":0.1422328903,
        "abs_diff":0.2676005804,
        "coeff_avg_confidence":-0.0645325503,
        "pval_avg_confidence":0.655017771,
        "intercept":0.4438113336,
        "pval_intercept":0.000276624
    },
    "banking77":{
        "pred":0.3937881992,
        "depvar":0.4196436442,
        "abs_diff":0.025855445,
        "coeff_avg_confidence":-0.0233559418,
        "pval_avg_confidence":0.8741685775,
        "intercept":0.4049112575,
        "pval_intercept":0.0012566931
    },
    "boolean_expressions":{
        "pred":0.3887976413,
        "depvar":0.3344918831,
        "abs_diff":0.0543057582,
        "coeff_avg_confidence":-0.0235820115,
        "pval_avg_confidence":0.8743177708,
        "intercept":0.4077460302,
        "pval_intercept":0.0008628705
    },
    "boolq":{
        "pred":0.4070242581,
        "depvar":0.146029937,
        "abs_diff":0.2609943211,
        "coeff_avg_confidence":0.0310630837,
        "pval_avg_confidence":0.8342147972,
        "intercept":0.3759841705,
        "pval_intercept":0.0015297705
    },
    "circa":{
        "pred":0.3610332203,
        "depvar":0.6433464357,
        "abs_diff":0.2823132153,
        "coeff_avg_confidence":0.0516817542,
        "pval_avg_confidence":0.7317195006,
        "intercept":0.3432874133,
        "pval_intercept":0.0046923513
    },
    "commonsense_qa":{
        "pred":0.3877150057,
        "depvar":0.4738480301,
        "abs_diff":0.0861330244,
        "coeff_avg_confidence":-0.0251904985,
        "pval_avg_confidence":0.8649708386,
        "intercept":0.4042046507,
        "pval_intercept":0.0009258147
    },
    "fig_qa":{
        "pred":0.3888165702,
        "depvar":0.3996823311,
        "abs_diff":0.0108657609,
        "coeff_avg_confidence":-0.0277681619,
        "pval_avg_confidence":0.8519839716,
        "intercept":0.4085328484,
        "pval_intercept":0.0008623531
    },
    "formal_fallacies_syllogisms_negation":{
        "pred":0.395626652,
        "depvar":0.1835028233,
        "abs_diff":0.2121238287,
        "coeff_avg_confidence":-0.0060848282,
        "pval_avg_confidence":0.9236960009,
        "intercept":0.4006276041,
        "pval_intercept":0.0007882318
    },
    "high":{
        "pred":0.3909765544,
        "depvar":0.4576005125,
        "abs_diff":0.0666239581,
        "coeff_avg_confidence":-0.0148900168,
        "pval_avg_confidence":0.9020893386,
        "intercept":0.3975648194,
        "pval_intercept":0.0015122045
    },
    "hyperbaton":{
        "pred":0.3803351586,
        "depvar":0.5693484241,
        "abs_diff":0.1890132654,
        "coeff_avg_confidence":-0.037496577,
        "pval_avg_confidence":0.7973723564,
        "intercept":0.4094785361,
        "pval_intercept":0.0006646854
    },
    "medmcqa":{
        "pred":0.3961605189,
        "depvar":0.3096702923,
        "abs_diff":0.0864902266,
        "coeff_avg_confidence":-0.0353652969,
        "pval_avg_confidence":0.8122375951,
        "intercept":0.4171520987,
        "pval_intercept":0.0007446496
    },
    "mmlu":{
        "pred":0.3855034578,
        "depvar":0.3605165295,
        "abs_diff":0.0249869283,
        "coeff_avg_confidence":-0.0238931054,
        "pval_avg_confidence":0.8729759176,
        "intercept":0.4069849151,
        "pval_intercept":0.0009436805
    },
    "mnist_ascii":{
        "pred":0.4073518532,
        "depvar":0.3484815647,
        "abs_diff":0.0588702885,
        "coeff_avg_confidence":-0.044206462,
        "pval_avg_confidence":0.7786191145,
        "intercept":0.4224817639,
        "pval_intercept":0.0012066953
    },
    "mnli":{
        "pred":0.3879774562,
        "depvar":0.3841092911,
        "abs_diff":0.0038681651,
        "coeff_avg_confidence":-0.0274174008,
        "pval_avg_confidence":0.8541356513,
        "intercept":0.4087747644,
        "pval_intercept":0.0008610277
    },
    "mrpc":{
        "pred":0.3938084385,
        "depvar":0.227715013,
        "abs_diff":0.1660934255,
        "coeff_avg_confidence":-0.0212874047,
        "pval_avg_confidence":0.8827859258,
        "intercept":0.4098546506,
        "pval_intercept":0.0006911279
    },
    "object_counting":{
        "pred":0.3830506447,
        "depvar":0.495369272,
        "abs_diff":0.1123186273,
        "coeff_avg_confidence":-0.0333783432,
        "pval_avg_confidence":0.8216691134,
        "intercept":0.4091168509,
        "pval_intercept":0.0007994693
    },
    "overruling":{
        "pred":0.375150936,
        "depvar":0.4726776467,
        "abs_diff":0.0975267108,
        "coeff_avg_confidence":-0.0451943336,
        "pval_avg_confidence":0.7659965443,
        "intercept":0.417960877,
        "pval_intercept":0.000724238
    },
    "qnli":{
        "pred":0.3586060966,
        "depvar":0.6462857332,
        "abs_diff":0.2876796365,
        "coeff_avg_confidence":-0.0831741629,
        "pval_avg_confidence":0.5685731063,
        "intercept":0.4384911041,
        "pval_intercept":0.0002754644
    },
    "qqp":{
        "pred":0.3869238554,
        "depvar":0.382766081,
        "abs_diff":0.0041577744,
        "coeff_avg_confidence":-0.0273908947,
        "pval_avg_confidence":0.8544602992,
        "intercept":0.4087659329,
        "pval_intercept":0.0008522403
    },
    "quail":{
        "pred":0.3886983955,
        "depvar":0.4854499462,
        "abs_diff":0.0967515507,
        "coeff_avg_confidence":-0.0137454451,
        "pval_avg_confidence":0.9033231355,
        "intercept":0.3957505258,
        "pval_intercept":0.0013525841
    },
    "reasoning_about_colored_objects":{
        "pred":0.4091870845,
        "depvar":0.2807345474,
        "abs_diff":0.1284525371,
        "coeff_avg_confidence":-0.0558084631,
        "pval_avg_confidence":0.7141553499,
        "intercept":0.4330126364,
        "pval_intercept":0.0006907174
    },
    "rte":{
        "pred":0.3703796271,
        "depvar":0.4827788782,
        "abs_diff":0.1123992511,
        "coeff_avg_confidence":-0.0525458412,
        "pval_avg_confidence":0.7315237218,
        "intercept":0.4226686017,
        "pval_intercept":0.000690634
    },
    "sports_understanding":{
        "pred":0.3875441367,
        "depvar":0.33238561,
        "abs_diff":0.0551585266,
        "coeff_avg_confidence":-0.0205590728,
        "pval_avg_confidence":0.8860811551,
        "intercept":0.405633133,
        "pval_intercept":0.0009411089
    },
    "sst2":{
        "pred":0.3994481954,
        "depvar":0.2066002433,
        "abs_diff":0.1928479522,
        "coeff_avg_confidence":0.0137552603,
        "pval_avg_confidence":0.9098372128,
        "intercept":0.3859509264,
        "pval_intercept":0.0014031212
    },
    "temporal_sequences":{
        "pred":0.3694532884,
        "depvar":0.75,
        "abs_diff":0.3805467116,
        "coeff_avg_confidence":0.0341188996,
        "pval_avg_confidence":0.8048584907,
        "intercept":0.3524249053,
        "pval_intercept":0.0017735798
    },
    "toxicchat0124":{
        "pred":0.3729609327,
        "depvar":0.4645692793,
        "abs_diff":0.0916083466,
        "coeff_avg_confidence":-0.0473710201,
        "pval_avg_confidence":0.7571434497,
        "intercept":0.4197046078,
        "pval_intercept":0.0007493972
    },
    "tracking_shuffled_objects":{
        "pred":0.4224970835,
        "depvar":0.1958714588,
        "abs_diff":0.2266256246,
        "coeff_avg_confidence":-0.0821858888,
        "pval_avg_confidence":0.5856012582,
        "intercept":0.4549409471,
        "pval_intercept":0.0003536592
    },
    "web_of_lies":{
        "pred":0.3963524616,
        "depvar":0.2788861425,
        "abs_diff":0.1174663192,
        "coeff_avg_confidence":-0.0357055504,
        "pval_avg_confidence":0.8094509589,
        "intercept":0.4184263189,
        "pval_intercept":0.000669509
    },
    "wic":{
        "pred":0.3986870109,
        "depvar":0.1681799281,
        "abs_diff":0.2305070828,
        "coeff_avg_confidence":-0.0360944293,
        "pval_avg_confidence":0.801944363,
        "intercept":0.4224753932,
        "pval_intercept":0.0004434737
    }
}