{
  "models": {
    "Skywork-Reward-Llama-3.1-8B": {
      "model_name": "Skywork-Reward-Llama-3.1-8B",
      "model_path": "Skywork/Skywork-Reward-Llama-3.1-8B",
      "files": {
        "semantic_benchmark_chat_filtered.json": {
          "file_name": "semantic_benchmark_chat_filtered.json",
          "processed_samples": 200,
          "global_mean": 2.9518823665917537,
          "global_std": 16.874437799077988,
          "mean_variance": 0.6759854476616521,
          "mean_rvariance": 0.13279242987173057,
          "sample_results": [
            {
              "id": "chat_sample_306",
              "rewards": [
                0.48805286027711314,
                1.299190994950132,
                1.9288416017739365,
                1.3732675369294032,
                1.4399364247107471,
                -0.2883618953431223,
                1.8547650597946654
              ],
              "variance": 1.7069087185573548,
              "mean_reward": 1.1565275118704108,
              "min_reward": -0.2883618953431223,
              "max_reward": 1.9288416017739365,
              "num_responses": 7,
              "rvariance": 0.538031172205685
            },
            {
              "id": "chat_sample_202",
              "rewards": [
                0.12692971812816645,
                -0.7082832926881155,
                -0.8082866243601314,
                -0.7379139094798239,
                0.6102791545429105,
                -0.8860669934383661,
                -0.5601302087295732
              ],
              "variance": 1.1596682646854894,
              "mean_reward": -0.42335316514641896,
              "min_reward": -0.8860669934383661,
              "max_reward": 0.6102791545429105,
              "num_responses": 7,
              "rvariance": 0.2760466397077173
            },
            {
              "id": "chat_sample_298",
              "rewards": [
                0.24360027174551846,
                -0.44531156866170296,
                -1.078666002584471,
                -1.212003778147159,
                -0.6027242203676542,
                -0.19715515303114473,
                -0.9453282270217831
              ],
              "variance": 1.1111481296890668,
              "mean_reward": -0.6053698111526281,
              "min_reward": -1.212003778147159,
              "max_reward": 0.24360027174551846,
              "num_responses": 7,
              "rvariance": 0.23151440402241222
            },
            {
              "id": "chat_sample_268",
              "rewards": [
                0.029704256780373087,
                -1.67127833841864,
                -1.478679329272535,
                -0.6897641571932976,
                -1.2860803201264301,
                -1.3008956285222844,
                -0.8860669934383661
              ],
              "variance": 1.153742141327148,
              "mean_reward": -1.0404372157415973,
              "min_reward": -1.67127833841864,
              "max_reward": 0.029704256780373087,
              "num_responses": 7,
              "rvariance": 0.2871714746270867
            },
            {
              "id": "chat_sample_303",
              "rewards": [
                -0.4027175570236221,
                -0.7305062552818968,
                -0.4564230499585937,
                -1.0008856335062364,
                -0.4564230499585937,
                -1.6194247590331503,
                -0.4564230499585937
              ],
              "variance": 0.813360430932397,
              "mean_reward": -0.7318290506743839,
              "min_reward": -1.6194247590331503,
              "max_reward": -0.4027175570236221,
              "num_responses": 7,
              "rvariance": 0.17086844385621958
            },
            {
              "id": "chat_sample_65",
              "rewards": [
                -0.06937311811690204,
                -1.6194247590331503,
                -0.48234983965133854,
                -0.38882820540250873,
                -1.3823798246994827,
                -1.4120104414911911,
                -0.7008756384901884
              ],
              "variance": 1.233929998019709,
              "mean_reward": -0.8650345466978232,
              "min_reward": -1.6194247590331503,
              "max_reward": -0.06937311811690204,
              "num_responses": 7,
              "rvariance": 0.30988266845649115
            },
            {
              "id": "chat_sample_212",
              "rewards": [
                0.6769480423242545,
                0.5436102667615665,
                0.24174835819603668,
                1.3288216117418403,
                0.31026915952686246,
                -0.6360586642583261,
                1.1362226025957354
              ],
              "variance": 1.3226366570398858,
              "mean_reward": 0.5145087681268528,
              "min_reward": -0.6360586642583261,
              "max_reward": 1.3288216117418403,
              "num_responses": 7,
              "rvariance": 0.35954062709757434
            },
            {
              "id": "chat_sample_262",
              "rewards": [
                0.9806618644392662,
                -0.8231019327559858,
                -0.4860536667503021,
                0.9732542102413391,
                0.8176934720848696,
                -0.5953165661697271,
                0.8843623598662137
              ],
              "variance": 1.6626479847247404,
              "mean_reward": 0.2502142487079534,
              "min_reward": -0.8231019327559858,
              "max_reward": 0.9806618644392662,
              "num_responses": 7,
              "rvariance": 0.598505346969301
            },
            {
              "id": "chat_sample_178",
              "rewards": [
                0.9362159392517034,
                -0.005482100659780695,
                -0.5304995919378648,
                0.6325021171366918,
                -0.5767974306749092,
                0.573240883553275,
                -0.5860569984223181
              ],
              "variance": 1.3344889037565693,
              "mean_reward": 0.0633032597495425,
              "min_reward": -0.5860569984223181,
              "max_reward": 0.9362159392517034,
              "num_responses": 7,
              "rvariance": 0.36210445095867116
            },
            {
              "id": "chat_sample_290",
              "rewards": [
                0.2732308885372269,
                -0.911993783131111,
                0.09729910133645799,
                0.38064187440717,
                -0.38697629185302695,
                -0.1284028625066337,
                0.38434570150613356
              ],
              "variance": 0.979106693611016,
              "mean_reward": -0.041693624529111885,
              "min_reward": -0.911993783131111,
              "max_reward": 0.38434570150613356,
              "num_responses": 7,
              "rvariance": 0.1946477408759373
            },
            {
              "id": "chat_sample_292",
              "rewards": [
                0.4250877995947327,
                -1.597201796439369,
                -1.1453348903658152,
                -1.1601501987616694,
                -1.2934879743243572,
                -1.130519581969961,
                -1.2490420491367946
              ],
              "variance": 0.906696873826279,
              "mean_reward": -1.0215212416290333,
              "min_reward": -1.597201796439369,
              "max_reward": 0.4250877995947327,
              "num_responses": 7,
              "rvariance": 0.37089226949218673
            },
            {
              "id": "chat_sample_116",
              "rewards": [
                0.3510112576154616,
                0.10100292843542154,
                0.23248879044862777,
                -0.3517899344128732,
                -0.5379072461357919,
                -0.5267957648389012,
                0.5250911312667487
              ],
              "variance": 0.951883564433634,
              "mean_reward": -0.029556976803043828,
              "min_reward": -0.5379072461357919,
              "max_reward": 0.5250911312667487,
              "num_responses": 7,
              "rvariance": 0.16395443792174813
            },
            {
              "id": "chat_sample_106",
              "rewards": [
                1.1732608735853711,
                0.3732342202092429,
                -0.22562832385442708,
                0.7954705094910883,
                -0.21011854787751716,
                0.8176934720848696
              ],
              "variance": 1.2133506087010926,
              "mean_reward": 0.4539853672731046,
              "min_reward": -0.22562832385442708,
              "max_reward": 1.1732608735853711,
              "num_responses": 6,
              "rvariance": 0.2792804114801119
            },
            {
              "id": "chat_sample_251",
              "rewards": [
                -0.03140889035252559,
                -1.2490420491367946,
                -0.04900206907260248,
                -0.17909899592369738,
                -0.13419009234876428,
                0.1380411994250571,
                -0.2999363550273834
              ],
              "variance": 0.7159497782296552,
              "mean_reward": -0.257805321776673,
              "min_reward": -1.2490420491367946,
              "max_reward": 0.1380411994250571,
              "num_responses": 7,
              "rvariance": 0.17962132787929516
            },
            {
              "id": "chat_sample_280",
              "rewards": [
                -0.06983609650427249,
                -0.9601435354176373,
                -0.44531156866170296,
                -0.09437395103490605,
                -0.23604533757026205,
                -0.11104117298024205,
                -0.8823631663394026
              ],
              "variance": 0.8289165047480439,
              "mean_reward": -0.39987354692977506,
              "min_reward": -0.9601435354176373,
              "max_reward": -0.06983609650427249,
              "num_responses": 7,
              "rvariance": 0.12304026440795846
            },
            {
              "id": "chat_sample_58",
              "rewards": [
                -0.1439126384835436,
                -0.05363185294630692,
                -0.1731236811116976,
                -0.7342100823808604,
                -0.561982122279055,
                -0.1626053908736253,
                -0.9342167457248924
              ],
              "variance": 0.7064124234498242,
              "mean_reward": -0.3948117876857116,
              "min_reward": -0.9342167457248924,
              "max_reward": -0.05363185294630692,
              "num_responses": 7,
              "rvariance": 0.10235919860332222
            },
            {
              "id": "chat_sample_90",
              "rewards": [
                0.5769447106522385,
                -0.1263194597634667,
                -0.6749488487974434,
                -1.0601468670896532,
                0.05007530582467265,
                -0.31197379309901496
              ],
              "variance": 1.181057866182004,
              "mean_reward": -0.25772815871211124,
              "min_reward": -1.0601468670896532,
              "max_reward": 0.5769447106522385,
              "num_responses": 6,
              "rvariance": 0.27159691573879013
            },
            {
              "id": "chat_sample_180",
              "rewards": [
                0.7028748320169994,
                -0.6490220591046986,
                0.5473140938605301,
                0.513979649969858,
                0.03803786775304109
              ],
              "variance": 1.0148486251160145,
              "mean_reward": 0.23063687689914597,
              "min_reward": -0.6490220591046986,
              "max_reward": 0.7028748320169994,
              "num_responses": 5,
              "rvariance": 0.2428940990126355
            },
            {
              "id": "chat_sample_291",
              "rewards": [
                -0.7490253907767146,
                -0.9527358812197102,
                -1.1231119277720338,
                -1.2342267407409404,
                -1.597201796439369,
                -1.4194180956891183
              ],
              "variance": 0.6574293100660311,
              "mean_reward": -1.179286638772981,
              "min_reward": -1.597201796439369,
              "max_reward": -0.7490253907767146,
              "num_responses": 6,
              "rvariance": 0.07915669930725731
            },
            {
              "id": "chat_sample_129",
              "rewards": [
                -0.1544453967962212,
                -0.3443822802149461,
                -0.3249371879453874,
                -0.3091959227747923,
                -0.4638307041565208,
                -0.7749521804694595,
                -0.9082899560321475
              ],
              "variance": 0.5809915783111709,
              "mean_reward": -0.4685762326270679,
              "min_reward": -0.9082899560321475,
              "max_reward": -0.1544453967962212,
              "num_responses": 7,
              "rvariance": 0.0639104968812502
            },
            {
              "id": "chat_sample_31",
              "rewards": [
                -0.7119871197870791,
                -1.271265011730576,
                -1.404602787293264,
                -1.597201796439369,
                -1.33793389951192,
                -1.330526245313993
              ],
              "variance": 0.5092762261074889,
              "mean_reward": -1.2755861433460336,
              "min_reward": -1.597201796439369,
              "max_reward": -0.7119871197870791,
              "num_responses": 6,
              "rvariance": 0.07410835196137913
            },
            {
              "id": "chat_sample_294",
              "rewards": [
                0.48805286027711314,
                -0.7379139094798239,
                -0.2591942569387843,
                0.13063354522713,
                -0.08465140490012671,
                -0.5156842835420106,
                -0.1302547760561155
              ],
              "variance": 0.8781774051642594,
              "mean_reward": -0.15843031791608825,
              "min_reward": -0.7379139094798239,
              "max_reward": 0.48805286027711314,
              "num_responses": 7,
              "rvariance": 0.14018865801162966
            },
            {
              "id": "chat_sample_128",
              "rewards": [
                -0.8156942785580586,
                -1.5305329086580248,
                -1.330526245313993,
                -1.6120171048352232,
                -1.5083099460642435,
                -1.5009022918663164,
                -1.7157242636062027
              ],
              "variance": 0.5289065097319958,
              "mean_reward": -1.430529576986009,
              "min_reward": -1.7157242636062027,
              "max_reward": -0.8156942785580586,
              "num_responses": 7,
              "rvariance": 0.07475708767696777
            },
            {
              "id": "chat_sample_173",
              "rewards": [
                0.8547317430745052,
                -0.2735465869472681,
                -0.1725883623513005,
                0.8917700140641408,
                -0.2721576517851567,
                -0.1219211650834475,
                -0.18222410003844788
              ],
              "variance": 1.1422602773203607,
              "mean_reward": 0.10343769870471789,
              "min_reward": -0.2735465869472681,
              "max_reward": 0.8917700140641408,
              "num_responses": 7,
              "rvariance": 0.239668466659255
            },
            {
              "id": "chat_sample_174",
              "rewards": [
                -0.21567428852596252,
                -1.0490353857927626,
                -1.1749655071575236,
                -0.41568095186999454,
                -1.3823798246994827,
                -0.7379139094798239,
                -0.9082899560321475
              ],
              "variance": 0.9222529476419256,
              "mean_reward": -0.8405628319368138,
              "min_reward": -1.3823798246994827,
              "max_reward": -0.21567428852596252,
              "num_responses": 7,
              "rvariance": 0.14785509669534674
            },
            {
              "id": "chat_sample_297",
              "rewards": [
                0.5547217480584572,
                0.06766848454474954,
                -0.22447087788600095,
                -0.1334956247677086,
                -0.06844716134216115,
                0.06581657099526776,
                0.3065653324278989
              ],
              "variance": 0.5757136246951479,
              "mean_reward": 0.08119406743292894,
              "min_reward": -0.22447087788600095,
              "max_reward": 0.5547217480584572,
              "num_responses": 7,
              "rvariance": 0.062479328610932625
            },
            {
              "id": "chat_sample_264",
              "rewards": [
                -1.204596123949232,
                -1.6786859926165671,
                -1.1082966193761796,
                -1.1897808155533778,
                -1.4860869834704622
              ],
              "variance": 0.4607560911110662,
              "mean_reward": -1.333489306993164,
              "min_reward": -1.6786859926165671,
              "max_reward": -1.1082966193761796,
              "num_responses": 5,
              "rvariance": 0.04608482646698184
            },
            {
              "id": "chat_sample_275",
              "rewards": [
                0.9436235934496305,
                -0.7379139094798239,
                0.02692638645615042,
                0.5028681686729674,
                -0.3166035769727194,
                0.17322755686521088,
                -0.2726206301725272
              ],
              "variance": 1.164298048559194,
              "mean_reward": 0.04564394125984124,
              "min_reward": -0.7379139094798239,
              "max_reward": 0.9436235934496305,
              "num_responses": 7,
              "rvariance": 0.26836112615137636
            },
            {
              "id": "chat_sample_172",
              "rewards": [
                -0.0017782735608171387,
                -0.9860703251103822,
                -0.7897674888653137,
                -0.8490287224487306,
                -0.7379139094798239,
                -0.8934746476362933,
                -0.7119871197870791
              ],
              "variance": 0.5026093373293548,
              "mean_reward": -0.7100029266983486,
              "min_reward": -0.9860703251103822,
              "max_reward": -0.0017782735608171387,
              "num_responses": 7,
              "rvariance": 0.09113296534363599
            },
            {
              "id": "chat_sample_145",
              "rewards": [
                0.5473140938605301,
                0.7510245843035257,
                1.2102991445750066,
                1.1732608735853711,
                0.9362159392517034,
                1.7214272842319773,
                1.6547583964506334
              ],
              "variance": 1.0118855634368433,
              "mean_reward": 1.1420429023226784,
              "min_reward": 0.5473140938605301,
              "max_reward": 1.7214272842319773,
              "num_responses": 7,
              "rvariance": 0.16473704794625924
            },
            {
              "id": "chat_sample_270",
              "rewards": [
                1.8547650597946654,
                0.5991676732460198,
                1.4177134621169658,
                1.5140129666900182,
                0.9139929766579221,
                1.3954904995231845,
                1.365859882731476
              ],
              "variance": 0.862250948638716,
              "mean_reward": 1.2944289315371786,
              "min_reward": 0.5991676732460198,
              "max_reward": 1.8547650597946654,
              "num_responses": 7,
              "rvariance": 0.14583262213752599
            },
            {
              "id": "chat_sample_278",
              "rewards": [
                0.13989311297453888,
                -1.5379405628559522,
                -0.8527325495476942,
                -0.6230952694119537,
                -0.6434663184562532,
                -0.428644346716367,
                -0.7268024281829333
              ],
              "variance": 0.925586392030993,
              "mean_reward": -0.6675411945995163,
              "min_reward": -1.5379405628559522,
              "max_reward": 0.13989311297453888,
              "num_responses": 7,
              "rvariance": 0.21528281384539477
            },
            {
              "id": "chat_sample_165",
              "rewards": [
                0.2824904562846358,
                -0.6601335404015892,
                0.09729910133645799,
                0.7139863133138901,
                0.6658365610273639,
                0.613982981641874,
                0.6880595236211452
              ],
              "variance": 0.904104194857004,
              "mean_reward": 0.3430744852605397,
              "min_reward": -0.6601335404015892,
              "max_reward": 0.7139863133138901,
              "num_responses": 7,
              "rvariance": 0.21495133407290587
            },
            {
              "id": "chat_sample_127",
              "rewards": [
                1.0547384064185372,
                2.4325620872329803,
                2.4621927040246887,
                1.299190994950132,
                1.3214139575439132,
                1.306598649148059,
                1.3732675369294032
              ],
              "variance": 1.2430043744121695,
              "mean_reward": 1.607137762321102,
              "min_reward": 1.0547384064185372,
              "max_reward": 2.4621927040246887,
              "num_responses": 7,
              "rvariance": 0.291296808987387
            },
            {
              "id": "chat_sample_256",
              "rewards": [
                -0.2314155536965576,
                -1.597201796439369,
                -0.6749488487974434,
                -0.5323515054873466,
                -0.9786626709124551,
                -0.7934713159642772,
                -0.7934713159642772
              ],
              "variance": 0.8141011963521898,
              "mean_reward": -0.8002175724659608,
              "min_reward": -1.597201796439369,
              "max_reward": -0.2314155536965576,
              "num_responses": 7,
              "rvariance": 0.15401396427141817
            },
            {
              "id": "chat_sample_114",
              "rewards": [
                -0.021223365830375807,
                0.39916100990198783,
                -0.18401814128950836,
                -0.295306571153679,
                0.36953039311027935,
                -0.1439126384835436,
                -0.10594841071916715
              ],
              "variance": 0.6099161530621393,
              "mean_reward": 0.002611753647999044,
              "min_reward": -0.295306571153679,
              "max_reward": 0.39916100990198783,
              "num_responses": 7,
              "rvariance": 0.06418420946499405
            },
            {
              "id": "chat_sample_119",
              "rewards": [
                -0.12238414347081794,
                -0.26937978146093405,
                -0.6267990965109173,
                -0.043446328424157146,
                -0.013815711632448695,
                0.10285484198490333,
                -0.26845382468619317
              ],
              "variance": 0.44520001729541947,
              "mean_reward": -0.17734629202865212,
              "min_reward": -0.6267990965109173,
              "max_reward": 0.10285484198490333,
              "num_responses": 7,
              "rvariance": 0.049283361913654324
            },
            {
              "id": "chat_sample_179",
              "rewards": [
                -0.2103500370712024,
                -0.8490287224487306,
                -0.7601368720736053,
                -0.5175361970914923,
                -0.39808777314991767,
                -0.528647678388383,
                -0.6934679842922612
              ],
              "variance": 0.4727009335052239,
              "mean_reward": -0.5653221806450847,
              "min_reward": -0.8490287224487306,
              "max_reward": -0.2103500370712024,
              "num_responses": 7,
              "rvariance": 0.041780657422087406
            },
            {
              "id": "chat_sample_191",
              "rewards": [
                0.06766848454474954,
                0.5917600190480927,
                1.7066119758361231,
                2.358485545253709,
                1.4399364247107471,
                2.477008012420543,
                1.8399497513988112
              ],
              "variance": 2.0237711268736867,
              "mean_reward": 1.4973457447446823,
              "min_reward": 0.06766848454474954,
              "max_reward": 2.477008012420543,
              "num_responses": 7,
              "rvariance": 0.6756897400748826
            },
            {
              "id": "chat_sample_156",
              "rewards": [
                1.3732675369294032,
                2.8473907223168986,
                3.4992642917344843,
                3.5140796001303385,
                3.736309226068152,
                3.736309226068152
              ],
              "variance": 1.625980096445001,
              "mean_reward": 3.117770100541238,
              "min_reward": 1.3732675369294032,
              "max_reward": 3.736309226068152,
              "num_responses": 6,
              "rvariance": 0.6973624232685326
            },
            {
              "id": "chat_sample_166",
              "rewards": [
                0.05933487357208154,
                -0.9268090915269653,
                -0.511980456443047,
                -0.9453282270217831,
                -0.6971718113912247,
                -1.1897808155533778,
                -1.1971884697513049
              ],
              "variance": 0.9092895527955533,
              "mean_reward": -0.7727034283022317,
              "min_reward": -1.1971884697513049,
              "max_reward": 0.05933487357208154,
              "num_responses": 7,
              "rvariance": 0.16766545756219026
            },
            {
              "id": "chat_sample_245",
              "rewards": [
                -0.2314155536965576,
                -1.4860869834704622,
                -1.1120004464751432,
                -0.8119904514590951,
                -0.8156942785580586,
                -1.0601468670896532,
                -1.1749655071575236
              ],
              "variance": 0.719653605328619,
              "mean_reward": -0.9560428697009276,
              "min_reward": -1.4860869834704622,
              "max_reward": -0.2314155536965576,
              "num_responses": 7,
              "rvariance": 0.13279540929929795
            },
            {
              "id": "chat_sample_161",
              "rewards": [
                0.613982981641874,
                0.7250977946107807,
                0.8547317430745052,
                1.4769746957003826,
                0.573240883553275,
                1.3362292659397674,
                1.5584588918775808
              ],
              "variance": 0.9118822317648276,
              "mean_reward": 1.0198166080568807,
              "min_reward": 0.573240883553275,
              "max_reward": 1.5584588918775808,
              "num_responses": 7,
              "rvariance": 0.15392699982519398
            },
            {
              "id": "chat_sample_296",
              "rewards": [
                -1.478679329272535,
                -1.5305329086580248,
                -1.5009022918663164,
                -1.9675845063357245
              ],
              "variance": 0.3511228089817451,
              "mean_reward": -1.61942475903315,
              "min_reward": -1.9675845063357245,
              "max_reward": -1.478679329272535,
              "num_responses": 4,
              "rvariance": 0.04074345548167987
            },
            {
              "id": "chat_sample_130",
              "rewards": [
                -0.36290141570976386,
                -1.0749621754855074,
                -0.971255016714528,
                -0.645318232005735,
                -0.6749488487974434,
                -0.8119904514590951,
                -0.9416243999228195
              ],
              "variance": 0.4803863747355732,
              "mean_reward": -0.7832857914421274,
              "min_reward": -1.0749621754855074,
              "max_reward": -0.36290141570976386,
              "num_responses": 7,
              "rvariance": 0.050542511294105766
            },
            {
              "id": "chat_sample_18",
              "rewards": [
                1.1288149483978083,
                -0.035112717451489146,
                0.21952539560225534,
                -0.3841984215288043,
                -0.10409649716968537,
                0.4584222434854047,
                0.21211774140432824
              ],
              "variance": 0.9427165923636992,
              "mean_reward": 0.21363895610568825,
              "min_reward": -0.3841984215288043,
              "max_reward": 1.1288149483978083,
              "num_responses": 7,
              "rvariance": 0.2025350946249846
            },
            {
              "id": "chat_sample_44",
              "rewards": [
                0.247304098844482,
                -0.5323515054873466,
                0.21396965495381,
                -0.05918759359475226,
                -0.01937145228089403,
                0.16211607556832022,
                0.24360027174551846
              ],
              "variance": 0.4935349609368938,
              "mean_reward": 0.0365827928213054,
              "min_reward": -0.5323515054873466,
              "max_reward": 0.247304098844482,
              "num_responses": 7,
              "rvariance": 0.06721049851112923
            },
            {
              "id": "chat_sample_215",
              "rewards": [
                -0.2466938404797823,
                -1.104592792277216,
                -0.9601435354176373,
                -0.8971784747352568,
                -1.0342200773969084,
                -0.83791724115184
              ],
              "variance": 0.527100894021251,
              "mean_reward": -0.84679099357644,
              "min_reward": -1.104592792277216,
              "max_reward": -0.2466938404797823,
              "num_responses": 6,
              "rvariance": 0.07952907708522212
            },
            {
              "id": "chat_sample_300",
              "rewards": [
                -0.31382570664849674,
                -0.21405386417016595,
                -0.5656859493780185,
                -0.21405386417016595,
                -0.6934679842922612,
                -0.7008756384901884
              ],
              "variance": 0.48311794722105894,
              "mean_reward": -0.4503271678582161,
              "min_reward": -0.7008756384901884,
              "max_reward": -0.21405386417016595,
              "num_responses": 6,
              "rvariance": 0.04424707303494791
            },
            {
              "id": "chat_sample_169",
              "rewards": [
                -0.26289808403774784,
                -0.5582782951800914,
                -0.3693831131329501,
                -0.8453248953497671,
                -0.8045827972611679,
                -0.45827496350807545
              ],
              "variance": 0.5088132477201186,
              "mean_reward": -0.5497903580783,
              "min_reward": -0.8453248953497671,
              "max_reward": -0.26289808403774784,
              "num_responses": 6,
              "rvariance": 0.04592681887292236
            },
            {
              "id": "chat_sample_82",
              "rewards": [
                -0.6971718113912247,
                -1.1971884697513049,
                -1.0082932877041635,
                -1.2342267407409404,
                -1.2564497033347217,
                -1.1823731613554507,
                -1.1749655071575236
              ],
              "variance": 0.35927122859946514,
              "mean_reward": -1.10723838306219,
              "min_reward": -1.2564497033347217,
              "max_reward": -0.6971718113912247,
              "num_responses": 7,
              "rvariance": 0.03352257178908394
            },
            {
              "id": "chat_sample_77",
              "rewards": [
                -0.18997898802690283,
                -1.0194047690010541,
                -1.1897808155533778,
                -1.3675645163036285,
                -1.0749621754855074,
                -0.9971818064072728
              ],
              "variance": 0.6850922687114154,
              "mean_reward": -0.9731455117962907,
              "min_reward": -1.3675645163036285,
              "max_reward": -0.18997898802690283,
              "num_responses": 6,
              "rvariance": 0.13815521754067955
            },
            {
              "id": "chat_sample_277",
              "rewards": [
                -0.8342134140528764,
                -1.5009022918663164,
                -1.323118591116066,
                -1.5453482170538793,
                -1.3675645163036285
              ],
              "variance": 0.49779436210070194,
              "mean_reward": -1.3142294060785535,
              "min_reward": -1.5453482170538793,
              "max_reward": -0.8342134140528764,
              "num_responses": 5,
              "rvariance": 0.06432033505374528
            },
            {
              "id": "chat_sample_73",
              "rewards": [
                -1.1897808155533778,
                -1.4638640208766809,
                -1.4120104414911911,
                -1.4934946376683893,
                -1.7231319178041298,
                -1.67127833841864
              ],
              "variance": 0.39630949958910033,
              "mean_reward": -1.4922600286354015,
              "min_reward": -1.7231319178041298,
              "max_reward": -1.1897808155533778,
              "num_responses": 6,
              "rvariance": 0.030681818757603216
            },
            {
              "id": "chat_sample_6",
              "rewards": [
                0.313972986625826,
                0.5065719957719309,
                1.0177001354289017,
                0.8621393972724324,
                0.673244215225291,
                0.4436069350895505,
                1.0177001354289017
              ],
              "variance": 0.625946779724841,
              "mean_reward": 0.6907051144061193,
              "min_reward": 0.313972986625826,
              "max_reward": 1.0177001354289017,
              "num_responses": 7,
              "rvariance": 0.0686336707986932
            },
            {
              "id": "chat_sample_80",
              "rewards": [
                -0.43975582801325763,
                -0.8082866243601314,
                -0.8082866243601314,
                -0.8564363766466577
              ],
              "variance": 0.29167638404338014,
              "mean_reward": -0.7281913633450446,
              "min_reward": -0.8564363766466577,
              "max_reward": -0.43975582801325763,
              "num_responses": 4,
              "rvariance": 0.028118085788253807
            },
            {
              "id": "chat_sample_224",
              "rewards": [
                -0.8897708205373297,
                -1.3157109369181388,
                -1.597201796439369,
                -1.5379405628559522,
                -1.3823798246994827,
                -1.471271675074608,
                -1.3157109369181388
              ],
              "variance": 0.416310165923504,
              "mean_reward": -1.358569507634717,
              "min_reward": -1.597201796439369,
              "max_reward": -0.8897708205373297,
              "num_responses": 7,
              "rvariance": 0.0465477110925243
            },
            {
              "id": "chat_sample_267",
              "rewards": [
                1.165853219387444,
                0.2713789749877451,
                0.3065653324278989,
                0.9139929766579221,
                0.43619928089162335,
                0.3510112576154616,
                0.040815738077263755
              ],
              "variance": 0.8355833935261784,
              "mean_reward": 0.49797382572076554,
              "min_reward": 0.040815738077263755,
              "max_reward": 1.165853219387444,
              "num_responses": 7,
              "rvariance": 0.13450355200360362
            },
            {
              "id": "chat_sample_308",
              "rewards": [
                0.2158215685032918,
                -1.0008856335062364,
                -0.4267924331668852,
                -0.46753453125548433,
                -0.23974916466922563,
                -0.21891513723755562,
                -0.14912114534146112
              ],
              "variance": 0.6777309123522253,
              "mean_reward": -0.32673949666765095,
              "min_reward": -1.0008856335062364,
              "max_reward": 0.2158215685032918,
              "num_responses": 7,
              "rvariance": 0.11848872059943802
            },
            {
              "id": "chat_sample_252",
              "rewards": [
                1.5140129666900182,
                2.684422329962502,
                2.15107122771175,
                3.3659265161717964,
                2.7436835635459187,
                2.565899862795668,
                2.8473907223168986
              ],
              "variance": 1.1585571165558006,
              "mean_reward": 2.553201027027793,
              "min_reward": 1.5140129666900182,
              "max_reward": 3.3659265161717964,
              "num_responses": 7,
              "rvariance": 0.2917649121796179
            },
            {
              "id": "chat_sample_159",
              "rewards": [
                0.11211440973231221,
                0.03063021355511398,
                7.363998866463924e-05,
                0.45471841638644117,
                -0.8008789701622043,
                -0.040668458099934475,
                0.18804286526106512
              ],
              "variance": 0.639465748636058,
              "mean_reward": -0.007995411905505956,
              "min_reward": -0.8008789701622043,
              "max_reward": 0.45471841638644117,
              "num_responses": 7,
              "rvariance": 0.12832148224328813
            },
            {
              "id": "chat_sample_188",
              "rewards": [
                1.7806885178153942,
                -0.1147450000792056,
                3.617786758901318,
                2.417746778837126,
                3.217773432213254,
                3.217773432213254,
                3.5140796001303385
              ],
              "variance": 2.5330473529811757,
              "mean_reward": 2.521586217147354,
              "min_reward": -0.1147450000792056,
              "max_reward": 3.617786758901318,
              "num_responses": 7,
              "rvariance": 1.523715190942338
            },
            {
              "id": "chat_sample_88",
              "rewards": [
                0.5584255751574208,
                -1.1082966193761796,
                0.14915268072194776,
                0.230636876899146,
                0.15285650782091134,
                0.0621127438963042,
                0.313972986625826
              ],
              "variance": 0.8178050234511532,
              "mean_reward": 0.051265821677910925,
              "min_reward": -1.1082966193761796,
              "max_reward": 0.5584255751574208,
              "num_responses": 7,
              "rvariance": 0.2461436086607134
            },
            {
              "id": "chat_sample_27",
              "rewards": [
                0.38804952860509717,
                0.23619261754759135,
                0.38804952860509717,
                -0.19044196641427327,
                0.029704256780373087,
                -0.3175295337474603,
                -0.22470236707968616
              ],
              "variance": 0.649882762351893,
              "mean_reward": 0.04418886632810559,
              "min_reward": -0.3175295337474603,
              "max_reward": 0.38804952860509717,
              "num_responses": 7,
              "rvariance": 0.07596426836420285
            },
            {
              "id": "chat_sample_167",
              "rewards": [
                0.3287882950216802,
                -1.0490353857927626,
                0.07877996584164021,
                0.12692971812816645,
                0.1213739774797211,
                -0.05455780972104781,
                0.2936019375815265
              ],
              "variance": 0.7600253207073215,
              "mean_reward": -0.022017043065867985,
              "min_reward": -1.0490353857927626,
              "max_reward": 0.3287882950216802,
              "num_responses": 7,
              "rvariance": 0.19020163763080314
            },
            {
              "id": "chat_sample_76",
              "rewards": [
                0.8917700140641408,
                -0.16706155785206583,
                -0.03789058777571181,
                -0.2624351056503774,
                0.25285983949292734,
                0.46582989768333183
              ],
              "variance": 0.893548287624958,
              "mean_reward": 0.1905120833270408,
              "min_reward": -0.2624351056503774,
              "max_reward": 0.8917700140641408,
              "num_responses": 6,
              "rvariance": 0.15943961200967113
            },
            {
              "id": "chat_sample_209",
              "rewards": [
                -0.1769721889567144,
                -0.29623252792841986,
                -0.20282663827643266,
                -0.4193847789689581,
                -0.5138323699925288,
                -0.6934679842922612,
                0.060260830346822426
              ],
              "variance": 0.5036076344771222,
              "mean_reward": -0.32035080829549895,
              "min_reward": -0.6934679842922612,
              "max_reward": 0.060260830346822426,
              "num_responses": 7,
              "rvariance": 0.05232507700398522
            },
            {
              "id": "chat_sample_61",
              "rewards": [
                -0.2209985399807226,
                -1.104592792277216,
                -1.0268124231989813,
                -0.5638340358285368,
                -1.3527492079077743,
                -0.5434629867842372,
                -0.5342034190368283
              ],
              "variance": 0.7949338911150534,
              "mean_reward": -0.7638076292877567,
              "min_reward": -1.3527492079077743,
              "max_reward": -0.2209985399807226,
              "num_responses": 7,
              "rvariance": 0.13829417604596542
            },
            {
              "id": "chat_sample_118",
              "rewards": [
                -0.015667625181930475,
                -0.2503976675787458,
                0.7028748320169994,
                0.4695337247822954,
                0.48064520607918604,
                0.13618928587557533,
                0.8621393972724324
              ],
              "variance": 0.8761403002598293,
              "mean_reward": 0.34075959332368744,
              "min_reward": -0.2503976675787458,
              "max_reward": 0.8621393972724324,
              "num_responses": 7,
              "rvariance": 0.13678162679245434
            },
            {
              "id": "chat_sample_150",
              "rewards": [
                0.8917700140641408,
                1.0177001354289017,
                0.08063187939112199,
                0.48805286027711314,
                0.4695337247822954,
                0.49916434157400386,
                0.48064520607918604
              ],
              "variance": 0.6281690759842191,
              "mean_reward": 0.5610711659423947,
              "min_reward": 0.08063187939112199,
              "max_reward": 1.0177001354289017,
              "num_responses": 7,
              "rvariance": 0.08181503114355992
            },
            {
              "id": "chat_sample_120",
              "rewards": [
                -0.36567928603398653,
                -0.3017882685768652,
                -0.11243010814235338,
                0.513979649969858,
                0.26767514788878155,
                0.08063187939112199,
                0.18804286526106512
              ],
              "variance": 0.6935416242809259,
              "mean_reward": 0.03863312567966023,
              "min_reward": -0.36567928603398653,
              "max_reward": 0.513979649969858,
              "num_responses": 7,
              "rvariance": 0.08638244060479154
            },
            {
              "id": "chat_sample_244",
              "rewards": [
                0.8917700140641408,
                -0.040668458099934475,
                0.6362059442356554,
                0.23804453109707313,
                0.17322755686521088,
                1.0621460606164643
              ],
              "variance": 0.9106784879576644,
              "mean_reward": 0.493454274796435,
              "min_reward": -0.040668458099934475,
              "max_reward": 1.0621460606164643,
              "num_responses": 6,
              "rvariance": 0.15925169939758357
            },
            {
              "id": "chat_sample_8",
              "rewards": [
                1.7214272842319773,
                1.3880828453252574,
                1.165853219387444,
                0.34730743051649804,
                1.6547583964506334,
                1.5880895086692894,
                1.7362425926278315
              ],
              "variance": 0.8889185037512533,
              "mean_reward": 1.3716801824584188,
              "min_reward": 0.34730743051649804,
              "max_reward": 1.7362425926278315,
              "num_responses": 7,
              "rvariance": 0.21059548268754397
            },
            {
              "id": "chat_sample_40",
              "rewards": [
                2.81776010552519,
                0.6176868087408376,
                2.076994685732479,
                2.7881294887334813,
                2.1955171528993125,
                2.1214406109200414,
                1.158445565189517
              ],
              "variance": 1.8578396728401199,
              "mean_reward": 1.9679963453915514,
              "min_reward": 0.6176868087408376,
              "max_reward": 2.81776010552519,
              "num_responses": 7,
              "rvariance": 0.5658023757156574
            },
            {
              "id": "chat_sample_286",
              "rewards": [
                0.163967989117802,
                1.0547384064185372,
                1.0621460606164643,
                1.3584522285335487,
                1.4769746957003826,
                1.3584522285335487,
                1.4177134621169658
              ],
              "variance": 0.7429877160520895,
              "mean_reward": 1.1274921530053212,
              "min_reward": 0.163967989117802,
              "max_reward": 1.4769746957003826,
              "num_responses": 7,
              "rvariance": 0.17871337181644878
            },
            {
              "id": "chat_sample_307",
              "rewards": [
                -0.37864268088035896,
                -0.361975458935023,
                -0.19206239077006984,
                -0.6416144049067715,
                -0.5360553325863101,
                -0.8527325495476942,
                -0.6527258862036621
              ],
              "variance": 0.43871831987223325,
              "mean_reward": -0.5165441005471271,
              "min_reward": -0.8527325495476942,
              "max_reward": -0.19206239077006984,
              "num_responses": 7,
              "rvariance": 0.042255438241439125
            },
            {
              "id": "chat_sample_206",
              "rewards": [
                0.2565636665918909,
                -0.09344799426016516,
                -0.3777167241056181,
                -0.30641805245056963,
                0.07137231164371309,
                0.3065653324278989,
                0.45471841638644117
              ],
              "variance": 0.7007640871239049,
              "mean_reward": 0.044519565176227315,
              "min_reward": -0.3777167241056181,
              "max_reward": 0.45471841638644117,
              "num_responses": 7,
              "rvariance": 0.08615579935937547
            },
            {
              "id": "chat_sample_261",
              "rewards": [
                -1.0045894606052,
                -1.8786926559605992,
                -1.8120237681792553,
                -1.5601635254497335,
                -1.8268390765751095,
                -1.7749854971896197,
                -1.871285001762672
              ],
              "variance": 0.5363141639299231,
              "mean_reward": -1.6755112836745985,
              "min_reward": -1.8786926559605992,
              "max_reward": -1.0045894606052,
              "num_responses": 7,
              "rvariance": 0.08492601360293206
            },
            {
              "id": "chat_sample_79",
              "rewards": [
                1.106591985804027,
                0.21767348205277356,
                0.6880595236211452,
                0.46582989768333183,
                0.4843490331781496,
                0.706578659115963,
                0.5880561919491292
              ],
              "variance": 0.5000166583600801,
              "mean_reward": 0.6081626819149314,
              "min_reward": 0.21767348205277356,
              "max_reward": 1.106591985804027,
              "num_responses": 7,
              "rvariance": 0.0647107868695425
            },
            {
              "id": "chat_sample_69",
              "rewards": [
                -0.511980456443047,
                -0.8675478579435484,
                -0.8342134140528764,
                -0.911993783131111,
                -1.1453348903658152,
                -0.9490320541207466
              ],
              "variance": 0.37408653699531924,
              "mean_reward": -0.8700170760095242,
              "min_reward": -1.1453348903658152,
              "max_reward": -0.511980456443047,
              "num_responses": 6,
              "rvariance": 0.035547254967761184
            },
            {
              "id": "chat_sample_203",
              "rewards": [
                0.6436135984335826,
                0.7621360656004164,
                0.2621194072403362,
                0.7436169301055985,
                1.4399364247107471,
                1.1880761819812253
              ],
              "variance": 0.8611398005090267,
              "mean_reward": 0.8399164346786511,
              "min_reward": 0.2621194072403362,
              "max_reward": 1.4399364247107471,
              "num_responses": 6,
              "rvariance": 0.1448244644848803
            },
            {
              "id": "chat_sample_168",
              "rewards": [
                -0.02863102002830292,
                0.012111078060296196,
                0.24174835819603668,
                0.3287882950216802,
                0.42138397249576914,
                0.263971320789818,
                0.4324954537926598
              ],
              "variance": 0.4300143261896689,
              "mean_reward": 0.2388382083325653,
              "min_reward": -0.02863102002830292,
              "max_reward": 0.4324954537926598,
              "num_responses": 7,
              "rvariance": 0.028928889266281732
            },
            {
              "id": "chat_sample_265",
              "rewards": [
                0.4028648370009514,
                -0.0304829335777847,
                -0.4054954273478448,
                -0.1775653800155328,
                0.1565603349198749,
                -0.0221493226051167
              ],
              "variance": 0.571242989642102,
              "mean_reward": -0.012711315270908782,
              "min_reward": -0.4054954273478448,
              "max_reward": 0.4028648370009514,
              "num_responses": 6,
              "rvariance": 0.06386959294299548
            },
            {
              "id": "chat_sample_301",
              "rewards": [
                -0.9860703251103822,
                -1.4564563666787538,
                -1.3601568621057014,
                -1.1120004464751432,
                -1.2416343949388675,
                -1.2490420491367946,
                -1.1897808155533778
              ],
              "variance": 0.3370482660056837,
              "mean_reward": -1.227877322857003,
              "min_reward": -1.4564563666787538,
              "max_reward": -0.9860703251103822,
              "num_responses": 7,
              "rvariance": 0.02053326813672346
            },
            {
              "id": "chat_sample_196",
              "rewards": [
                0.052853176148895314,
                -0.13094924363717117,
                -0.2800282843704543,
                -0.0814105561885336,
                0.012111078060296196,
                -0.48790558029978387,
                -0.7082832926881155
              ],
              "variance": 0.6044645825508523,
              "mean_reward": -0.23194467185355241,
              "min_reward": -0.7082832926881155,
              "max_reward": 0.052853176148895314,
              "num_responses": 7,
              "rvariance": 0.06689430313376644
            },
            {
              "id": "chat_sample_225",
              "rewards": [
                -0.1189118055655396,
                0.03525999742881842,
                0.06952039809423131,
                0.2658232343392998,
                0.0880395335890491,
                0.004703423862369084,
                0.11026249618283043
              ],
              "variance": 0.21722945935421262,
              "mean_reward": 0.06495675399015122,
              "min_reward": -0.1189118055655396,
              "max_reward": 0.2658232343392998,
              "num_responses": 7,
              "rvariance": 0.011610514728548514
            },
            {
              "id": "chat_sample_126",
              "rewards": [
                0.33989977631857093,
                0.13989311297453888,
                0.8917700140641408,
                1.2769680323563506,
                0.4399031079905869,
                1.9288416017739365,
                1.6103124712630708
              ],
              "variance": 1.477827012486459,
              "mean_reward": 0.9467983023915993,
              "min_reward": 0.13989311297453888,
              "max_reward": 1.9288416017739365,
              "num_responses": 7,
              "rvariance": 0.39900925728868997
            },
            {
              "id": "chat_sample_162",
              "rewards": [
                -0.2249338562733714,
                -1.104592792277216,
                -0.9527358812197102,
                -0.8193981056570222,
                -1.1971884697513049,
                -0.8527325495476942,
                -0.7860636617663501
              ],
              "variance": 0.5800193236976932,
              "mean_reward": -0.8482350452132383,
              "min_reward": -1.1971884697513049,
              "max_reward": -0.2249338562733714,
              "num_responses": 7,
              "rvariance": 0.08451852305491045
            },
            {
              "id": "chat_sample_49",
              "rewards": [
                0.6843556965221816,
                0.7954705094910883,
                0.3213806408237531,
                0.2917500240320447,
                0.01859277548348242,
                -0.032334847127266475,
                -0.32030740407168296
              ],
              "variance": 0.8763254916147774,
              "mean_reward": 0.25127248502194294,
              "min_reward": -0.32030740407168296,
              "max_reward": 0.7954705094910883,
              "num_responses": 7,
              "rvariance": 0.1359346683271003
            },
            {
              "id": "chat_sample_177",
              "rewards": [
                0.3213806408237531,
                -0.17474953099547114,
                0.014888948384518864,
                -0.6008723068181724,
                0.08248379294060376
              ],
              "variance": 0.6562450981595853,
              "mean_reward": -0.07137369113295355,
              "min_reward": -0.6008723068181724,
              "max_reward": 0.3213806408237531,
              "num_responses": 5,
              "rvariance": 0.09528493638651384
            },
            {
              "id": "chat_sample_273",
              "rewards": [
                -0.1376624302540426,
                -0.6027242203676542,
                -0.4842017532008203,
                -0.7156909468860426,
                -0.6712450216984799,
                -0.5564263816306096,
                -0.4267924331668852
              ],
              "variance": 0.377882959771757,
              "mean_reward": -0.5135347410292193,
              "min_reward": -0.7156909468860426,
              "max_reward": -0.1376624302540426,
              "num_responses": 7,
              "rvariance": 0.032171252344148464
            },
            {
              "id": "chat_sample_285",
              "rewards": [
                -0.5823531713233545,
                -0.29021380889260406,
                0.06581657099526776,
                -0.0388165445504527,
                -0.1284028625066337,
                -0.2726206301725272,
                -0.24808277564189363
              ],
              "variance": 0.41010625553273977,
              "mean_reward": -0.21352474601317115,
              "min_reward": -0.5823531713233545,
              "max_reward": 0.06581657099526776,
              "num_responses": 7,
              "rvariance": 0.03748606610236547
            },
            {
              "id": "chat_sample_293",
              "rewards": [
                -0.5267957648389012,
                -0.11381904330446471,
                -0.5249438512894194,
                -0.3934579892762132,
                -0.5156842835420106,
                -0.3101218795495332,
                -0.25549042983982073
              ],
              "variance": 0.3268627414835339,
              "mean_reward": -0.37718760594862333,
              "min_reward": -0.5267957648389012,
              "max_reward": -0.11381904330446471,
              "num_responses": 7,
              "rvariance": 0.021761654063046598
            },
            {
              "id": "chat_sample_233",
              "rewards": [
                0.14915268072194776,
                -0.10826330265601938,
                0.2065620007558829,
                0.21211774140432824,
                -0.345308236989687,
                -0.17096793799550394,
                0.16026416201883845
              ],
              "variance": 0.44948835460843817,
              "mean_reward": 0.014793872465683857,
              "min_reward": -0.345308236989687,
              "max_reward": 0.21211774140432824,
              "num_responses": 7,
              "rvariance": 0.04203566665550333
            },
            {
              "id": "chat_sample_235",
              "rewards": [
                -1.0564430399906897,
                -1.2564497033347217,
                -1.2564497033347217,
                -0.9971818064072728,
                -1.2564497033347217,
                -1.2638573575326488,
                -1.1601501987616694
              ],
              "variance": 0.22667421845656976,
              "mean_reward": -1.1781402160994925,
              "min_reward": -1.2638573575326488,
              "max_reward": -0.9971818064072728,
              "num_responses": 7,
              "rvariance": 0.010517763591944953
            },
            {
              "id": "chat_sample_158",
              "rewards": [
                -0.20039600174273783,
                -0.9082899560321475,
                -0.9601435354176373,
                -0.7971751430632408,
                -0.9860703251103822,
                -0.937920572823856,
                -0.8527325495476942
              ],
              "variance": 0.4120507647596958,
              "mean_reward": -0.8061040119625279,
              "min_reward": -0.9860703251103822,
              "max_reward": -0.20039600174273783,
              "num_responses": 7,
              "rvariance": 0.06472425148551222
            },
            {
              "id": "chat_sample_216",
              "rewards": [
                -0.678652675896407,
                -0.7082832926881155,
                -0.6934679842922612,
                -0.9897741522093457,
                -0.43790391446377586,
                -0.7971751430632408,
                -0.9453282270217831
              ],
              "variance": 0.3807534257734537,
              "mean_reward": -0.7500836270907042,
              "min_reward": -0.9897741522093457,
              "max_reward": -0.43790391446377586,
              "num_responses": 7,
              "rvariance": 0.029328680748641655
            },
            {
              "id": "chat_sample_242",
              "rewards": [
                1.3880828453252574,
                1.1954838361791524,
                1.1880761819812253,
                1.5362359292837995,
                0.8547317430745052,
                0.7584322385014528,
                1.365859882731476
              ],
              "variance": 0.63113213766339,
              "mean_reward": 1.183843236725267,
              "min_reward": 0.7584322385014528,
              "max_reward": 1.5362359292837995,
              "num_responses": 7,
              "rvariance": 0.0697809715652975
            },
            {
              "id": "chat_sample_92",
              "rewards": [
                4.299290945110613,
                1.5584588918775808,
                3.0696203482547118,
                2.699237638358356,
                3.677047992484735,
                2.9066519559003154,
                1.3732675369294032
              ],
              "variance": 2.441562823636777,
              "mean_reward": 2.797653615559388,
              "min_reward": 1.3732675369294032,
              "max_reward": 4.299290945110613,
              "num_responses": 7,
              "rvariance": 0.9554658071891241
            },
            {
              "id": "chat_sample_250",
              "rewards": [
                -0.8008789701622043,
                -1.3749721705015556,
                -1.5379405628559522,
                -1.471271675074608,
                -1.1453348903658152,
                -1.4268257498870454
              ],
              "variance": 0.5314991887012704,
              "mean_reward": -1.2928706698078634,
              "min_reward": -1.5379405628559522,
              "max_reward": -0.8008789701622043,
              "num_responses": 6,
              "rvariance": 0.06339890496496003
            },
            {
              "id": "chat_sample_283",
              "rewards": [
                -0.4054954273478448,
                -0.3841984215288043,
                -0.2638240408124887,
                -0.22956364014707584,
                -0.5860569984223181,
                -0.44716348221118474,
                -0.8305095869539129
              ],
              "variance": 0.43371815328863245,
              "mean_reward": -0.44954451391766126,
              "min_reward": -0.8305095869539129,
              "max_reward": -0.22956364014707584,
              "num_responses": 7,
              "rvariance": 0.03612426105493507
            },
            {
              "id": "chat_sample_140",
              "rewards": [
                -0.24484192693030052,
                -0.4416077415627394,
                -0.5230919377399377,
                -0.4342000873648123,
                -0.7156909468860426,
                -0.42123669251843987,
                -0.6064280474666177
              ],
              "variance": 0.29945442095120367,
              "mean_reward": -0.48387105435269856,
              "min_reward": -0.7156909468860426,
              "max_reward": -0.24484192693030052,
              "num_responses": 7,
              "rvariance": 0.01937290520530904
            },
            {
              "id": "chat_sample_232",
              "rewards": [
                -0.4342000873648123,
                -0.018445495506153143,
                0.0204446890329642,
                0.0287783000056322,
                0.197302433008474,
                0.21396965495381,
                0.26026749369085445
              ],
              "variance": 0.4172361226982446,
              "mean_reward": 0.03830242683153849,
              "min_reward": -0.4342000873648123,
              "max_reward": 0.26026749369085445,
              "num_responses": 7,
              "rvariance": 0.04747100404412633
            },
            {
              "id": "chat_sample_0",
              "rewards": [
                0.9362159392517034,
                0.4436069350895505,
                1.0917766774081727,
                0.7658398926993799,
                -0.7823598346673866,
                0.39916100990198783,
                1.0547384064185372
              ],
              "variance": 1.1430010427401531,
              "mean_reward": 0.5584255751574209,
              "min_reward": -0.7823598346673866,
              "max_reward": 1.0917766774081727,
              "num_responses": 7,
              "rvariance": 0.3646843028746455
            },
            {
              "id": "chat_sample_34",
              "rewards": [
                1.7140196300340502,
                0.6250944629387647,
                1.3954904995231845,
                1.625127779658925,
                0.9732542102413391,
                1.158445565189517,
                2.0029181437532078
              ],
              "variance": 0.9955887242014041,
              "mean_reward": 1.3563357559055695,
              "min_reward": 0.6250944629387647,
              "max_reward": 2.0029181437532078,
              "num_responses": 7,
              "rvariance": 0.19148780154534203
            },
            {
              "id": "chat_sample_68",
              "rewards": [
                0.03063021355511398,
                -0.4045694705731039,
                0.197302433008474,
                0.18804286526106512,
                -0.5767974306749092,
                0.11211440973231221,
                -0.18639090552478188
              ],
              "variance": 0.6652073469738546,
              "mean_reward": -0.09138112645940423,
              "min_reward": -0.5767974306749092,
              "max_reward": 0.197302433008474,
              "num_responses": 7,
              "rvariance": 0.08006513577187288
            },
            {
              "id": "chat_sample_149",
              "rewards": [
                0.13063354522713,
                -0.6675411945995163,
                -0.6897641571932976,
                -0.257805321776673,
                -0.30641805245056963,
                -0.8749555121414755,
                -0.578649344224391
              ],
              "variance": 0.6614109241974171,
              "mean_reward": -0.46350000530839897,
              "min_reward": -0.8749555121414755,
              "max_reward": 0.13063354522713,
              "num_responses": 7,
              "rvariance": 0.09933757090434002
            },
            {
              "id": "chat_sample_309",
              "rewards": [
                -0.0027042303355580277,
                -1.0490353857927626,
                -0.8934746476362933,
                -0.6823565029953705,
                -0.8860669934383661,
                -0.9860703251103822,
                -0.9231052644280018
              ],
              "variance": 0.6007607554518891,
              "mean_reward": -0.774687621390962,
              "min_reward": -1.0490353857927626,
              "max_reward": -0.0027042303355580277,
              "num_responses": 7,
              "rvariance": 0.11042517909144753
            },
            {
              "id": "chat_sample_243",
              "rewards": [
                -0.29623252792841986,
                -0.5304995919378648,
                -0.43975582801325763,
                -0.43790391446377586,
                -0.6064280474666177,
                -0.8305095869539129,
                -0.42308860606792165
              ],
              "variance": 0.3237144884494148,
              "mean_reward": -0.5092025861188244,
              "min_reward": -0.8305095869539129,
              "max_reward": -0.29623252792841986,
              "num_responses": 7,
              "rvariance": 0.02511753680196659
            },
            {
              "id": "chat_sample_281",
              "rewards": [
                -1.4268257498870454,
                -1.7157242636062027,
                -1.737947226199984,
                -1.478679329272535,
                -1.7009089552103485,
                -1.6860936468144943,
                -1.7305395720020569
              ],
              "variance": 0.27556473616288857,
              "mean_reward": -1.6395312489989526,
              "min_reward": -1.737947226199984,
              "max_reward": -1.4268257498870454,
              "num_responses": 7,
              "rvariance": 0.014403692005919502
            },
            {
              "id": "chat_sample_99",
              "rewards": [
                2.032548760544916,
                -0.3916060757267314,
                -0.17568814733549168,
                0.2047100872064011,
                0.5028681686729674,
                0.16952372976624733,
                0.07322422519319487
              ],
              "variance": 1.376795724113735,
              "mean_reward": 0.3450829640459291,
              "min_reward": -0.3916060757267314,
              "max_reward": 2.032548760544916,
              "num_responses": 7,
              "rvariance": 0.5443975771582049
            },
            {
              "id": "chat_sample_43",
              "rewards": [
                0.8917700140641408,
                -0.1439126384835436,
                0.2936019375815265,
                0.7139863133138901,
                0.32508446792271667,
                0.2843423698341176,
                -0.4842017532008203
              ],
              "variance": 1.0651280779844448,
              "mean_reward": 0.26866724443314677,
              "min_reward": -0.4842017532008203,
              "max_reward": 0.8917700140641408,
              "num_responses": 7,
              "rvariance": 0.18966433908593774
            },
            {
              "id": "chat_sample_148",
              "rewards": [
                0.7028748320169994,
                0.0880395335890491,
                -0.03140889035252559,
                -0.23187853208392806
              ],
              "variance": 0.6901618820531217,
              "mean_reward": 0.13190673579239873,
              "min_reward": -0.23187853208392806,
              "max_reward": 0.7028748320169994,
              "num_responses": 4,
              "rvariance": 0.12173515330061349
            },
            {
              "id": "chat_sample_249",
              "rewards": [
                0.7325054488087078,
                -0.2133593965891103,
                -0.361975458935023,
                0.16581990266728378,
                -0.3166035769727194,
                -0.5212400241904559,
                -0.5842050848728363
              ],
              "variance": 0.9389201695872617,
              "mean_reward": -0.15700831286916475,
              "min_reward": -0.5842050848728363,
              "max_reward": 0.7325054488087078,
              "num_responses": 7,
              "rvariance": 0.18303889063289122
            },
            {
              "id": "chat_sample_100",
              "rewards": [
                -0.04252037164941626,
                0.5510179209594936,
                0.3917533557040607,
                -0.5434629867842372,
                0.48805286027711314,
                0.5806485377512021
              ],
              "variance": 0.8588249085721746,
              "mean_reward": 0.2375815527097027,
              "min_reward": -0.5434629867842372,
              "max_reward": 0.5806485377512021,
              "num_responses": 6,
              "rvariance": 0.16515496577052077
            },
            {
              "id": "chat_sample_141",
              "rewards": [
                -1.078666002584471,
                -1.0157009419020906,
                -1.1527425445637423,
                -1.0823698296834345,
                -1.0934813109803254,
                -1.1749655071575236,
                -1.4120104414911911
              ],
              "variance": 0.21630350257947173,
              "mean_reward": -1.1442766540518257,
              "min_reward": -1.4120104414911911,
              "max_reward": -1.0157009419020906,
              "num_responses": 7,
              "rvariance": 0.01427770729509181
            },
            {
              "id": "chat_sample_97",
              "rewards": [
                2.417746778837126,
                1.106591985804027,
                2.1955171528993125,
                1.8843956765863739,
                1.699204321638196,
                2.0621793773366246,
                2.1214406109200414
              ],
              "variance": 0.8222496159699098,
              "mean_reward": 1.9267251291459573,
              "min_reward": 1.106591985804027,
              "max_reward": 2.417746778837126,
              "num_responses": 7,
              "rvariance": 0.15654132255788095
            },
            {
              "id": "chat_sample_137",
              "rewards": [
                -0.28975083050523365,
                -0.45086730931014835,
                -0.32123336084642384,
                0.247304098844482,
                -0.2804912627578247,
                -0.07909566425168138,
                -0.37864268088035896
              ],
              "variance": 0.4589967732390588,
              "mean_reward": -0.22182528710102695,
              "min_reward": -0.45086730931014835,
              "max_reward": 0.247304098844482,
              "num_responses": 7,
              "rvariance": 0.047920515742571924
            },
            {
              "id": "chat_sample_207",
              "rewards": [
                0.573240883553275,
                0.40656866409991493,
                0.27878662918567226,
                0.747320757204562,
                0.12322589102920288,
                0.3213806408237531,
                0.6028715003449834
              ],
              "variance": 0.4440888691657303,
              "mean_reward": 0.43619928089162335,
              "min_reward": 0.12322589102920288,
              "max_reward": 0.747320757204562,
              "num_responses": 7,
              "rvariance": 0.040021283122613056
            },
            {
              "id": "chat_sample_190",
              "rewards": [
                -0.8305095869539129,
                -0.34808610731390965,
                -0.3767907673308772,
                -0.02955697680304381,
                -0.004556143885039806,
                0.07877996584164021,
                0.015814905159259752
              ],
              "variance": 0.5992792246123034,
              "mean_reward": -0.21355781589798334,
              "min_reward": -0.8305095869539129,
              "max_reward": 0.07877996584164021,
              "num_responses": 7,
              "rvariance": 0.09156908241761794
            },
            {
              "id": "chat_sample_254",
              "rewards": [
                -0.08187353457590404,
                -0.1624317739783614,
                -0.2707687166230454,
                -0.0471501555231207,
                -0.34901206408865054,
                -0.47309027190392966,
                -0.09020714554857204
              ],
              "variance": 0.3306591642599715,
              "mean_reward": -0.21064766603451196,
              "min_reward": -0.47309027190392966,
              "max_reward": -0.0471501555231207,
              "num_responses": 7,
              "rvariance": 0.021682896120902777
            },
            {
              "id": "chat_sample_171",
              "rewards": [
                0.09359527423749443,
                -0.3823465079793225,
                -0.6823565029953705,
                -0.44531156866170296,
                -0.3073440092253105,
                -0.23303597805235418,
                -0.34160440989072344
              ],
              "variance": 0.43774606525875537,
              "mean_reward": -0.32834338608104136,
              "min_reward": -0.6823565029953705,
              "max_reward": 0.09359527423749443,
              "num_responses": 7,
              "rvariance": 0.04709367764796278
            },
            {
              "id": "chat_sample_131",
              "rewards": [
                1.158445565189517,
                1.7140196300340502,
                1.8695803681905196,
                2.1807018445034583,
                1.9140262933780823,
                1.5880895086692894,
                2.239963078086875
              ],
              "variance": 0.7881744066594443,
              "mean_reward": 1.809260898293113,
              "min_reward": 1.158445565189517,
              "max_reward": 2.239963078086875,
              "num_responses": 7,
              "rvariance": 0.11709075017531734
            },
            {
              "id": "chat_sample_272",
              "rewards": [
                -0.23465640240815072,
                -0.5693897764769821,
                -1.0305162502979448,
                -0.4990170615966745,
                -0.7601368720736053,
                -0.6138357016645448,
                -0.9490320541207466
              ],
              "variance": 0.588352934670361,
              "mean_reward": -0.6652263026626642,
              "min_reward": -1.0305162502979448,
              "max_reward": -0.23465640240815072,
              "num_responses": 7,
              "rvariance": 0.06397600729045469
            },
            {
              "id": "chat_sample_317",
              "rewards": [
                -0.30456613890108786,
                -0.28465806824415874,
                -0.23002661853444628,
                -0.34901206408865054,
                -0.5008689751461564,
                -0.2073406775532945,
                -0.44716348221118474
              ],
              "variance": 0.24769343724318782,
              "mean_reward": -0.3319480035255684,
              "min_reward": -0.5008689751461564,
              "max_reward": -0.2073406775532945,
              "num_responses": 7,
              "rvariance": 0.010143020319800298
            },
            {
              "id": "chat_sample_221",
              "rewards": [
                -0.778656007568423,
                -0.7601368720736053,
                -0.8342134140528764,
                -1.271265011730576,
                -0.6101318745655813,
                -0.9416243999228195,
                -0.83791724115184
              ],
              "variance": 0.3733457715755264,
              "mean_reward": -0.861992117295103,
              "min_reward": -1.271265011730576,
              "max_reward": -0.6101318745655813,
              "num_responses": 7,
              "rvariance": 0.03656426265750081
            },
            {
              "id": "chat_sample_263",
              "rewards": [
                -0.7934713159642772,
                -0.6564297133026257,
                -0.6934679842922612,
                -0.6064280474666177,
                -0.39993968669939944,
                -0.5156842835420106,
                -0.578649344224391
              ],
              "variance": 0.2640828721561015,
              "mean_reward": -0.606295767927369,
              "min_reward": -0.7934713159642772,
              "max_reward": -0.39993968669939944,
              "num_responses": 7,
              "rvariance": 0.013814958453071036
            },
            {
              "id": "chat_sample_112",
              "rewards": [
                1.1510379109915898,
                0.5806485377512021,
                0.7547284114024893,
                0.773247546897307,
                0.7954705094910883,
                1.0621460606164643,
                0.4250877995947327
              ],
              "variance": 0.5792785582779003,
              "mean_reward": 0.7917666823921248,
              "min_reward": 0.4250877995947327,
              "max_reward": 1.1510379109915898,
              "num_responses": 7,
              "rvariance": 0.05470480116958211
            },
            {
              "id": "chat_sample_138",
              "rewards": [
                -0.9564397083186738,
                -1.2490420491367946,
                -0.9416243999228195,
                -0.9601435354176373,
                -0.9897741522093457,
                -0.9823664980114186,
                -0.9860703251103822
              ],
              "variance": 0.14296772601999308,
              "mean_reward": -1.0093515240181532,
              "min_reward": -1.2490420491367946,
              "max_reward": -0.9416243999228195,
              "num_responses": 7,
              "rvariance": 0.009844725270100942
            },
            {
              "id": "chat_sample_1",
              "rewards": [
                -0.07955864263905182,
                -0.7934713159642772,
                -0.9342167457248924,
                -0.41568095186999454,
                -0.8490287224487306,
                -0.9453282270217831
              ],
              "variance": 0.6921526891188146,
              "mean_reward": -0.6695474342781216,
              "min_reward": -0.9453282270217831,
              "max_reward": -0.07955864263905182,
              "num_responses": 6,
              "rvariance": 0.1010350860789302
            },
            {
              "id": "chat_sample_42",
              "rewards": [
                -0.9823664980114186,
                -1.3749721705015556,
                -1.404602787293264,
                -1.5231252544600977,
                -1.5897941422414419,
                -1.5823864880435148,
                -1.3008956285222844
              ],
              "variance": 0.41186557340474783,
              "mean_reward": -1.394020424153368,
              "min_reward": -1.5897941422414419,
              "max_reward": -0.9823664980114186,
              "num_responses": 7,
              "rvariance": 0.03844045496774943
            },
            {
              "id": "chat_sample_101",
              "rewards": [
                -0.7564330449746417,
                -0.7008756384901884,
                -0.745321563677751,
                -0.7527292178756781,
                -0.8860669934383661,
                -0.7379139094798239,
                -0.7860636617663501
              ],
              "variance": 0.10296639335118685,
              "mean_reward": -0.7664862899575429,
              "min_reward": -0.8860669934383661,
              "max_reward": -0.7008756384901884,
              "num_responses": 7,
              "rvariance": 0.002934603864213345
            },
            {
              "id": "chat_sample_21",
              "rewards": [
                -0.495313234497711,
                -0.7564330449746417,
                -0.7638406991725688,
                -0.8416210682508035,
                -0.9675511896155644,
                -0.8119904514590951,
                -0.8860669934383661
              ],
              "variance": 0.2666755511253762,
              "mean_reward": -0.7889738116298215,
              "min_reward": -0.9675511896155644,
              "max_reward": -0.495313234497711,
              "num_responses": 7,
              "rvariance": 0.018935082088368006
            },
            {
              "id": "chat_sample_66",
              "rewards": [
                1.0028848270330475,
                1.0991843316060999,
                1.232522107168788,
                1.5510512376796537,
                1.299190994950132,
                1.2769680323563506,
                1.3880828453252574
              ],
              "variance": 0.392605672490137,
              "mean_reward": 1.2642691965884756,
              "min_reward": 1.0028848270330475,
              "max_reward": 1.5510512376796537,
              "num_responses": 7,
              "rvariance": 0.02793389001676692
            },
            {
              "id": "chat_sample_151",
              "rewards": [
                -0.13858838702878348,
                -0.971255016714528,
                -0.8934746476362933,
                -0.3323448421433145,
                -0.8823631663394026,
                -0.9453282270217831,
                -0.9156976102300746
              ],
              "variance": 0.700856682801379,
              "mean_reward": -0.7255788424448827,
              "min_reward": -0.971255016714528,
              "max_reward": -0.13858838702878348,
              "num_responses": 7,
              "rvariance": 0.09953611712179464
            },
            {
              "id": "chat_sample_33",
              "rewards": [
                0.056557003247858874,
                -0.07909566425168138,
                0.11581823683127578,
                -0.4416077415627394,
                -0.20340536126064573,
                -0.17251602197827387,
                -0.43790391446377586
              ],
              "variance": 0.5196469419845869,
              "mean_reward": -0.16602192334828308,
              "min_reward": -0.4416077415627394,
              "max_reward": 0.11581823683127578,
              "num_responses": 7,
              "rvariance": 0.04111978343089707
            },
            {
              "id": "chat_sample_219",
              "rewards": [
                0.029704256780373087,
                -0.43790391446377586,
                -0.5064247157946017,
                -0.6471701455552168
              ],
              "variance": 0.4943683220341607,
              "mean_reward": -0.3904486297583053,
              "min_reward": -0.6471701455552168,
              "max_reward": 0.029704256780373087,
              "num_responses": 4,
              "rvariance": 0.06453421032965578
            },
            {
              "id": "chat_sample_5",
              "rewards": [
                1.3584522285335487,
                1.0769613690123185,
                1.6177201254609979,
                1.43252877051282,
                1.3436369201376945,
                1.4473440789086742,
                1.5140129666900182
              ],
              "variance": 0.31852913051086595,
              "mean_reward": 1.3986652084651534,
              "min_reward": 1.0769613690123185,
              "max_reward": 1.6177201254609979,
              "num_responses": 7,
              "rvariance": 0.024706441691385195
            },
            {
              "id": "chat_sample_86",
              "rewards": [
                0.8695470514703595,
                -0.3832724647540634,
                0.21211774140432824,
                0.38434570150613356,
                0.5028681686729674,
                0.38064187440717,
                0.5547217480584572
              ],
              "variance": 0.7066902104822466,
              "mean_reward": 0.3601385458236218,
              "min_reward": -0.3832724647540634,
              "max_reward": 0.8695470514703595,
              "num_responses": 7,
              "rvariance": 0.12761540793060486
            },
            {
              "id": "chat_sample_108",
              "rewards": [
                0.9139929766579221,
                1.43252877051282,
                1.6103124712630708,
                1.4621593873045284,
                1.032515443824756,
                1.8843956765863739,
                1.5584588918775808
              ],
              "variance": 0.7348392964343697,
              "mean_reward": 1.4134805168610074,
              "min_reward": 0.9139929766579221,
              "max_reward": 1.8843956765863739,
              "num_responses": 7,
              "rvariance": 0.09698247046311938
            },
            {
              "id": "chat_sample_28",
              "rewards": [
                -1.2416343949388675,
                -1.0564430399906897,
                -1.1675578529595965,
                -1.1231119277720338,
                -1.3897874788974098,
                -1.0638506941886168,
                -1.0008856335062364
              ],
              "variance": 0.266675551125376,
              "mean_reward": -1.1490387174647787,
              "min_reward": -1.3897874788974098,
              "max_reward": -1.0008856335062364,
              "num_responses": 7,
              "rvariance": 0.015047053929212998
            },
            {
              "id": "chat_sample_255",
              "rewards": [
                0.30286150532893535,
                0.12507780457868467,
                0.3213806408237531,
                0.1898947788105469,
                0.8102858178869425,
                0.3361959492196074,
                0.3287882950216802
              ],
              "variance": 0.36186390756873965,
              "mean_reward": 0.34492639881002146,
              "min_reward": 0.12507780457868467,
              "max_reward": 0.8102858178869425,
              "num_responses": 7,
              "rvariance": 0.04165544480506043
            },
            {
              "id": "chat_sample_29",
              "rewards": [
                2.091809994128333,
                0.043593608401486426,
                1.6547583964506334,
                2.684422329962502,
                2.017733452149062,
                2.1955171528993125,
                2.2547783864827293
              ],
              "variance": 1.4163434826436636,
              "mean_reward": 1.8489447600677227,
              "min_reward": 0.043593608401486426,
              "max_reward": 2.684422329962502,
              "num_responses": 7,
              "rvariance": 0.6239014849609618
            },
            {
              "id": "chat_sample_60",
              "rewards": [
                2.6547917131707934,
                2.5362692460039598,
                2.0473640689407704,
                2.551084554399814,
                2.477008012420543,
                1.8399497513988112,
                2.314039620066146
              ],
              "variance": 0.6281690759842189,
              "mean_reward": 2.3457867094858336,
              "min_reward": 1.8399497513988112,
              "max_reward": 2.6547917131707934,
              "num_responses": 7,
              "rvariance": 0.07672412896202434
            },
            {
              "id": "chat_sample_125",
              "rewards": [
                -0.5230919377399377,
                -0.6638373675005528,
                -0.745321563677751,
                -0.6212433558624719,
                -0.6934679842922612,
                -1.0342200773969084,
                -0.678652675896407
              ],
              "variance": 0.2788981805519557,
              "mean_reward": -0.7085478517666128,
              "min_reward": -1.0342200773969084,
              "max_reward": -0.5230919377399377,
              "num_responses": 7,
              "rvariance": 0.021792975261988475
            },
            {
              "id": "chat_sample_314",
              "rewards": [
                0.056557003247858874,
                0.4843490331781496,
                0.1213739774797211,
                0.539906439662603,
                0.5028681686729674,
                0.163967989117802,
                0.14730076717246599
              ],
              "variance": 0.4222362892818454,
              "mean_reward": 0.2880461969330811,
              "min_reward": 0.056557003247858874,
              "max_reward": 0.539906439662603,
              "num_responses": 7,
              "rvariance": 0.037812631158791354
            },
            {
              "id": "chat_sample_310",
              "rewards": [
                0.8251011262827967,
                0.839916434678651,
                1.6769813590444147,
                1.9140262933780823,
                1.1214072941998812,
                1.7955038262112484,
                1.6473507422527063
              ],
              "variance": 1.0089225017576726,
              "mean_reward": 1.4028981537211114,
              "min_reward": 0.8251011262827967,
              "max_reward": 1.9140262933780823,
              "num_responses": 7,
              "rvariance": 0.1829006836553256
            },
            {
              "id": "chat_sample_222",
              "rewards": [
                0.25100792594344556,
                -0.004556143885039806,
                0.2398964446465549,
                0.49916434157400386,
                0.015814905159259752,
                0.6028715003449834,
                0.22693304980018245
              ],
              "variance": 0.5329807195408558,
              "mean_reward": 0.2615902890833414,
              "min_reward": -0.004556143885039806,
              "max_reward": 0.6028715003449834,
              "num_responses": 7,
              "rvariance": 0.04370535603323922
            },
            {
              "id": "chat_sample_143",
              "rewards": [
                -0.5508706409821643,
                -0.495313234497711,
                -0.22724874821022362,
                -0.5027208886956381,
                -0.43975582801325763,
                -0.4193847789689581,
                -0.17700112510592506
              ],
              "variance": 0.31483109064174447,
              "mean_reward": -0.4017564634962683,
              "min_reward": -0.5508706409821643,
              "max_reward": -0.17700112510592506,
              "num_responses": 7,
              "rvariance": 0.017700619503251924
            },
            {
              "id": "chat_sample_12",
              "rewards": [
                1.0917766774081727,
                0.4843490331781496,
                0.9362159392517034,
                1.2695603781584235,
                1.3362292659397674,
                0.9954771728351204,
                1.165853219387444
              ],
              "variance": 0.5407587564486791,
              "mean_reward": 1.039923098022683,
              "min_reward": 0.4843490331781496,
              "max_reward": 1.3362292659397674,
              "num_responses": 7,
              "rvariance": 0.06863871018712629
            },
            {
              "id": "chat_sample_248",
              "rewards": [
                -0.6101318745655813,
                -0.9194014373290381,
                -0.9156976102300746,
                -1.0157009419020906,
                -0.9675511896155644
              ],
              "variance": 0.2640828721561016,
              "mean_reward": -0.8856966107284698,
              "min_reward": -1.0157009419020906,
              "max_reward": -0.6101318745655813,
              "num_responses": 5,
              "rvariance": 0.020314659466495216
            },
            {
              "id": "chat_sample_64",
              "rewards": [
                0.35471508471442514,
                -0.4545711364091119,
                -0.45827496350807545,
                -0.3443822802149461,
                -0.4990170615966745,
                -0.44716348221118474,
                -1.0082932877041635
              ],
              "variance": 0.6379842177964727,
              "mean_reward": -0.4081410181328187,
              "min_reward": -1.0082932877041635,
              "max_reward": 0.35471508471442514,
              "num_responses": 7,
              "rvariance": 0.13723539047489036
            },
            {
              "id": "chat_sample_4",
              "rewards": [
                1.3140063033459861,
                1.3954904995231845,
                1.7806885178153942,
                2.2844090032744377,
                1.425121116314893,
                1.4028981537211116,
                1.8843956765863739
              ],
              "variance": 0.6815041862092943,
              "mean_reward": 1.6410013243687689,
              "min_reward": 1.3140063033459861,
              "max_reward": 2.2844090032744377,
              "num_responses": 7,
              "rvariance": 0.10903220813872917
            },
            {
              "id": "chat_sample_311",
              "rewards": [
                -0.07724375070219959,
                -0.43049626026584875,
                0.12878163167764822,
                -0.013815711632448695,
                -0.20386833964801618,
                -0.3175295337474603,
                -0.09020714554857204
              ],
              "variance": 0.40593945004640575,
              "mean_reward": -0.14348272998098532,
              "min_reward": -0.43049626026584875,
              "max_reward": 0.12878163167764822,
              "num_responses": 7,
              "rvariance": 0.0306403981245798
            },
            {
              "id": "chat_sample_117",
              "rewards": [
                -0.0017782735608171387,
                -0.20236365988906221,
                0.12878163167764822,
                0.006555337411850862,
                0.3436036034175345,
                -0.03326080390200736,
                -0.11844882717816915
              ],
              "variance": 0.36672518063612913,
              "mean_reward": 0.017584143996711103,
              "min_reward": -0.20236365988906221,
              "max_reward": 0.3436036034175345,
              "num_responses": 7,
              "rvariance": 0.026945331626231455
            },
            {
              "id": "chat_sample_39",
              "rewards": [
                0.4250877995947327,
                0.3361959492196074,
                0.48064520607918604,
                0.6806518694232181,
                0.7954705094910883,
                0.8991776682620679,
                0.11026249618283043
              ],
              "variance": 0.5911308049945836,
              "mean_reward": 0.5324987854646758,
              "min_reward": 0.11026249618283043,
              "max_reward": 0.8991776682620679,
              "num_responses": 7,
              "rvariance": 0.06522872401405642
            },
            {
              "id": "chat_sample_287",
              "rewards": [
                0.7325054488087078,
                1.1510379109915898,
                1.4621593873045284,
                1.0177001354289017,
                1.5510512376796537,
                1.565866546075508
              ],
              "variance": 0.683356099758776,
              "mean_reward": 1.2467201110481483,
              "min_reward": 0.7325054488087078,
              "max_reward": 1.565866546075508,
              "num_responses": 6,
              "rvariance": 0.09448465248061207
            },
            {
              "id": "chat_sample_313",
              "rewards": [
                -0.1697815558778672,
                -0.778656007568423,
                -0.9527358812197102,
                -0.8934746476362933,
                -0.9897741522093457,
                -0.9416243999228195,
                -0.9416243999228195
              ],
              "variance": 0.43244496272336397,
              "mean_reward": -0.8096672920510397,
              "min_reward": -0.9897741522093457,
              "max_reward": -0.1697815558778672,
              "num_responses": 7,
              "rvariance": 0.07216736955598632
            },
            {
              "id": "chat_sample_3",
              "rewards": [
                1.0251077896268288,
                0.4769413789802225,
                0.639909771334619,
                1.0991843316060999,
                0.8325087804807239,
                0.8251011262827967,
                0.16952372976624733
              ],
              "variance": 0.7007640871239048,
              "mean_reward": 0.7240395582967912,
              "min_reward": 0.16952372976624733,
              "max_reward": 1.0991843316060999,
              "num_responses": 7,
              "rvariance": 0.08985397555846375
            },
            {
              "id": "chat_sample_170",
              "rewards": [
                -0.7342100823808604,
                -1.1971884697513049,
                -0.7897674888653137,
                -0.8934746476362933,
                -0.9823664980114186,
                -0.9749588438134915
              ],
              "variance": 0.32778869825827484,
              "mean_reward": -0.9286610050764471,
              "min_reward": -1.1971884697513049,
              "max_reward": -0.7342100823808604,
              "num_responses": 6,
              "rvariance": 0.022579236510063386
            },
            {
              "id": "chat_sample_83",
              "rewards": [
                -0.2999363550273834,
                -0.6638373675005528,
                -0.5879089119718,
                -0.4416077415627394,
                -0.6138357016645448,
                -0.5564263816306096,
                -0.4693864448049661
              ],
              "variance": 0.24889718105035108,
              "mean_reward": -0.518991272023228,
              "min_reward": -0.6638373675005528,
              "max_reward": -0.2999363550273834,
              "num_responses": 7,
              "rvariance": 0.013222970295192859
            },
            {
              "id": "chat_sample_279",
              "rewards": [
                0.30286150532893535,
                -1.2860803201264301,
                -0.7527292178756781,
                -0.6601335404015892,
                -1.404602787293264,
                -1.1749655071575236,
                -1.0823698296834345
              ],
              "variance": 1.0585537848837847,
              "mean_reward": -0.8654313853155692,
              "min_reward": -1.404602787293264,
              "max_reward": 0.30286150532893535,
              "num_responses": 7,
              "rvariance": 0.2900403214713986
            },
            {
              "id": "chat_sample_55",
              "rewards": [
                -0.29113976566734495,
                -0.4601268770575572,
                -0.37864268088035896,
                -0.5916127390707635,
                -0.49716514804719275,
                -0.37956863765509985
              ],
              "variance": 0.2094977202851262,
              "mean_reward": -0.43304264139638615,
              "min_reward": -0.5916127390707635,
              "max_reward": -0.29113976566734495,
              "num_responses": 6,
              "rvariance": 0.009324163079572382
            },
            {
              "id": "chat_sample_103",
              "rewards": [
                -0.5582782951800914,
                -1.0045894606052,
                -0.4712383583544479,
                -0.7119871197870791,
                -0.6267990965109173,
                -0.5323515054873466,
                -0.5471668138832008
              ],
              "variance": 0.32112180948014035,
              "mean_reward": -0.6360586642583261,
              "min_reward": -1.0045894606052,
              "max_reward": -0.4712383583544479,
              "num_responses": 7,
              "rvariance": 0.02764832467222413
            },
            {
              "id": "chat_sample_113",
              "rewards": [
                0.16581990266728378,
                0.5287949583657123,
                0.45471841638644117,
                0.8325087804807239,
                0.4510145892874776,
                0.7880628552931612,
                0.5843523648501656
              ],
              "variance": 0.46890451072878614,
              "mean_reward": 0.5436102667615665,
              "min_reward": 0.16581990266728378,
              "max_reward": 0.8325087804807239,
              "num_responses": 7,
              "rvariance": 0.043471444420135785
            },
            {
              "id": "chat_sample_104",
              "rewards": [
                0.247304098844482,
                0.7102824862149265,
                0.906585322459995,
                0.8769547056682866,
                0.513979649969858,
                0.773247546897307,
                0.9658465560434119
              ],
              "variance": 0.5229803863736542,
              "mean_reward": 0.7134571951568952,
              "min_reward": 0.247304098844482,
              "max_reward": 0.9658465560434119,
              "num_responses": 7,
              "rvariance": 0.05548646630876201
            },
            {
              "id": "chat_sample_282",
              "rewards": [
                1.113999640001954,
                0.4028648370009514,
                0.4436069350895505,
                2.3436702368578546,
                1.2843756865542777,
                1.4843823498983097,
                1.4177134621169658
              ],
              "variance": 1.400787408828017,
              "mean_reward": 1.2129447353599805,
              "min_reward": 0.4028648370009514,
              "max_reward": 2.3436702368578546,
              "num_responses": 7,
              "rvariance": 0.3795930535879721
            },
            {
              "id": "chat_sample_62",
              "rewards": [
                1.3436369201376945,
                0.7139863133138901,
                0.7584322385014528,
                1.106591985804027,
                1.0251077896268288,
                0.4250877995947327,
                0.9584389018454847
              ],
              "variance": 0.602983051711267,
              "mean_reward": 0.9044688498320159,
              "min_reward": 0.4250877995947327,
              "max_reward": 1.3436369201376945,
              "num_responses": 7,
              "rvariance": 0.07694362232488862
            },
            {
              "id": "chat_sample_91",
              "rewards": [
                0.05007530582467265,
                -0.8268057598549493,
                -1.0564430399906897,
                -0.6638373675005528,
                -0.8712516850425119,
                -0.5434629867842372,
                -0.7823598346673866
              ],
              "variance": 0.63928055728111,
              "mean_reward": -0.6705836240022364,
              "min_reward": -1.0564430399906897,
              "max_reward": 0.05007530582467265,
              "num_responses": 7,
              "rvariance": 0.10880127116463144
            },
            {
              "id": "chat_sample_284",
              "rewards": [
                -0.7897674888653137,
                -0.5767974306749092,
                -0.5193881106409741,
                -0.5934646526202453,
                -0.8453248953497671,
                -0.611983788115063,
                -0.4934613209482292
              ],
              "variance": 0.3029730566952188,
              "mean_reward": -0.6328839553163573,
              "min_reward": -0.8453248953497671,
              "max_reward": -0.4934613209482292,
              "num_responses": 7,
              "rvariance": 0.015314281499179756
            },
            {
              "id": "chat_sample_84",
              "rewards": [
                0.38804952860509717,
                -0.2721576517851567,
                0.04729743550044998,
                0.6880595236211452,
                0.036185954203559315,
                0.04729743550044998,
                -0.37030906990769097
              ],
              "variance": 0.8194717456456869,
              "mean_reward": 0.080631879391122,
              "min_reward": -0.37030906990769097,
              "max_reward": 0.6880595236211452,
              "num_responses": 7,
              "rvariance": 0.11363999394999351
            },
            {
              "id": "chat_sample_175",
              "rewards": [
                1.3510445743356216,
                0.8028781636890154,
                1.2102991445750066,
                1.43252877051282,
                1.1732608735853711,
                1.299190994950132,
                1.4843823498983097
              ],
              "variance": 0.42816241264018706,
              "mean_reward": 1.250512124506611,
              "min_reward": 0.8028781636890154,
              "max_reward": 1.4843823498983097,
              "num_responses": 7,
              "rvariance": 0.04403753572078827
            },
            {
              "id": "chat_sample_185",
              "rewards": [
                0.47323755188125893,
                0.05100126259941354,
                -0.2582683001640434,
                -0.17270410694814312,
                0.4843490331781496,
                0.3065653324278989,
                0.47323755188125893
              ],
              "variance": 0.6846119286345185,
              "mean_reward": 0.19391690355082764,
              "min_reward": -0.2582683001640434,
              "max_reward": 0.4843490331781496,
              "num_responses": 7,
              "rvariance": 0.0874839776917569
            },
            {
              "id": "chat_sample_154",
              "rewards": [
                -1.1749655071575236,
                -1.0416277315948355,
                -0.9564397083186738,
                -1.0194047690010541,
                -1.1527425445637423,
                -1.0416277315948355,
                -1.1453348903658152
              ],
              "variance": 0.16741298487315281,
              "mean_reward": -1.0760204117994971,
              "min_reward": -1.1749655071575236,
              "max_reward": -0.9564397083186738,
              "num_responses": 7,
              "rvariance": 0.005764500435427672
            },
            {
              "id": "chat_sample_189",
              "rewards": [
                -1.011997114803127,
                -0.7823598346673866,
                -0.7490253907767146,
                -0.6601335404015892,
                -0.8453248953497671,
                -0.7082832926881155,
                -0.778656007568423
              ],
              "variance": 0.222970391357606,
              "mean_reward": -0.7908257251793033,
              "min_reward": -1.011997114803127,
              "max_reward": -0.6601335404015892,
              "num_responses": 7,
              "rvariance": 0.011106812106570491
            },
            {
              "id": "chat_sample_218",
              "rewards": [
                0.7954705094910883,
                0.4917566873760767,
                0.07692805229215843,
                -0.005482100659780695,
                0.32508446792271667,
                0.14730076717246599
              ],
              "variance": 0.6078906226173936,
              "mean_reward": 0.30517639726578755,
              "min_reward": -0.005482100659780695,
              "max_reward": 0.7954705094910883,
              "num_responses": 6,
              "rvariance": 0.07485459605194188
            },
            {
              "id": "chat_sample_257",
              "rewards": [
                -0.0027042303355580277,
                -0.478646012552375,
                -0.3601235453855412,
                -0.26937978146093405,
                -0.5897608255212817,
                -0.3517899344128732,
                -0.6564297133026257
              ],
              "variance": 0.4537188196230358,
              "mean_reward": -0.3869762918530269,
              "min_reward": -0.6564297133026257,
              "max_reward": -0.0027042303355580277,
              "num_responses": 7,
              "rvariance": 0.040797593911582775
            },
            {
              "id": "chat_sample_13",
              "rewards": [
                1.7362425926278315,
                0.4695337247822954,
                -0.5138323699925288,
                -0.2135908857827955,
                -0.6712450216984799
              ],
              "variance": 1.8378390065057166,
              "mean_reward": 0.16142160798726451,
              "min_reward": -0.6712450216984799,
              "max_reward": 1.7362425926278315,
              "num_responses": 5,
              "rvariance": 0.7729860463267182
            },
            {
              "id": "chat_sample_237",
              "rewards": [
                -0.8934746476362933,
                -0.9231052644280018,
                -0.9897741522093457,
                -0.9786626709124551,
                -0.9156976102300746,
                -0.9786626709124551,
                -1.2860803201264301
              ],
              "variance": 0.2014881941836174,
              "mean_reward": -0.9950653337792936,
              "min_reward": -1.2860803201264301,
              "max_reward": -0.8934746476362933,
              "num_responses": 7,
              "rvariance": 0.015293424030387163
            },
            {
              "id": "chat_sample_89",
              "rewards": [
                0.513979649969858,
                -0.9082899560321475,
                -1.1971884697513049,
                -1.0268124231989813,
                -0.9490320541207466,
                -0.9453282270217831,
                -0.9082899560321475
              ],
              "variance": 0.7555807281885659,
              "mean_reward": -0.7744230623124648,
              "min_reward": -1.1971884697513049,
              "max_reward": 0.513979649969858,
              "num_responses": 7,
              "rvariance": 0.2854214420064309
            },
            {
              "id": "chat_sample_23",
              "rewards": [
                0.05007530582467265,
                -0.16312624155941705,
                0.049149349049931755,
                0.016740861934000643,
                0.18619095171158334,
                -0.10270756200757404,
                -0.2209985399807226
              ],
              "variance": 0.29079672510737625,
              "mean_reward": -0.026382267861075042,
              "min_reward": -0.2209985399807226,
              "max_reward": 0.18619095171158334,
              "num_responses": 7,
              "rvariance": 0.017285388853288907
            },
            {
              "id": "chat_sample_236",
              "rewards": [
                -0.20363685045433094,
                -0.23373044563340983,
                -0.4564230499585937,
                -0.38697629185302695,
                -0.43975582801325763,
                -0.48049792610185676,
                -0.2124334398143694
              ],
              "variance": 0.2571381963455449,
              "mean_reward": -0.34477911883269213,
              "min_reward": -0.48049792610185676,
              "max_reward": -0.20363685045433094,
              "num_responses": 7,
              "rvariance": 0.013064780742659819
            },
            {
              "id": "chat_sample_234",
              "rewards": [
                -1.0675545212875803,
                -1.2564497033347217,
                -1.204596123949232,
                -0.9453282270217831,
                -1.33793389951192,
                -1.1082966193761796,
                -1.323118591116066
              ],
              "variance": 0.3103807108931462,
              "mean_reward": -1.1776110979424976,
              "min_reward": -1.33793389951192,
              "max_reward": -0.9453282270217831,
              "num_responses": 7,
              "rvariance": 0.01781311824694128
            },
            {
              "id": "chat_sample_194",
              "rewards": [
                0.24360027174551846,
                0.20841391430536468,
                -0.2943806143789381,
                0.263971320789818,
                0.07692805229215843,
                0.08433570649008554,
                -0.11798584879079871
              ],
              "variance": 0.44029244638929277,
              "mean_reward": 0.06641182892188692,
              "min_reward": -0.2943806143789381,
              "max_reward": 0.263971320789818,
              "num_responses": 7,
              "rvariance": 0.036456519482928385
            },
            {
              "id": "chat_sample_70",
              "rewards": [
                -0.2219244967554635,
                -0.937920572823856,
                -0.5267957648389012,
                -0.07816970747694048,
                -0.7082832926881155,
                -0.878659339240439,
                -0.3675311995834683
              ],
              "variance": 0.7379412516297517,
              "mean_reward": -0.5313263390581692,
              "min_reward": -0.937920572823856,
              "max_reward": -0.07816970747694048,
              "num_responses": 7,
              "rvariance": 0.09217180770996578
            },
            {
              "id": "chat_sample_74",
              "rewards": [
                -0.055483766495788706,
                -0.39901372992465856,
                -0.22933215095339063,
                -0.2804912627578247,
                -0.4564230499585937,
                -0.528647678388383,
                -0.4990170615966745
              ],
              "variance": 0.3510765111430081,
              "mean_reward": -0.34977267143933055,
              "min_reward": -0.528647678388383,
              "max_reward": -0.055483766495788706,
              "num_responses": 7,
              "rvariance": 0.02485441904574367
            },
            {
              "id": "chat_sample_200",
              "rewards": [
                0.573240883553275,
                0.6621327339284003,
                0.6806518694232181,
                0.8028781636890154,
                0.5584255751574208,
                0.8251011262827967,
                0.9806618644392662
              ],
              "variance": 0.3200106613504512,
              "mean_reward": 0.7261560309247704,
              "min_reward": 0.5584255751574208,
              "max_reward": 0.9806618644392662,
              "num_responses": 7,
              "rvariance": 0.019733685172003627
            },
            {
              "id": "chat_sample_260",
              "rewards": [
                0.13433737232609355,
                -0.5971684797192088,
                0.16767181621676555,
                0.0454455219509682,
                -0.15595007655517518,
                0.1713756433157291,
                -0.06798418295479071
              ],
              "variance": 0.5015907848771396,
              "mean_reward": -0.04318176934565976,
              "min_reward": -0.5971684797192088,
              "max_reward": 0.1713756433157291,
              "num_responses": 7,
              "rvariance": 0.06429929805673977
            },
            {
              "id": "chat_sample_315",
              "rewards": [
                -0.08742927522434937,
                -0.3897541621772496,
                -0.37308694023191363,
                -0.28234317630730654,
                -0.3027142253516061,
                -0.30456613890108786,
                0.3065653324278989
              ],
              "variance": 0.44992239684659807,
              "mean_reward": -0.20476122653794487,
              "min_reward": -0.3897541621772496,
              "max_reward": 0.3065653324278989,
              "num_responses": 7,
              "rvariance": 0.0519074768954797
            },
            {
              "id": "chat_sample_240",
              "rewards": [
                -0.511980456443047,
                -0.09020714554857204,
                0.22693304980018245,
                0.17322755686521088,
                0.00840725096133264,
                -0.08928118877383115,
                -0.11659691362868738
              ],
              "variance": 0.46946008479363077,
              "mean_reward": -0.05707112096677309,
              "min_reward": -0.511980456443047,
              "max_reward": 0.22693304980018245,
              "num_responses": 7,
              "rvariance": 0.05008636790046522
            },
            {
              "id": "chat_sample_20",
              "rewards": [
                3.7066786092764437,
                2.773314180337627,
                2.1214406109200414,
                2.5066386292122513,
                1.9881028353573533,
                2.551084554399814,
                2.7881294887334813
              ],
              "variance": 1.0874436362557005,
              "mean_reward": 2.633626986891002,
              "min_reward": 1.9881028353573533,
              "max_reward": 3.7066786092764437,
              "num_responses": 7,
              "rvariance": 0.2709712756405172
            },
            {
              "id": "chat_sample_210",
              "rewards": [
                0.4028648370009514,
                0.8473240888765781,
                0.5658332293553479,
                0.839916434678651,
                0.9139929766579221,
                0.5028681686729674,
                0.9214006308558492
              ],
              "variance": 0.454089202332932,
              "mean_reward": 0.7134571951568953,
              "min_reward": 0.4028648370009514,
              "max_reward": 0.9214006308558492,
              "num_responses": 7,
              "rvariance": 0.03999650612948361
            },
            {
              "id": "chat_sample_93",
              "rewards": [
                -0.3101218795495332,
                -0.2809542411451952,
                -0.5712416900264639,
                -0.5360553325863101,
                -0.4545711364091119,
                -0.37216098345717274,
                -0.37864268088035896
              ],
              "variance": 0.25167505137457363,
              "mean_reward": -0.414821134864878,
              "min_reward": -0.5712416900264639,
              "max_reward": -0.2809542411451952,
              "num_responses": 7,
              "rvariance": 0.010393747392223932
            },
            {
              "id": "chat_sample_226",
              "rewards": [
                0.07692805229215843,
                0.14915268072194776,
                0.09915101488593976,
                0.3584189118133887,
                0.061186787121563314,
                0.06581657099526776,
                0.20100626010743755
              ],
              "variance": 0.20000666334403205,
              "mean_reward": 0.14452289684824332,
              "min_reward": 0.061186787121563314,
              "max_reward": 0.3584189118133887,
              "num_responses": 7,
              "rvariance": 0.009818653434110215
            },
            {
              "id": "chat_sample_30",
              "rewards": [
                1.8103191346071028,
                0.9288082850537763,
                0.6176868087408376,
                1.299190994950132,
                0.8991776682620679,
                1.1214072941998812,
                0.7658398926993799
              ],
              "variance": 0.7970635916969574,
              "mean_reward": 1.063204296930454,
              "min_reward": 0.6176868087408376,
              "max_reward": 1.8103191346071028,
              "num_responses": 7,
              "rvariance": 0.13559090504530574
            },
            {
              "id": "chat_sample_142",
              "rewards": [
                0.05563104647311798,
                -0.035112717451489146,
                -0.18523345955635578,
                0.06766848454474954,
                -0.3832724647540634,
                -0.32030740407168296,
                -0.2795653059830838
              ],
              "variance": 0.40593945004640575,
              "mean_reward": -0.15431311725697253,
              "min_reward": -0.3832724647540634,
              "max_reward": 0.06766848454474954,
              "num_responses": 7,
              "rvariance": 0.029168826163797547
            },
            {
              "id": "chat_sample_136",
              "rewards": [
                -0.3323448421433145,
                -0.025853149704080255,
                0.38804952860509717,
                0.38804952860509717,
                0.21952539560225534,
                0.05748296002259976,
                0.42138397249576914
              ],
              "variance": 0.5498331328411399,
              "mean_reward": 0.15947048478334627,
              "min_reward": -0.3323448421433145,
              "max_reward": 0.42138397249576914,
              "num_responses": 7,
              "rvariance": 0.06619009234493081
            },
            {
              "id": "chat_sample_16",
              "rewards": [
                3.158512198629837,
                2.7436835635459187,
                2.4473773956288345,
                2.3733008536495634,
                2.6696070215666476,
                2.417746778837126,
                2.8918366475044612
              ],
              "variance": 0.5985384591925107,
              "mean_reward": 2.671723494194627,
              "min_reward": 2.3733008536495634,
              "max_reward": 3.158512198629837,
              "num_responses": 7,
              "rvariance": 0.07064102719121458
            },
            {
              "id": "chat_sample_22",
              "rewards": [
                0.45471841638644117,
                -0.03326080390200736,
                0.04637147872570909,
                -0.021223365830375807,
                0.23434070399810958,
                -0.026779106478821143,
                0.18619095171158334
              ],
              "variance": 0.351863574401538,
              "mean_reward": 0.12005118208723412,
              "min_reward": -0.03326080390200736,
              "max_reward": 0.45471841638644117,
              "num_responses": 7,
              "rvariance": 0.02855565956045467
            },
            {
              "id": "chat_sample_217",
              "rewards": [
                -0.34160440989072344,
                -0.6416144049067715,
                -0.7082832926881155,
                -0.9156976102300746,
                -0.5527225545316461,
                -0.9786626709124551,
                -0.9675511896155644
              ],
              "variance": 0.5037204854590438,
              "mean_reward": -0.7294480189679072,
              "min_reward": -0.9786626709124551,
              "max_reward": -0.34160440989072344,
              "num_responses": 7,
              "rvariance": 0.04904388816305721
            }
          ]
        },
        "semantic_benchmark_chat_hard_filtered.json": {
          "file_name": "semantic_benchmark_chat_hard_filtered.json",
          "processed_samples": 200,
          "global_mean": -14.562488130712698,
          "global_std": 11.802315253833779,
          "mean_variance": 0.9566743461912043,
          "mean_rvariance": 0.2648538975981543,
          "sample_results": [
            {
              "id": "chat_hard_sample_121",
              "rewards": [
                1.9434736013564669,
                -0.4607156945346821,
                1.9434736013564669,
                -0.4607156945346821,
                1.9434736013564669,
                -0.4607156945346821
              ],
              "variance": 2.404189295891149,
              "mean_reward": 0.7413789534108924,
              "min_reward": -0.4607156945346821,
              "max_reward": 1.9434736013564669,
              "num_responses": 6,
              "rvariance": 1.4450315426193943
            },
            {
              "id": "chat_hard_sample_77",
              "rewards": [
                0.9373150854548847,
                0.04236356341610898,
                1.542334087779915,
                1.2274130917666402,
                0.052954705688757216,
                1.542334087779915,
                2.5630554243063886
              ],
              "variance": 1.9019043736108068,
              "mean_reward": 1.1296814351703728,
              "min_reward": 0.04236356341610898,
              "max_reward": 2.5630554243063886,
              "num_responses": 7,
              "rvariance": 0.6833260442233412
            },
            {
              "id": "chat_hard_sample_265",
              "rewards": [
                1.0736760422152307,
                1.0736760422152307,
                -0.3018485604449586,
                -0.5772182595338127,
                1.0736760422152307,
                -0.22771056453642097,
                0.24889083773274953
              ],
              "variance": 1.485672482295731,
              "mean_reward": 0.3375916542661785,
              "min_reward": -0.5772182595338127,
              "max_reward": 1.0736760422152307,
              "num_responses": 7,
              "rvariance": 0.456950868365772
            },
            {
              "id": "chat_hard_sample_334",
              "rewards": [
                2.9814055440759932,
                0.6566498152297066,
                1.676047258972099,
                -1.096184230893576,
                -0.7890411049867774,
                -0.06884343044669747
              ],
              "variance": 3.271339069464223,
              "mean_reward": 0.5600056419917913,
              "min_reward": -1.096184230893576,
              "max_reward": 2.9814055440759932,
              "num_responses": 6,
              "rvariance": 2.0127349415590836
            },
            {
              "id": "chat_hard_sample_61",
              "rewards": [
                2.536577568624768,
                1.243341176825115,
                0.9690885122728294,
                2.3671192922623963,
                -0.09002571499199394,
                -0.015887719083456302,
                0.3971668295498248
              ],
              "variance": 2.4804455202542166,
              "mean_reward": 1.0581971350656405,
              "min_reward": -0.09002571499199394,
              "max_reward": 2.536577568624768,
              "num_responses": 7,
              "rvariance": 0.9785913764147777
            },
            {
              "id": "chat_hard_sample_133",
              "rewards": [
                2.0546805952192733,
                -0.4924891213526268,
                0.3336199759139354,
                -0.41835112544408914,
                -0.5560359749885162,
                -0.9479082390765008
              ],
              "variance": 1.9461223925991127,
              "mean_reward": -0.004413981621420741,
              "min_reward": -0.9479082390765008,
              "max_reward": 2.0546805952192733,
              "num_responses": 6,
              "rvariance": 0.9930278285497462
            },
            {
              "id": "chat_hard_sample_62",
              "rewards": [
                1.9646558859017633,
                -0.21711942226377273,
                1.1001538978968513,
                1.362284669144895
              ],
              "variance": 1.6058819470902885,
              "mean_reward": 1.0524937576699342,
              "min_reward": -0.21711942226377273,
              "max_reward": 1.9646558859017633,
              "num_responses": 4,
              "rvariance": 0.6355498181601839
            },
            {
              "id": "chat_hard_sample_84",
              "rewards": [
                0.6487064585252204,
                -0.48189797907997856,
                0.7996302359104577,
                -0.38657769862614444,
                -0.38657769862614444,
                -0.48189797907997856
              ],
              "variance": 1.2060663262978175,
              "mean_reward": -0.04810244349609466,
              "min_reward": -0.48189797907997856,
              "max_reward": 0.7996302359104577,
              "num_responses": 6,
              "rvariance": 0.3016135786209475
            },
            {
              "id": "chat_hard_sample_343",
              "rewards": [
                0.12709270159729485,
                -1.3715539299824302,
                -1.3927362145277267,
                -0.3336219872629033
              ],
              "variance": 1.375259824103373,
              "mean_reward": -0.7427048575439413,
              "min_reward": -1.3927362145277267,
              "max_reward": 0.12709270159729485,
              "num_responses": 4,
              "rvariance": 0.4354721274035885
            },
            {
              "id": "chat_hard_sample_87",
              "rewards": [
                1.0246920092042326,
                -0.8102233895320738,
                -0.6407651131697021,
                -0.8843613854406114,
                -0.7784499627141291
              ],
              "variance": 1.2132153473318552,
              "mean_reward": -0.41782156833045675,
              "min_reward": -0.8843613854406114,
              "max_reward": 1.0246920092042326,
              "num_responses": 5,
              "rvariance": 0.5264481349249369
            },
            {
              "id": "chat_hard_sample_110",
              "rewards": [
                1.6733994734039368,
                -0.6407651131697021,
                -0.7043119668055915,
                -0.725494251350888,
                -0.7043119668055915,
                -0.6301739708970538,
                -0.7043119668055915
              ],
              "variance": 1.0040402874470533,
              "mean_reward": -0.3479956803472116,
              "min_reward": -0.725494251350888,
              "max_reward": 1.6733994734039368,
              "num_responses": 7,
              "rvariance": 0.6821094221653928
            },
            {
              "id": "chat_hard_sample_150",
              "rewards": [
                2.049385024082949,
                0.07413699023405368,
                0.5189649656852795,
                1.5502774444844012,
                -0.4077599831714409,
                1.3642705083210165,
                1.0193964380679086
              ],
              "variance": 1.8685422754519647,
              "mean_reward": 0.8812387696720239,
              "min_reward": -0.4077599831714409,
              "max_reward": 2.049385024082949,
              "num_responses": 7,
              "rvariance": 0.6441084283181147
            },
            {
              "id": "chat_hard_sample_65",
              "rewards": [
                0.22241298205112894,
                -0.22771056453642097,
                0.6089896750027894,
                0.021181278870812514,
                0.770504594660675,
                -0.4607156945346821,
                0.770504594660675
              ],
              "variance": 1.0914172111964004,
              "mean_reward": 0.24359526659642544,
              "min_reward": -0.4607156945346821,
              "max_reward": 0.770504594660675,
              "num_responses": 7,
              "rvariance": 0.2081256773200985
            },
            {
              "id": "chat_hard_sample_46",
              "rewards": [
                1.1233220216182693,
                2.2082521581726726,
                3.3415043813460334,
                3.277957527710144,
                3.3203220968007368,
                3.3097309545280886,
                3.638056364980184
              ],
              "variance": 1.6858450712487825,
              "mean_reward": 2.888449357879447,
              "min_reward": 1.1233220216182693,
              "max_reward": 3.638056364980184,
              "num_responses": 7,
              "rvariance": 0.6944601605359023
            },
            {
              "id": "chat_hard_sample_114",
              "rewards": [
                2.2082521581726726,
                0.19593512636950836,
                0.7890390936378094,
                0.7890390936378094
              ],
              "variance": 1.4086219222622152,
              "mean_reward": 0.9955663679544499,
              "min_reward": 0.19593512636950836,
              "max_reward": 2.2082521581726726,
              "num_responses": 4,
              "rvariance": 0.5488309945972981
            },
            {
              "id": "chat_hard_sample_371",
              "rewards": [
                0.8817115885234814,
                -0.31243970271760685,
                -0.8102233895320738,
                0.4236446852314454
              ],
              "variance": 1.4051798010236043,
              "mean_reward": 0.04567329537631151,
              "min_reward": -0.8102233895320738,
              "max_reward": 0.8817115885234814,
              "num_responses": 4,
              "rvariance": 0.42565661344960837
            },
            {
              "id": "chat_hard_sample_223",
              "rewards": [
                2.3406414365807757,
                2.5524642820337404,
                2.5683509954427124,
                0.9306956215344795,
                3.4474158040725156
              ],
              "variance": 1.6011159330675966,
              "mean_reward": 2.3679136279328445,
              "min_reward": 0.9306956215344795,
              "max_reward": 3.4474158040725156,
              "num_responses": 5,
              "rvariance": 0.6611796801700949
            },
            {
              "id": "chat_hard_sample_52",
              "rewards": [
                1.133251217498877,
                1.1041255762490945,
                0.4818959677310107,
                0.41834911409512127,
                1.8243232507891742,
                0.43953139864041774,
                1.7475374693124746
              ],
              "variance": 1.3471932970808553,
              "mean_reward": 1.0212877134737386,
              "min_reward": 0.41834911409512127,
              "max_reward": 1.8243232507891742,
              "num_responses": 7,
              "rvariance": 0.3120887913763675
            },
            {
              "id": "chat_hard_sample_372",
              "rewards": [
                0.4818959677310107,
                -0.503080263625275,
                -0.8949525277132596,
                -0.4924891213526268
              ],
              "variance": 0.9669712894927839,
              "mean_reward": -0.3521564862400377,
              "min_reward": -0.8949525277132596,
              "max_reward": 0.4818959677310107,
              "num_responses": 4,
              "rvariance": 0.2581855684179998
            },
            {
              "id": "chat_hard_sample_346",
              "rewards": [
                2.213547729308997,
                1.2522360814681595,
                0.5666251059121965,
                0.4818959677310107,
                1.4403943434056758
              ],
              "variance": 1.3884987519441836,
              "mean_reward": 1.1909398455652078,
              "min_reward": 0.4818959677310107,
              "max_reward": 2.213547729308997,
              "num_responses": 5,
              "rvariance": 0.4008447547531649
            },
            {
              "id": "chat_hard_sample_108",
              "rewards": [
                2.2294344427179693,
                0.10061484591567427,
                1.0167486524997464,
                1.0167486524997464,
                1.5542491228366442
              ],
              "variance": 1.4922919462161361,
              "mean_reward": 1.1835591432939563,
              "min_reward": 0.10061484591567427,
              "max_reward": 2.2294344427179693,
              "num_responses": 5,
              "rvariance": 0.49193720675615565
            },
            {
              "id": "chat_hard_sample_64",
              "rewards": [
                2.589533279988009,
                0.5083738234126313,
                1.0875769164480815,
                1.4787872341440256,
                0.8737682318189953,
                2.1658875890820797
              ],
              "variance": 1.6866394069192312,
              "mean_reward": 1.4506545124823038,
              "min_reward": 0.5083738234126313,
              "max_reward": 2.589533279988009,
              "num_responses": 6,
              "rvariance": 0.5269851115864905
            },
            {
              "id": "chat_hard_sample_233",
              "rewards": [
                0.5851596048893309,
                -0.7784499627141291,
                -0.2700751336270139,
                0.5639773203440345,
                -0.14298142635523511,
                -0.18534599544582803,
                -0.3548042718081998
              ],
              "variance": 1.0967127823327245,
              "mean_reward": -0.08321712353100578,
              "min_reward": -0.7784499627141291,
              "max_reward": 0.5851596048893309,
              "num_responses": 7,
              "rvariance": 0.21023062476746585
            },
            {
              "id": "chat_hard_sample_47",
              "rewards": [
                0.38657568727717656,
                -1.0326373772576867,
                -0.7466765358961844,
                -1.1067753731662244
              ],
              "variance": 1.1311339947188315,
              "mean_reward": -0.6248783997607297,
              "min_reward": -1.1067753731662244,
              "max_reward": 0.38657568727717656,
              "num_responses": 4,
              "rvariance": 0.3590915582146238
            },
            {
              "id": "chat_hard_sample_26",
              "rewards": [
                0.20123069750583247,
                -0.5878094018064609,
                -0.7678588204414809,
                -0.5666271172611644,
                0.09002370364302603,
                -1.0114550927123902,
                0.15886612841523953
              ],
              "variance": 1.0411092854013213,
              "mean_reward": -0.3548042718081998,
              "min_reward": -1.0114550927123902,
              "max_reward": 0.20123069750583247,
              "num_responses": 7,
              "rvariance": 0.21026696630169847
            },
            {
              "id": "chat_hard_sample_379",
              "rewards": [
                0.2541864088690736,
                -0.7043119668055915,
                -0.9796816658944455,
                -0.1747548531731798,
                -0.3336219872629033,
                -1.318598218619189,
                -0.4395334099893856
              ],
              "variance": 1.1120699386280646,
              "mean_reward": -0.5280450989822316,
              "min_reward": -1.318598218619189,
              "max_reward": 0.2541864088690736,
              "num_responses": 7,
              "rvariance": 0.23462208962148193
            },
            {
              "id": "chat_hard_sample_247",
              "rewards": [
                1.5171801248823755,
                1.996429312719708,
                0.4236446852314454,
                1.9646558859017633
              ],
              "variance": 1.2351919675476,
              "mean_reward": 1.475477502183823,
              "min_reward": 0.4236446852314454,
              "max_reward": 1.996429312719708,
              "num_responses": 4,
              "rvariance": 0.40469441588885613
            },
            {
              "id": "chat_hard_sample_215",
              "rewards": [
                1.542334087779915,
                1.7925498239712294,
                1.2299367623862947,
                0.5189649656852795,
                1.6839906156765851,
                1.7819586816985813,
                0.29125540682334244
              ],
              "variance": 1.3583139964671358,
              "mean_reward": 1.262998620574461,
              "min_reward": 0.29125540682334244,
              "max_reward": 1.7925498239712294,
              "num_responses": 7,
              "rvariance": 0.3291386606836904
            },
            {
              "id": "chat_hard_sample_49",
              "rewards": [
                -0.6089916863517574,
                -2.09175160452251,
                -1.8587464745242488,
                -1.9434756127054347,
                -2.261209880884882,
                -0.7360853936235362,
                -1.9858401817960276
              ],
              "variance": 1.4742870043526344,
              "mean_reward": -1.6408715477726281,
              "min_reward": -2.261209880884882,
              "max_reward": -0.6089916863517574,
              "num_responses": 7,
              "rvariance": 0.38993836693285405
            },
            {
              "id": "chat_hard_sample_415",
              "rewards": [
                0.3389155470502595,
                0.47130482545836244,
                0.9717362978409915,
                0.7201966688655959,
                0.6142852461391136,
                1.0339592586928,
                1.449661592894243
              ],
              "variance": 0.781891078278256,
              "mean_reward": 0.8000084909916236,
              "min_reward": 0.3389155470502595,
              "max_reward": 1.449661592894243,
              "num_responses": 7,
              "rvariance": 0.12396977249744238
            },
            {
              "id": "chat_hard_sample_297",
              "rewards": [
                0.8208125204557541,
                -0.4289422677167374,
                0.16416169955156365,
                -0.6301739708970538,
                0.03706799227978486,
                -0.0794345727193457,
                -0.8314056740773703
              ],
              "variance": 1.1374886800824204,
              "mean_reward": -0.13541632473191495,
              "min_reward": -0.8314056740773703,
              "max_reward": 0.8208125204557541,
              "num_responses": 7,
              "rvariance": 0.2646213107460334
            },
            {
              "id": "chat_hard_sample_80",
              "rewards": [
                2.393597147944017,
                2.393597147944017,
                2.298276867490183,
                2.298276867490183,
                0.24889083773274953
              ],
              "variance": 1.324951898308294,
              "mean_reward": 1.9265277737202298,
              "min_reward": 0.24889083773274953,
              "max_reward": 2.393597147944017,
              "num_responses": 5,
              "rvariance": 0.7054336134205248
            },
            {
              "id": "chat_hard_sample_413",
              "rewards": [
                -0.11120799953729041,
                -1.0220462349850385,
                -1.6681059136165808,
                -1.19150451134741,
                -0.6725385399876468,
                -1.7316527672524702
              ],
              "variance": 1.3080060706720569,
              "mean_reward": -1.066175994454406,
              "min_reward": -1.7316527672524702,
              "max_reward": -0.11120799953729041,
              "num_responses": 6,
              "rvariance": 0.31495799206813646
            },
            {
              "id": "chat_hard_sample_306",
              "rewards": [
                0.7652090235243509,
                -1.3397805031644854,
                -1.3503716454371337,
                -0.5666271172611644,
                -1.3291893608918373,
                -0.545444832715868,
                -0.8102233895320738
              ],
              "variance": 1.3228336698537648,
              "mean_reward": -0.7394896893540303,
              "min_reward": -1.3503716454371337,
              "max_reward": 0.7652090235243509,
              "num_responses": 7,
              "rvariance": 0.48827541087456494
            },
            {
              "id": "chat_hard_sample_43",
              "rewards": [
                0.47130482545836244,
                -0.0794345727193457,
                -0.5560359749885162,
                -0.9479082390765008,
                -0.28066627589966214,
                0.03706799227978486,
                -0.6089916863517574
              ],
              "variance": 0.9553210329928707,
              "mean_reward": -0.28066627589966214,
              "min_reward": -0.9479082390765008,
              "max_reward": 0.47130482545836244,
              "num_responses": 7,
              "rvariance": 0.1908210977952692
            },
            {
              "id": "chat_hard_sample_102",
              "rewards": [
                1.8905178899932258,
                1.039254829829124,
                2.409483861352989,
                0.3071421202323148,
                2.2453211561269413,
                2.0229071684013284
              ],
              "variance": 1.6542040337092456,
              "mean_reward": 1.6524378376559874,
              "min_reward": 0.3071421202323148,
              "max_reward": 2.409483861352989,
              "num_responses": 6,
              "rvariance": 0.5507288193444081
            },
            {
              "id": "chat_hard_sample_187",
              "rewards": [
                -0.365395414080848,
                -1.4033273568003748,
                -0.5348536904432197,
                -0.5242625481705715,
                -0.8208145318047221,
                -0.5348536904432197
              ],
              "variance": 0.6672419631768387,
              "mean_reward": -0.6972512052904926,
              "min_reward": -1.4033273568003748,
              "max_reward": -0.365395414080848,
              "num_responses": 6,
              "rvariance": 0.11776844578315693
            },
            {
              "id": "chat_hard_sample_360",
              "rewards": [
                2.483621857261527,
                1.3794952753379484,
                1.3794952753379484,
                0.9823274401136397,
                1.493350054768917,
                1.493350054768917
              ],
              "variance": 0.807574598289428,
              "mean_reward": 1.5352733262648162,
              "min_reward": 0.9823274401136397,
              "max_reward": 2.483621857261527,
              "num_responses": 6,
              "rvariance": 0.20952713549035237
            },
            {
              "id": "chat_hard_sample_236",
              "rewards": [
                1.5780791929501028,
                -1.1491399422568174,
                -0.13239028408258688,
                0.4236446852314454,
                -0.05295671703772512,
                -0.6619473977149986,
                -1.096184230893576
              ],
              "variance": 2.0027850037577815,
              "mean_reward": -0.15584209911487942,
              "min_reward": -1.1491399422568174,
              "max_reward": 1.5780791929501028,
              "num_responses": 7,
              "rvariance": 0.7829214104344938
            },
            {
              "id": "chat_hard_sample_259",
              "rewards": [
                2.727218129532436,
                -0.38657769862614444,
                1.1286175927545934,
                2.674262418169195,
                0.5136693945489553,
                0.5719206770485207,
                2.2612078695359137
              ],
              "variance": 2.5418741454355755,
              "mean_reward": 1.3557597689947813,
              "min_reward": -0.38657769862614444,
              "max_reward": 2.727218129532436,
              "num_responses": 7,
              "rvariance": 1.2642909819203432
            },
            {
              "id": "chat_hard_sample_127",
              "rewards": [
                1.0273397947723946,
                -0.4713068368073303,
                0.9849752256818017,
                0.06354584796140544,
                -1.0220462349850385
              ],
              "variance": 1.8121444428501128,
              "mean_reward": 0.11650155932464656,
              "min_reward": -1.0220462349850385,
              "max_reward": 1.0273397947723946,
              "num_responses": 5,
              "rvariance": 0.6456973796332178
            },
            {
              "id": "chat_hard_sample_280",
              "rewards": [
                0.8049258070467817,
                -0.28066627589966214,
                0.4289402563677695,
                -0.48189797907997856,
                -0.15357256862788332,
                -0.05295671703772512,
                -0.026478861356104534
              ],
              "variance": 0.9404934338111632,
              "mean_reward": 0.034041951630456806,
              "min_reward": -0.48189797907997856,
              "max_reward": 0.8049258070467817,
              "num_responses": 7,
              "rvariance": 0.16598180222413375
            },
            {
              "id": "chat_hard_sample_421",
              "rewards": [
                0.5586817492077103,
                -0.6513562554423503,
                -1.127957657711521,
                -0.22771056453642097,
                -1.2444602227106514,
                -1.223277938165355,
                -0.8843613854406114
              ],
              "variance": 1.3185972129447052,
              "mean_reward": -0.6857774678284569,
              "min_reward": -1.2444602227106514,
              "max_reward": 0.5586817492077103,
              "num_responses": 7,
              "rvariance": 0.37081155992775905
            },
            {
              "id": "chat_hard_sample_270",
              "rewards": [
                3.3097309545280886,
                2.404188290216665,
                1.6072048341998855,
                2.5524642820337404,
                1.4721677702236204,
                2.414779432489313
              ],
              "variance": 1.3914113160691617,
              "mean_reward": 2.293422593948552,
              "min_reward": 1.4721677702236204,
              "max_reward": 3.3097309545280886,
              "num_responses": 6,
              "rvariance": 0.3787226834943675
            },
            {
              "id": "chat_hard_sample_276",
              "rewards": [
                0.8896549452279676,
                -0.9267259545312043,
                -0.6089916863517574,
                -0.3230308449902551,
                -0.9055436699859079,
                -0.6513562554423503
              ],
              "variance": 1.1994468623774124,
              "mean_reward": -0.42099891101225123,
              "min_reward": -0.9267259545312043,
              "max_reward": 0.8896549452279676,
              "num_responses": 6,
              "rvariance": 0.3843934214242406
            },
            {
              "id": "chat_hard_sample_349",
              "rewards": [
                0.770504594660675,
                0.770504594660675,
                0.11650155932464662,
                0.11650155932464662,
                0.10591041705199838,
                0.11650155932464662,
                -0.1747548531731798
              ],
              "variance": 0.7768602856987479,
              "mean_reward": 0.26023849016772976,
              "min_reward": -0.1747548531731798,
              "max_reward": 0.770504594660675,
              "num_responses": 7,
              "rvariance": 0.11368003907941364
            },
            {
              "id": "chat_hard_sample_267",
              "rewards": [
                0.8022780214786197,
                -1.8375641899789523,
                -0.8525879586226667,
                -0.10061685726464217,
                -1.180913369074762,
                -1.2868247918012443,
                -1.180913369074762
              ],
              "variance": 1.7676616453049905,
              "mean_reward": -0.8053060734769157,
              "min_reward": -1.8375641899789523,
              "max_reward": 0.8022780214786197,
              "num_responses": 7,
              "rvariance": 0.6661039809509293
            },
            {
              "id": "chat_hard_sample_14",
              "rewards": [
                1.0577893288062583,
                0.2382996954601013,
                0.22241298205112894,
                0.6089896750027894,
                0.16416169955156365,
                -0.5560359749885162
              ],
              "variance": 1.029326639623,
              "mean_reward": 0.28926956764722095,
              "min_reward": -0.5560359749885162,
              "max_reward": 1.0577893288062583,
              "num_responses": 6,
              "rvariance": 0.23835079005297954
            },
            {
              "id": "chat_hard_sample_13",
              "rewards": [
                0.9783557617613966,
                0.9492301205116139,
                1.0889008092321626,
                0.4818959677310107,
                0.7996302359104577,
                0.29655097795966656,
                0.7043099554566236
              ],
              "variance": 0.61481580892723,
              "mean_reward": 0.7569819755089903,
              "min_reward": 0.29655097795966656,
              "max_reward": 1.0889008092321626,
              "num_responses": 7,
              "rvariance": 0.06977114938114101
            },
            {
              "id": "chat_hard_sample_147",
              "rewards": [
                0.9240761576140744,
                -0.13239028408258688,
                0.9915946896022069,
                -0.015887719083456302,
                -0.5560359749885162
              ],
              "variance": 1.3511649754330983,
              "mean_reward": 0.24227137381234437,
              "min_reward": -0.5560359749885162,
              "max_reward": 0.9915946896022069,
              "num_responses": 5,
              "rvariance": 0.37413105861841156
            },
            {
              "id": "chat_hard_sample_173",
              "rewards": [
                1.9593603147654393,
                0.1112059881883225,
                1.1094211473854185,
                0.1112059881883225,
                1.1094211473854185,
                0.1112059881883225
              ],
              "variance": 1.4231847428871063,
              "mean_reward": 0.7519700956835407,
              "min_reward": 0.1112059881883225,
              "max_reward": 1.9593603147654393,
              "num_responses": 6,
              "rvariance": 0.4908449290371038
            },
            {
              "id": "chat_hard_sample_345",
              "rewards": [
                -0.21711942226377273,
                -0.8419968163500186,
                -1.233869080438003,
                -0.5666271172611644,
                -1.0326373772576867,
                -0.9267259545312043
              ],
              "variance": 0.7413799590853763,
              "mean_reward": -0.8031626280169749,
              "min_reward": -1.233869080438003,
              "max_reward": -0.21711942226377273,
              "num_responses": 6,
              "rvariance": 0.10905639756615759
            },
            {
              "id": "chat_hard_sample_412",
              "rewards": [
                1.6575127599949646,
                0.4924871100036589,
                1.29145640519656,
                1.768719753857771,
                0.4924871100036589,
                1.29145640519656,
                0.4660092543220383
              ],
              "variance": 1.2200995898090765,
              "mean_reward": 1.0657326855107445,
              "min_reward": 0.4660092543220383,
              "max_reward": 1.768719753857771,
              "num_responses": 7,
              "rvariance": 0.2804551490958502
            },
            {
              "id": "chat_hard_sample_21",
              "rewards": [
                1.1587361535924368,
                0.3018465490959907,
                -0.02118329021978042,
                0.1376838438699431,
                -0.5772182595338127,
                0.11650155932464662
              ],
              "variance": 1.0294921262210104,
              "mean_reward": 0.18606109268823734,
              "min_reward": -0.5772182595338127,
              "max_reward": 1.1587361535924368,
              "num_responses": 6,
              "rvariance": 0.26537125611349416
            },
            {
              "id": "chat_hard_sample_357",
              "rewards": [
                0.6195808172754377,
                0.05825027682508133,
                0.18534398409686012,
                -0.2594839913543657,
                0.01059013659816428,
                -0.6513562554423503,
                -1.0114550927123902
              ],
              "variance": 1.1544345077186575,
              "mean_reward": -0.14979001781622325,
              "min_reward": -1.0114550927123902,
              "max_reward": 0.6195808172754377,
              "num_responses": 7,
              "rvariance": 0.2541881427293106
            },
            {
              "id": "chat_hard_sample_184",
              "rewards": [
                0.7334355967064062,
                0.2806642645506942,
                0.9095133369891831,
                0.015885707734488396,
                0.09531927477935015,
                0.6540020296615444
              ],
              "variance": 0.7658719755908754,
              "mean_reward": 0.4481367017369444,
              "min_reward": 0.015885707734488396,
              "max_reward": 0.9095133369891831,
              "num_responses": 6,
              "rvariance": 0.1126687446778613
            },
            {
              "id": "chat_hard_sample_348",
              "rewards": [
                0.5851596048893309,
                0.3071421202323148,
                2.1447053045367834,
                0.3071421202323148,
                0.3071421202323148,
                0.40775797182247303
              ],
              "variance": 1.0577903344807424,
              "mean_reward": 0.676508206990922,
              "min_reward": 0.3071421202323148,
              "max_reward": 2.1447053045367834,
              "num_responses": 6,
              "rvariance": 0.4409113152322008
            },
            {
              "id": "chat_hard_sample_283",
              "rewards": [
                -0.15357256862788332,
                -0.6195828286244056,
                -1.0538196618029831,
                -1.2126867958927066,
                -1.2656425072559478,
                -0.34421312953555155
              ],
              "variance": 0.9902718024926096,
              "mean_reward": -0.7749195819565798,
              "min_reward": -1.2656425072559478,
              "max_reward": -0.15357256862788332,
              "num_responses": 6,
              "rvariance": 0.18432400726924622
            },
            {
              "id": "chat_hard_sample_0",
              "rewards": [
                0.04236356341610898,
                -0.3548042718081998,
                -0.38657769862614444,
                0.015885707734488396,
                -0.6937208245329433,
                -0.2594839913543657,
                -0.19593713771847626
              ],
              "variance": 0.5359117989960005,
              "mean_reward": -0.2617535218413617,
              "min_reward": -0.6937208245329433,
              "max_reward": 0.04236356341610898,
              "num_responses": 7,
              "rvariance": 0.054963279758092
            },
            {
              "id": "chat_hard_sample_258",
              "rewards": [
                0.5666251059121965,
                -1.7104704827071737,
                -1.4351007836183196,
                -0.8208145318047221,
                -1.1597310845294655,
                -1.3291893608918373,
                -1.0644108040756315
              ],
              "variance": 1.279409986535907,
              "mean_reward": -0.9932988488164219,
              "min_reward": -1.7104704827071737,
              "max_reward": 0.5666251059121965,
              "num_responses": 7,
              "rvariance": 0.4740309602244158
            },
            {
              "id": "chat_hard_sample_161",
              "rewards": [
                1.1507927968879506,
                -0.3971688408987927,
                0.3706889738682042,
                -0.503080263625275,
                0.29125540682334244
              ],
              "variance": 1.2994669622147343,
              "mean_reward": 0.18249761461108588,
              "min_reward": -0.503080263625275,
              "max_reward": 1.1507927968879506,
              "num_responses": 5,
              "rvariance": 0.35817400637139385
            },
            {
              "id": "chat_hard_sample_4",
              "rewards": [
                0.5030782522763071,
                -0.7890411049867774,
                -1.000863950439742,
                -0.2700751336270139,
                -0.7149031090782397,
                -0.9161348122585561,
                -1.1597310845294655
              ],
              "variance": 1.1035970248099463,
              "mean_reward": -0.6210958489490697,
              "min_reward": -1.1597310845294655,
              "max_reward": 0.5030782522763071,
              "num_responses": 7,
              "rvariance": 0.2779125830455599
            },
            {
              "id": "chat_hard_sample_238",
              "rewards": [
                0.632819745116248,
                -0.005296576810808069,
                0.7334355967064062,
                -0.11120799953729041,
                -0.09532128612831806,
                -0.5878094018064609
              ],
              "variance": 1.0326363715832028,
              "mean_reward": 0.09443667958996277,
              "min_reward": -0.5878094018064609,
              "max_reward": 0.7334355967064062,
              "num_responses": 6,
              "rvariance": 0.20864669982357273
            },
            {
              "id": "chat_hard_sample_8",
              "rewards": [
                -0.06354785931037335,
                -0.03177443249242865,
                0.270073122278046,
                -0.24889284908171744,
                0.40775797182247303,
                0.16945727068788777,
                -0.2594839913543657
              ],
              "variance": 0.5782763680865936,
              "mean_reward": 0.0347984617927888,
              "min_reward": -0.2594839913543657,
              "max_reward": 0.40775797182247303,
              "num_responses": 7,
              "rvariance": 0.05625326114644597
            },
            {
              "id": "chat_hard_sample_32",
              "rewards": [
                0.4607136831857142,
                -0.21711942226377273,
                -0.1747548531731798,
                0.4289402563677695,
                0.1112059881883225,
                0.6910710276158133,
                -0.12179914180993863
              ],
              "variance": 0.7445573017671708,
              "mean_reward": 0.16832250544438976,
              "min_reward": -0.21711942226377273,
              "max_reward": 0.6910710276158133,
              "num_responses": 7,
              "rvariance": 0.11148295010430676
            },
            {
              "id": "chat_hard_sample_109",
              "rewards": [
                2.780173840895677,
                -0.18534599544582803,
                1.580726978518265,
                2.298276867490183,
                1.580726978518265,
                1.580726978518265,
                0.8393470194328886
              ],
              "variance": 2.0615658433709787,
              "mean_reward": 1.496376095418245,
              "min_reward": -0.18534599544582803,
              "max_reward": 2.780173840895677,
              "num_responses": 7,
              "rvariance": 0.7960575873674527
            },
            {
              "id": "chat_hard_sample_188",
              "rewards": [
                1.18852374123426,
                0.5666251059121965,
                -1.0220462349850385,
                -0.09002571499199394,
                0.19063955523318424,
                -1.0056744839526915e-06,
                0.12709270159729485
              ],
              "variance": 1.2782184830302339,
              "mean_reward": 0.1372583069036313,
              "min_reward": -1.0220462349850385,
              "max_reward": 1.18852374123426,
              "num_responses": 7,
              "rvariance": 0.3867075607222656
            },
            {
              "id": "chat_hard_sample_53",
              "rewards": [
                0.2065262686421566,
                -1.2126867958927066,
                0.02647685000713663,
                -0.015887719083456302,
                -0.6089916863517574,
                -0.365395414080848,
                -0.3548042718081998
              ],
              "variance": 0.9489663476292817,
              "mean_reward": -0.33210896693823927,
              "min_reward": -1.2126867958927066,
              "max_reward": 0.2065262686421566,
              "num_responses": 7,
              "rvariance": 0.19605885718578192
            },
            {
              "id": "chat_hard_sample_356",
              "rewards": [
                -0.18534599544582803,
                -0.9267259545312043,
                -1.4456919258909677,
                -1.4774653527089125,
                -0.5878094018064609,
                -0.683129682260295,
                -1.8799287590695453
              ],
              "variance": 1.211626675990958,
              "mean_reward": -1.0265852959590307,
              "min_reward": -1.8799287590695453,
              "max_reward": -0.18534599544582803,
              "num_responses": 7,
              "rvariance": 0.30503996450429033
            },
            {
              "id": "chat_hard_sample_63",
              "rewards": [
                1.2279095515606706,
                0.31773326250496303,
                0.38128011614085244,
                1.0299875803405567,
                0.8923027307961297,
                0.632819745116248,
                0.4236446852314454
              ],
              "variance": 0.7532949941421057,
              "mean_reward": 0.7008110959558379,
              "min_reward": 0.31773326250496303,
              "max_reward": 1.2279095515606706,
              "num_responses": 7,
              "rvariance": 0.10759310036463805
            },
            {
              "id": "chat_hard_sample_159",
              "rewards": [
                0.5083738234126313,
                -0.19593713771847626,
                -0.005296576810808069,
                -0.2912574181723104
              ],
              "variance": 0.6169340373817598,
              "mean_reward": 0.003970672677759135,
              "min_reward": -0.2912574181723104,
              "max_reward": 0.5083738234126313,
              "num_responses": 4,
              "rvariance": 0.09540779466718587
            },
            {
              "id": "chat_hard_sample_152",
              "rewards": [
                1.0273397947723946,
                -0.5666271172611644,
                -0.37598655635349626,
                -1.096184230893576,
                -0.725494251350888,
                0.15886612841523953
              ],
              "variance": 1.5039422027160492,
              "mean_reward": -0.2630143721119151,
              "min_reward": -1.096184230893576,
              "max_reward": 1.0273397947723946,
              "num_responses": 6,
              "rvariance": 0.4760000164055447
            },
            {
              "id": "chat_hard_sample_318",
              "rewards": [
                1.0538176504540153,
                1.4112687021558932,
                1.333820974287153,
                0.270073122278046,
                1.086914970056041,
                1.1929918793805334
              ],
              "variance": 0.7105994518554924,
              "mean_reward": 1.058147883101947,
              "min_reward": 0.270073122278046,
              "max_reward": 1.4112687021558932,
              "num_responses": 6,
              "rvariance": 0.14013016570659576
            },
            {
              "id": "chat_hard_sample_176",
              "rewards": [
                -0.8843613854406114,
                -0.9902728081670937,
                -1.2550513649832995,
                -0.8631791008953149,
                -1.8587464745242488,
                -1.3715539299824302,
                -0.7678588204414809
              ],
              "variance": 0.7413799590853763,
              "mean_reward": -1.1415748406334971,
              "min_reward": -1.8587464745242488,
              "max_reward": -0.7678588204414809,
              "num_responses": 7,
              "rvariance": 0.1266173391124375
            },
            {
              "id": "chat_hard_sample_274",
              "rewards": [
                -0.19593713771847626,
                -2.345939019066068,
                -2.1976630272489923,
                -2.0282047508866206,
                -1.9222933281601382,
                -2.324756734520771
              ],
              "variance": 1.2762326438541125,
              "mean_reward": -1.835798999600178,
              "min_reward": -2.345939019066068,
              "max_reward": -0.19593713771847626,
              "num_responses": 6,
              "rvariance": 0.5606527080934696
            },
            {
              "id": "chat_hard_sample_389",
              "rewards": [
                -0.09532128612831806,
                -1.318598218619189,
                -0.5242625481705715,
                -1.3291893608918373,
                -1.5198299217995055,
                -1.4774653527089125,
                -1.233869080438003
              ],
              "variance": 1.1417251369914796,
              "mean_reward": -1.0712193955366196,
              "min_reward": -1.5198299217995055,
              "max_reward": -0.09532128612831806,
              "num_responses": 7,
              "rvariance": 0.25314654285051547
            },
            {
              "id": "chat_hard_sample_42",
              "rewards": [
                1.0246920092042326,
                0.19063955523318424,
                0.06354584796140544,
                0.29125540682334244,
                0.44482696977674185,
                0.22770855318745306,
                0.4871915388673348
              ],
              "variance": 0.5623896546776214,
              "mean_reward": 0.38997998300767067,
              "min_reward": 0.06354584796140544,
              "max_reward": 1.0246920092042326,
              "num_responses": 7,
              "rvariance": 0.08538457775660573
            },
            {
              "id": "chat_hard_sample_5",
              "rewards": [
                0.2753686934143701,
                -0.5878094018064609,
                -0.545444832715868,
                -0.3971688408987927,
                -0.5136714058979233,
                0.03706799227978486,
                -0.4713068368073303
              ],
              "variance": 0.6947789330857242,
              "mean_reward": -0.31470923320460287,
              "min_reward": -0.5878094018064609,
              "max_reward": 0.2753686934143701,
              "num_responses": 7,
              "rvariance": 0.09581001962038134
            },
            {
              "id": "chat_hard_sample_17",
              "rewards": [
                1.359636883576733,
                0.2065262686421566,
                1.4152403805081362,
                1.269612174259223,
                1.2706050938472837,
                1.408620916587731
              ],
              "variance": 0.6738614270972437,
              "mean_reward": 1.1550402862368772,
              "min_reward": 0.2065262686421566,
              "max_reward": 1.4152403805081362,
              "num_responses": 6,
              "rvariance": 0.18333796277461142
            },
            {
              "id": "chat_hard_sample_182",
              "rewards": [
                2.3883015768076925,
                1.7766631105622572,
                0.16945727068788777,
                1.6363304754496681
              ],
              "variance": 1.5952908048176404,
              "mean_reward": 1.4926881083768764,
              "min_reward": 0.16945727068788777,
              "max_reward": 2.3883015768076925,
              "num_responses": 4,
              "rvariance": 0.6635845665325601
            },
            {
              "id": "chat_hard_sample_140",
              "rewards": [
                -0.365395414080848,
                -1.5198299217995055,
                -1.318598218619189,
                -1.3080070763465408,
                -1.2020956536200584
              ],
              "variance": 0.7392617306308467,
              "mean_reward": -1.1427852568932282,
              "min_reward": -1.5198299217995055,
              "max_reward": -0.365395414080848,
              "num_responses": 5,
              "rvariance": 0.16164476346727105
            },
            {
              "id": "chat_hard_sample_251",
              "rewards": [
                0.8022780214786197,
                -0.3548042718081998,
                -0.3018485604449586,
                0.2382996954601013,
                -0.2594839913543657,
                -0.10061685726464217
              ],
              "variance": 0.8486152745959398,
              "mean_reward": 0.003970672677759131,
              "min_reward": -0.3548042718081998,
              "max_reward": 0.8022780214786197,
              "num_responses": 6,
              "rvariance": 0.1657994149376648
            },
            {
              "id": "chat_hard_sample_98",
              "rewards": [
                0.01059013659816428,
                -0.6937208245329433,
                -0.15357256862788332,
                -0.2700751336270139,
                -0.9055436699859079,
                -0.41835112544408914,
                -0.38657769862614444
              ],
              "variance": 0.6905424761766648,
              "mean_reward": -0.4024644120351168,
              "min_reward": -0.9055436699859079,
              "max_reward": 0.01059013659816428,
              "num_responses": 7,
              "rvariance": 0.08407313483228752
            },
            {
              "id": "chat_hard_sample_409",
              "rewards": [
                0.860529303978185,
                -0.2383017068090692,
                -0.015887719083456302,
                -0.22771056453642097,
                -0.19593713771847626,
                -0.5878094018064609
              ],
              "variance": 0.8353763467551294,
              "mean_reward": -0.06751953766261644,
              "min_reward": -0.5878094018064609,
              "max_reward": 0.860529303978185,
              "num_responses": 6,
              "rvariance": 0.20099347238080054
            },
            {
              "id": "chat_hard_sample_248",
              "rewards": [
                0.06884141909772956,
                -1.9646578972507311,
                -1.6257413445259878,
                -1.3080070763465408,
                -1.2550513649832995,
                -0.6937208245329433,
                -1.6045590599806914
              ],
              "variance": 1.3726120385352114,
              "mean_reward": -1.1975565926460663,
              "min_reward": -1.9646578972507311,
              "max_reward": 0.06884141909772956,
              "num_responses": 7,
              "rvariance": 0.40150813789424006
            },
            {
              "id": "chat_hard_sample_382",
              "rewards": [
                0.015885707734488396,
                -2.0070224663413243,
                -0.7466765358961844,
                -0.7996322472594256,
                -1.5198299217995055,
                -0.5136714058979233,
                -1.2974159340738924
              ],
              "variance": 1.4128583791712743,
              "mean_reward": -0.9811946862191095,
              "min_reward": -2.0070224663413243,
              "max_reward": 0.015885707734488396,
              "num_responses": 7,
              "rvariance": 0.39187963439926793
            },
            {
              "id": "chat_hard_sample_254",
              "rewards": [
                0.9201044792618314,
                -0.958499381349149,
                -0.09532128612831806,
                -0.7466765358961844,
                -1.3715539299824302,
                -1.0750019463482796
              ],
              "variance": 1.6356695347321115,
              "mean_reward": -0.5544914334070883,
              "min_reward": -1.3715539299824302,
              "max_reward": 0.9201044792618314,
              "num_responses": 6,
              "rvariance": 0.5873250304705373
            },
            {
              "id": "chat_hard_sample_2",
              "rewards": [
                -0.047661145901401004,
                -0.2700751336270139,
                -0.6407651131697021,
                -0.7043119668055915,
                -0.9161348122585561,
                -0.9479082390765008,
                -0.7678588204414809
              ],
              "variance": 0.7477346444489653,
              "mean_reward": -0.6135307473257495,
              "min_reward": -0.9479082390765008,
              "max_reward": -0.047661145901401004,
              "num_responses": 7,
              "rvariance": 0.09633539802078459
            },
            {
              "id": "chat_hard_sample_203",
              "rewards": [
                0.8499381617055368,
                -1.0538196618029831,
                -1.180913369074762,
                -2.45185044179255,
                -1.3503716454371337,
                -1.4351007836183196,
                -1.9858401817960276
              ],
              "variance": 1.879927753395062,
              "mean_reward": -1.229708274545177,
              "min_reward": -2.45185044179255,
              "max_reward": 0.8499381617055368,
              "num_responses": 7,
              "rvariance": 0.9257656738125458
            },
            {
              "id": "chat_hard_sample_68",
              "rewards": [
                -0.047661145901401004,
                0.3918712584135007,
                -0.2700751336270139,
                -0.3548042718081998,
                0.3389155470502595
              ],
              "variance": 0.6916015904039297,
              "mean_reward": 0.011649250825429091,
              "min_reward": -0.3548042718081998,
              "max_reward": 0.3918712584135007,
              "num_responses": 5,
              "rvariance": 0.0937693079809239
            },
            {
              "id": "chat_hard_sample_220",
              "rewards": [
                0.3706889738682042,
                -1.1173665154388726,
                -1.498647637254209,
                -1.5621944908900984,
                -1.6257413445259878,
                -1.583376775435395,
                -2.0070224663413243
              ],
              "variance": 1.2561094735360812,
              "mean_reward": -1.2890943222882405,
              "min_reward": -2.0070224663413243,
              "max_reward": 0.3706889738682042,
              "num_responses": 7,
              "rvariance": 0.5168887890834558
            },
            {
              "id": "chat_hard_sample_11",
              "rewards": [
                0.3918712584135007,
                0.40775797182247303,
                -0.5136714058979233,
                -0.2383017068090692
              ],
              "variance": 0.8340524539710483,
              "mean_reward": 0.011914029382245325,
              "min_reward": -0.5136714058979233,
              "max_reward": 0.40775797182247303,
              "num_responses": 4,
              "rvariance": 0.15997697176903447
            },
            {
              "id": "chat_hard_sample_6",
              "rewards": [
                -0.0794345727193457,
                -0.8419968163500186,
                -0.6937208245329433,
                -0.41835112544408914,
                -1.180913369074762,
                -0.6513562554423503
              ],
              "variance": 0.7625622436306728,
              "mean_reward": -0.6442954939272515,
              "min_reward": -1.180913369074762,
              "max_reward": -0.0794345727193457,
              "num_responses": 6,
              "rvariance": 0.11660933207188233
            },
            {
              "id": "chat_hard_sample_286",
              "rewards": [
                -0.3018485604449586,
                -0.37598655635349626,
                -0.21711942226377273,
                -1.5198299217995055,
                -0.15357256862788332,
                -0.31243970271760685
              ],
              "variance": 0.7625622436306727,
              "mean_reward": -0.48013278870120385,
              "min_reward": -1.5198299217995055,
              "max_reward": -0.15357256862788332,
              "num_responses": 6,
              "rvariance": 0.22125673527929382
            },
            {
              "id": "chat_hard_sample_400",
              "rewards": [
                0.5957507471619792,
                0.13238827273361897,
                -0.2912574181723104,
                -0.37598655635349626,
                -0.4395334099893856,
                -0.41835112544408914,
                -0.3548042718081998
              ],
              "variance": 0.7445573017671709,
              "mean_reward": -0.16454196598169757,
              "min_reward": -0.4395334099893856,
              "max_reward": 0.5957507471619792,
              "num_responses": 7,
              "rvariance": 0.12903104652387626
            },
            {
              "id": "chat_hard_sample_209",
              "rewards": [
                -0.5666271172611644,
                -0.3018485604449586,
                -0.9267259545312043,
                -0.4289422677167374,
                -0.7149031090782397,
                -0.9055436699859079,
                -0.958499381349149
              ],
              "variance": 0.5613305404503564,
              "mean_reward": -0.6861557229096231,
              "min_reward": -0.958499381349149,
              "max_reward": -0.3018485604449586,
              "num_responses": 7,
              "rvariance": 0.05844863319867573
            },
            {
              "id": "chat_hard_sample_337",
              "rewards": [
                1.2088785927895058,
                0.0476591345524331,
                0.4554181120493901,
                0.6540020296615444,
                0.5507383925032242,
                0.23300412432377718,
                0.38128011614085244
              ],
              "variance": 0.7170865264974897,
              "mean_reward": 0.5044257860029611,
              "min_reward": 0.0476591345524331,
              "max_reward": 1.2088785927895058,
              "num_responses": 7,
              "rvariance": 0.11723482394220652
            },
            {
              "id": "chat_hard_sample_268",
              "rewards": [
                2.70603584498714,
                1.3550032588324494,
                2.134114162264135,
                1.3550032588324494,
                1.3550032588324494,
                1.9646558859017633
              ],
              "variance": 1.065071744793188,
              "mean_reward": 1.811635944941731,
              "min_reward": 1.3550032588324494,
              "max_reward": 2.70603584498714,
              "num_responses": 6,
              "rvariance": 0.2588164523750363
            },
            {
              "id": "chat_hard_sample_249",
              "rewards": [
                0.9280478359663175,
                -0.31243970271760685,
                -0.45012455226203385,
                -0.2700751336270139,
                -0.9690905236217973,
                -0.7466765358961844,
                -0.31243970271760685
              ],
              "variance": 1.0448161851967486,
              "mean_reward": -0.3046854735537036,
              "min_reward": -0.9690905236217973,
              "max_reward": 0.9280478359663175,
              "num_responses": 7,
              "rvariance": 0.3112703199331466
            },
            {
              "id": "chat_hard_sample_295",
              "rewards": [
                0.953201798863857,
                1.4629005207350532,
                1.328525403150829,
                1.273583852611466,
                1.5635163723252115,
                1.362284669144895,
                1.7607763971532848
              ],
              "variance": 0.49698935114401843,
              "mean_reward": 1.386398430569228,
              "min_reward": 0.953201798863857,
              "max_reward": 1.7607763971532848,
              "num_responses": 7,
              "rvariance": 0.05452848692407091
            },
            {
              "id": "chat_hard_sample_153",
              "rewards": [
                0.2859598356870183,
                0.2859598356870183,
                0.2859598356870183,
                0.2541864088690736,
                0.2859598356870183,
                -0.725494251350888
              ],
              "variance": 0.5216137569279256,
              "mean_reward": 0.11208858337770981,
              "min_reward": -0.725494251350888,
              "max_reward": 0.2859598356870183,
              "num_responses": 6,
              "rvariance": 0.1404436077599661
            },
            {
              "id": "chat_hard_sample_192",
              "rewards": [
                -0.545444832715868,
                -1.7104704827071737,
                -1.5621944908900984,
                -1.8375641899789523,
                -1.7316527672524702
              ],
              "variance": 0.8430549249027992,
              "mean_reward": -1.4774653527089125,
              "min_reward": -1.8375641899789523,
              "max_reward": -0.545444832715868,
              "num_responses": 5,
              "rvariance": 0.22488301629322222
            },
            {
              "id": "chat_hard_sample_363",
              "rewards": [
                -0.37598655635349626,
                -1.3291893608918373,
                -0.8208145318047221,
                -1.276233649528596,
                -1.096184230893576,
                -1.498647637254209
              ],
              "variance": 0.815517954993914,
              "mean_reward": -1.0661759944544063,
              "min_reward": -1.498647637254209,
              "max_reward": -0.37598655635349626,
              "num_responses": 6,
              "rvariance": 0.13963269554663485
            },
            {
              "id": "chat_hard_sample_129",
              "rewards": [
                1.4059731310195691,
                -0.41835112544408914,
                -0.4289422677167374,
                -0.22771056453642097,
                -0.22771056453642097
              ],
              "variance": 1.1772054636048512,
              "mean_reward": 0.02065172175718013,
              "min_reward": -0.4289422677167374,
              "max_reward": 1.4059731310195691,
              "num_responses": 5,
              "rvariance": 0.4874682625377188
            },
            {
              "id": "chat_hard_sample_359",
              "rewards": [
                0.587807390457493,
                0.5136693945489553,
                0.587807390457493,
                -0.10591242840096629,
                0.10061484591567427,
                0.23300412432377718,
                -0.15357256862788332
              ],
              "variance": 0.7127838749492261,
              "mean_reward": 0.2519168783820776,
              "min_reward": -0.15357256862788332,
              "max_reward": 0.587807390457493,
              "num_responses": 7,
              "rvariance": 0.08712467909258188
            },
            {
              "id": "chat_hard_sample_7",
              "rewards": [
                -0.2700751336270139,
                -0.15357256862788332,
                0.22770855318745306,
                -0.13239028408258688,
                0.11650155932464662,
                -0.11650357067361451
              ],
              "variance": 0.38392890738349844,
              "mean_reward": -0.05472190741649982,
              "min_reward": -0.2700751336270139,
              "max_reward": 0.22770855318745306,
              "num_responses": 6,
              "rvariance": 0.029180376091630458
            },
            {
              "id": "chat_hard_sample_316",
              "rewards": [
                -0.3971688408987927,
                -1.3080070763465408,
                -1.5621944908900984,
                -1.318598218619189,
                -1.3397805031644854,
                -1.3715539299824302,
                -1.6045590599806914
              ],
              "variance": 0.6354685363588943,
              "mean_reward": -1.271694588554604,
              "min_reward": -1.6045590599806914,
              "max_reward": -0.3971688408987927,
              "num_responses": 7,
              "rvariance": 0.13973005143274203
            },
            {
              "id": "chat_hard_sample_41",
              "rewards": [
                0.8261080915920782,
                0.5242605368216036,
                0.7599134523880268,
                0.7890390936378094,
                0.5507383925032242,
                0.5586817492077103
              ],
              "variance": 0.27007412795253005,
              "mean_reward": 0.6681235526917421,
              "min_reward": 0.5242605368216036,
              "max_reward": 0.8261080915920782,
              "num_responses": 6,
              "rvariance": 0.01574306996294318
            },
            {
              "id": "chat_hard_sample_143",
              "rewards": [
                1.6257393331770198,
                -0.19593713771847626,
                -0.34421312953555155,
                -0.5666271172611644
              ],
              "variance": 1.579139312851852,
              "mean_reward": 0.1297404871654569,
              "min_reward": -0.5666271172611644,
              "max_reward": 1.6257393331770198,
              "num_responses": 4,
              "rvariance": 0.7634095834742015
            },
            {
              "id": "chat_hard_sample_370",
              "rewards": [
                0.360097831595556,
                -0.7360853936235362,
                -1.541012206344802,
                -1.583376775435395,
                -0.6619473977149986,
                -1.233869080438003,
                -1.2868247918012443
              ],
              "variance": 1.3048287279902626,
              "mean_reward": -0.954716830537489,
              "min_reward": -1.583376775435395,
              "max_reward": 0.360097831595556,
              "num_responses": 7,
              "rvariance": 0.3984897874762371
            },
            {
              "id": "chat_hard_sample_91",
              "rewards": [
                0.35480226045923186,
                -0.10061685726464217,
                0.02647685000713663,
                0.44482696977674185,
                -0.37598655635349626,
                0.031772421143460745,
                -0.04236557476507689
              ],
              "variance": 0.6015768810864197,
              "mean_reward": 0.04841564471476511,
              "min_reward": -0.37598655635349626,
              "max_reward": 0.44482696977674185,
              "num_responses": 7,
              "rvariance": 0.06604887846812597
            },
            {
              "id": "chat_hard_sample_245",
              "rewards": [
                0.2806642645506942,
                -1.541012206344802,
                -1.3609627877097819,
                -1.3503716454371337,
                -1.4033273568003748,
                -1.3609627877097819,
                -0.7890411049867774
              ],
              "variance": 1.0972423394463573,
              "mean_reward": -1.0750019463482796,
              "min_reward": -1.541012206344802,
              "max_reward": 0.2806642645506942,
              "num_responses": 7,
              "rvariance": 0.35484904178522353
            },
            {
              "id": "chat_hard_sample_131",
              "rewards": [
                0.8870071596598056,
                -0.4289422677167374,
                -0.3018485604449586,
                -0.4395334099893856,
                -0.4289422677167374,
                -0.4289422677167374
              ],
              "variance": 0.7268171384604849,
              "mean_reward": -0.19020026898745845,
              "min_reward": -0.4395334099893856,
              "max_reward": 0.8870071596598056,
              "num_responses": 6,
              "rvariance": 0.2343335710653115
            },
            {
              "id": "chat_hard_sample_171",
              "rewards": [
                0.360097831595556,
                0.01059013659816428,
                -0.10061685726464217,
                0.4342358275040936,
                0.1376838438699431,
                0.06354584796140544,
                0.6619453863660306
              ],
              "variance": 0.5592123119958268,
              "mean_reward": 0.22392600237579297,
              "min_reward": -0.10061685726464217,
              "max_reward": 0.6619453863660306,
              "num_responses": 7,
              "rvariance": 0.06266196193916465
            },
            {
              "id": "chat_hard_sample_329",
              "rewards": [
                1.3563271516165305,
                0.6884232420476513,
                1.0154247597156654,
                0.7149010977292718,
                0.7149010977292718
              ],
              "variance": 0.5209518105358849,
              "mean_reward": 0.8979954697676782,
              "min_reward": 0.6884232420476513,
              "max_reward": 1.3563271516165305,
              "num_responses": 5,
              "rvariance": 0.06696503709997953
            },
            {
              "id": "chat_hard_sample_384",
              "rewards": [
                0.4871915388673348,
                0.7043099554566236,
                -0.026478861356104534,
                0.5957507471619792,
                -0.015887719083456302,
                0.180048412960536,
                0.29655097795966656
              ],
              "variance": 0.6592986064723526,
              "mean_reward": 0.3173550074237971,
              "min_reward": -0.026478861356104534,
              "max_reward": 0.7043099554566236,
              "num_responses": 7,
              "rvariance": 0.07209158853420206
            },
            {
              "id": "chat_hard_sample_29",
              "rewards": [
                0.38657568727717656,
                -0.2700751336270139,
                -0.41835112544408914,
                -0.6407651131697021,
                -0.3230308449902551,
                -0.24889284908171744,
                -0.8525879586226667
              ],
              "variance": 0.7307888168127282,
              "mean_reward": -0.3381610482368954,
              "min_reward": -0.8525879586226667,
              "max_reward": 0.38657568727717656,
              "num_responses": 7,
              "rvariance": 0.12867306810399362
            },
            {
              "id": "chat_hard_sample_106",
              "rewards": [
                0.21711741091480483,
                -0.15357256862788332,
                -0.2912574181723104,
                -0.03177443249242865,
                -0.3548042718081998,
                0.2118218397784807,
                -0.45012455226203385
              ],
              "variance": 0.6068724522227438,
              "mean_reward": -0.12179914180993864,
              "min_reward": -0.45012455226203385,
              "max_reward": 0.21711741091480483,
              "num_responses": 7,
              "rvariance": 0.060869494455435866
            },
            {
              "id": "chat_hard_sample_320",
              "rewards": [
                0.5931029615938171,
                -0.4395334099893856,
                0.47130482545836244,
                -0.047661145901401004,
                -0.1747548531731798,
                -0.11120799953729041
              ],
              "variance": 0.8393480251073725,
              "mean_reward": 0.04854172974182047,
              "min_reward": -0.4395334099893856,
              "max_reward": 0.5931029615938171,
              "num_responses": 6,
              "rvariance": 0.13302154093132076
            },
            {
              "id": "chat_hard_sample_23",
              "rewards": [
                0.44482696977674185,
                0.015885707734488396,
                0.19063955523318424,
                -0.21711942226377273,
                0.22770855318745306,
                0.2806642645506942,
                0.31773326250496303
              ],
              "variance": 0.44588708967849067,
              "mean_reward": 0.180048412960536,
              "min_reward": -0.21711942226377273,
              "max_reward": 0.44482696977674185,
              "num_responses": 7,
              "rvariance": 0.04089481370284911
            },
            {
              "id": "chat_hard_sample_235",
              "rewards": [
                -0.5666271172611644,
                -0.9690905236217973,
                -1.3397805031644854,
                -1.4033273568003748,
                -1.1491399422568174,
                -1.541012206344802,
                -1.3609627877097819
              ],
              "variance": 0.6502961355406016,
              "mean_reward": -1.1899914910227463,
              "min_reward": -1.541012206344802,
              "max_reward": -0.5666271172611644,
              "num_responses": 7,
              "rvariance": 0.09420641365313738
            },
            {
              "id": "chat_hard_sample_202",
              "rewards": [
                1.0048336174430172,
                0.23300412432377718,
                0.180048412960536,
                0.49778268113998303,
                0.3918712584135007,
                0.180048412960536,
                -0.21711942226377273
              ],
              "variance": 0.6794217767903843,
              "mean_reward": 0.3243527264253682,
              "min_reward": -0.21711942226377273,
              "max_reward": 1.0048336174430172,
              "num_responses": 7,
              "rvariance": 0.12012500986791176
            },
            {
              "id": "chat_hard_sample_304",
              "rewards": [
                0.8366992338647264,
                0.540147250230576,
                0.5454428213669,
                0.360097831595556,
                0.11650155932464662,
                0.45012254091306597,
                0.3442111181865836
              ],
              "variance": 0.4088180917242219,
              "mean_reward": 0.45617462221172206,
              "min_reward": 0.11650155932464662,
              "max_reward": 0.8366992338647264,
              "num_responses": 7,
              "rvariance": 0.04242859813975623
            },
            {
              "id": "chat_hard_sample_277",
              "rewards": [
                1.763424182721447,
                -0.2065282799911245,
                -0.6195828286244056,
                -0.6619473977149986,
                -1.0114550927123902,
                0.10591041705199838
              ],
              "variance": 1.771368545100417,
              "mean_reward": -0.10502983321157892,
              "min_reward": -1.0114550927123902,
              "max_reward": 1.763424182721447,
              "num_responses": 6,
              "rvariance": 0.8237411405563364
            },
            {
              "id": "chat_hard_sample_196",
              "rewards": [
                0.6063418894346274,
                -0.24889284908171744,
                -0.4289422677167374,
                0.3336199759139354,
                -0.07413900158302159,
                0.10061484591567427,
                0.13238827273361897
              ],
              "variance": 0.7636213578579376,
              "mean_reward": 0.06014155223091138,
              "min_reward": -0.4289422677167374,
              "max_reward": 0.6063418894346274,
              "num_responses": 7,
              "rvariance": 0.10467420628121567
            },
            {
              "id": "chat_hard_sample_185",
              "rewards": [
                -1.233869080438003,
                -2.218845311794289,
                -2.0282047508866206,
                -1.9011110436148417,
                -2.1976630272489923,
                -2.1129338890678064,
                -2.0493870354319172
              ],
              "variance": 0.5719216827230051,
              "mean_reward": -1.9631448769260673,
              "min_reward": -2.218845311794289,
              "max_reward": -1.233869080438003,
              "num_responses": 7,
              "rvariance": 0.09859715775759692
            },
            {
              "id": "chat_hard_sample_160",
              "rewards": [
                -0.13239028408258688,
                -0.9055436699859079,
                -1.043228519530335,
                -0.8949525277132596,
                -1.0114550927123902,
                -0.8631791008953149,
                -0.7572676781688327
              ],
              "variance": 0.516847742905234,
              "mean_reward": -0.8011452675840897,
              "min_reward": -1.043228519530335,
              "max_reward": -0.13239028408258688,
              "num_responses": 7,
              "rvariance": 0.08222000274023333
            },
            {
              "id": "chat_hard_sample_163",
              "rewards": [
                2.1129318777188386,
                2.0123160261286803,
                2.0123160261286803,
                0.6540020296615444,
                2.0123160261286803,
                1.8984612466977118
              ],
              "variance": 0.7863923137441315,
              "mean_reward": 1.783723872077356,
              "min_reward": 0.6540020296615444,
              "max_reward": 2.1129318777188386,
              "num_responses": 6,
              "rvariance": 0.25909618933767725
            },
            {
              "id": "chat_hard_sample_266",
              "rewards": [
                -0.8631791008953149,
                -2.09175160452251,
                -1.6045590599806914,
                -1.9646578972507311,
                -1.9222933281601382,
                -1.8799287590695453,
                -1.6681059136165808
              ],
              "variance": 0.7074883038129021,
              "mean_reward": -1.7134965233565016,
              "min_reward": -2.09175160452251,
              "max_reward": -0.8631791008953149,
              "num_responses": 7,
              "rvariance": 0.14491744775219215
            },
            {
              "id": "chat_hard_sample_289",
              "rewards": [
                -0.14298142635523511,
                -0.6937208245329433,
                -0.21711942226377273,
                -0.24889284908171744,
                -0.365395414080848,
                -0.48189797907997856,
                -0.5242625481705715
              ],
              "variance": 0.4045816348151625,
              "mean_reward": -0.3820386376521524,
              "min_reward": -0.6937208245329433,
              "max_reward": -0.14298142635523511,
              "num_responses": 7,
              "rvariance": 0.03281383002780112
            },
            {
              "id": "chat_hard_sample_69",
              "rewards": [
                0.19593512636950836,
                -0.8314056740773703,
                -0.6937208245329433,
                -0.5666271172611644,
                -0.4395334099893856,
                -0.6725385399876468,
                -0.8314056740773703
              ],
              "variance": 0.6460596786315425,
              "mean_reward": -0.5484708733651961,
              "min_reward": -0.8314056740773703,
              "max_reward": 0.19593512636950836,
              "num_responses": 7,
              "rvariance": 0.10899026424051982
            },
            {
              "id": "chat_hard_sample_40",
              "rewards": [
                0.35480226045923186,
                -0.5878094018064609,
                -0.03177443249242865,
                0.08472813250670191,
                -0.6089916863517574,
                -0.19593713771847626,
                -0.4713068368073303
              ],
              "variance": 0.7890400993122935,
              "mean_reward": -0.20804130031578855,
              "min_reward": -0.6089916863517574,
              "max_reward": 0.35480226045923186,
              "num_responses": 7,
              "rvariance": 0.11543101426027834
            },
            {
              "id": "chat_hard_sample_313",
              "rewards": [
                0.4871915388673348,
                -0.28066627589966214,
                -0.8314056740773703,
                -0.6619473977149986,
                -0.6937208245329433,
                -0.4607156945346821,
                -0.3548042718081998
              ],
              "variance": 0.775271614357851,
              "mean_reward": -0.39943837138578875,
              "min_reward": -0.8314056740773703,
              "max_reward": 0.4871915388673348,
              "num_responses": 7,
              "rvariance": 0.16401077476118298
            },
            {
              "id": "chat_hard_sample_226",
              "rewards": [
                1.3013856010771676,
                1.388100578434475,
                1.1160406113058237,
                1.489378376416674,
                1.1160406113058237,
                2.319459152035479,
                1.1160406113058237
              ],
              "variance": 0.7053700753583727,
              "mean_reward": 1.4066350774116094,
              "min_reward": 1.1160406113058237,
              "max_reward": 2.319459152035479,
              "num_responses": 7,
              "rvariance": 0.15783580797972757
            },
            {
              "id": "chat_hard_sample_28",
              "rewards": [
                0.4289402563677695,
                -0.3230308449902551,
                -0.5984005440791091,
                -0.06884343044669747,
                -0.3336219872629033,
                -0.3971688408987927,
                -0.6513562554423503
              ],
              "variance": 0.7498528729034951,
              "mean_reward": -0.2776402352503341,
              "min_reward": -0.6513562554423503,
              "max_reward": 0.4289402563677695,
              "num_responses": 7,
              "rvariance": 0.11498346969697182
            },
            {
              "id": "chat_hard_sample_323",
              "rewards": [
                0.6513542440933824,
                0.5083738234126313,
                0.1376838438699431,
                0.20123069750583247
              ],
              "variance": 0.4517122179284472,
              "mean_reward": 0.37466065222044725,
              "min_reward": 0.1376838438699431,
              "max_reward": 0.6513542440933824,
              "num_responses": 4,
              "rvariance": 0.0451686282055304
            },
            {
              "id": "chat_hard_sample_116",
              "rewards": [
                1.3536793660483684,
                0.47660039659468656,
                1.0994919515048107,
                0.4818959677310107,
                0.45012254091306597,
                0.767856809092513,
                0.767856809092513
              ],
              "variance": 0.7351576630001956,
              "mean_reward": 0.771071977282424,
              "min_reward": 0.45012254091306597,
              "max_reward": 1.3536793660483684,
              "num_responses": 7,
              "rvariance": 0.10295093436635806
            },
            {
              "id": "chat_hard_sample_36",
              "rewards": [
                0.015885707734488396,
                -0.4395334099893856,
                -0.5984005440791091,
                -0.31243970271760685,
                -0.4395334099893856,
                -0.09002571499199394,
                -0.3336219872629033
              ],
              "variance": 0.45541911772387406,
              "mean_reward": -0.3139527230422709,
              "min_reward": -0.5984005440791091,
              "max_reward": 0.015885707734488396,
              "num_responses": 7,
              "rvariance": 0.03882534932827591
            },
            {
              "id": "chat_hard_sample_351",
              "rewards": [
                0.2753686934143701,
                -0.10591242840096629,
                -0.14298142635523511,
                0.6672409575023548,
                0.5692728914803585,
                0.19593512636950836,
                0.25948198000539774
              ],
              "variance": 0.7292001454718309,
              "mean_reward": 0.24548654200225545,
              "min_reward": -0.14298142635523511,
              "max_reward": 0.6672409575023548,
              "num_responses": 7,
              "rvariance": 0.08009244914165044
            },
            {
              "id": "chat_hard_sample_296",
              "rewards": [
                0.4818959677310107,
                0.06354584796140544,
                0.21711741091480483,
                -0.14298142635523511,
                -0.3548042718081998,
                0.2382996954601013
              ],
              "variance": 0.6089906806772734,
              "mean_reward": 0.08384553731731455,
              "min_reward": -0.3548042718081998,
              "max_reward": 0.4818959677310107,
              "num_responses": 6,
              "rvariance": 0.07405630471583598
            },
            {
              "id": "chat_hard_sample_338",
              "rewards": [
                -0.4395334099893856,
                -1.7316527672524702,
                -1.4668742104362642,
                -1.0750019463482796,
                -1.583376775435395,
                -1.4139184990730231,
                -1.4668742104362642
              ],
              "variance": 0.8218726403575032,
              "mean_reward": -1.311033116995869,
              "min_reward": -1.7316527672524702,
              "max_reward": -0.4395334099893856,
              "num_responses": 7,
              "rvariance": 0.16078181513691805
            },
            {
              "id": "chat_hard_sample_354",
              "rewards": [
                0.40775797182247303,
                0.6963665987521374,
                0.3918712584135007,
                0.6142852461391136,
                0.38128011614085244,
                0.6169330317072756,
                0.5507383925032242
              ],
              "variance": 0.26107165702077895,
              "mean_reward": 0.5227475164969395,
              "min_reward": 0.38128011614085244,
              "max_reward": 0.6963665987521374,
              "num_responses": 7,
              "rvariance": 0.01407733682344143
            },
            {
              "id": "chat_hard_sample_186",
              "rewards": [
                0.7890390936378094,
                0.587807390457493,
                0.2065262686421566,
                -0.1747548531731798,
                -0.03707000362875277,
                0.3918712584135007
              ],
              "variance": 0.7943356704486175,
              "mean_reward": 0.29390319239150453,
              "min_reward": -0.1747548531731798,
              "max_reward": 0.7890390936378094,
              "num_responses": 6,
              "rvariance": 0.11299255454402755
            },
            {
              "id": "chat_hard_sample_54",
              "rewards": [
                1.205237887633283,
                0.9320195143185606,
                0.6884232420476513,
                0.7307878111382441,
                1.039254829829124,
                0.773152380228837,
                1.0101291885793413
              ],
              "variance": 0.3918060694487807,
              "mean_reward": 0.9112864076821489,
              "min_reward": 0.6884232420476513,
              "max_reward": 1.205237887633283,
              "num_responses": 7,
              "rvariance": 0.030615984309993825
            },
            {
              "id": "chat_hard_sample_241",
              "rewards": [
                1.131927324714796,
                -0.5878094018064609,
                -0.5984005440791091,
                -0.5666271172611644,
                -1.000863950439742,
                -0.7890411049867774,
                -0.958499381349149
              ],
              "variance": 1.0882398685146066,
              "mean_reward": -0.48133059645822956,
              "min_reward": -1.000863950439742,
              "max_reward": 1.131927324714796,
              "num_responses": 7,
              "rvariance": 0.46103006250648465
            },
            {
              "id": "chat_hard_sample_67",
              "rewards": [
                1.4377465578375137,
                -0.3971688408987927,
                -1.1597310845294655,
                -0.8208145318047221,
                -0.6089916863517574,
                -0.8949525277132596,
                -0.6513562554423503
              ],
              "variance": 1.3376612690354723,
              "mean_reward": -0.44218119555754765,
              "min_reward": -1.1597310845294655,
              "max_reward": 1.4377465578375137,
              "num_responses": 7,
              "rvariance": 0.6387110487538684
            },
            {
              "id": "chat_hard_sample_262",
              "rewards": [
                0.8525859472736989,
                0.3018465490959907,
                0.5507383925032242,
                0.9306956215344795,
                0.021181278870812514,
                0.5295561079579277,
                0.5931029615938171
              ],
              "variance": 0.6942493759720917,
              "mean_reward": 0.539958122689993,
              "min_reward": 0.021181278870812514,
              "max_reward": 0.9306956215344795,
              "num_responses": 7,
              "rvariance": 0.08275532498563333
            },
            {
              "id": "chat_hard_sample_244",
              "rewards": [
                -0.8102233895320738,
                -1.774017336343063,
                -1.9011110436148417,
                -1.9858401817960276,
                -1.7951996208883594,
                -1.8163819054336559,
                -2.0493870354319172
              ],
              "variance": 0.6227591656317166,
              "mean_reward": -1.733165787577134,
              "min_reward": -2.0493870354319172,
              "max_reward": -0.8102233895320738,
              "num_responses": 7,
              "rvariance": 0.1509014962866327
            },
            {
              "id": "chat_hard_sample_85",
              "rewards": [
                1.1620458855526394,
                0.16945727068788777,
                0.06884141909772956,
                0.5983985327301412,
                -0.2065282799911245,
                0.2065262686421566,
                0.1429794150062672
              ],
              "variance": 0.8651639343969527,
              "mean_reward": 0.305960073103671,
              "min_reward": -0.2065282799911245,
              "max_reward": 1.1620458855526394,
              "num_responses": 7,
              "rvariance": 0.17033650436163342
            },
            {
              "id": "chat_hard_sample_398",
              "rewards": [
                0.4554181120493901,
                -0.7149031090782397,
                -0.7149031090782397,
                -0.2383017068090692,
                -0.5772182595338127,
                -0.7149031090782397,
                -0.5242625481705715
              ],
              "variance": 0.7540893298125544,
              "mean_reward": -0.43272481852839745,
              "min_reward": -0.7149031090782397,
              "max_reward": 0.4554181120493901,
              "num_responses": 7,
              "rvariance": 0.1563899264172071
            },
            {
              "id": "chat_hard_sample_319",
              "rewards": [
                -0.9690905236217973,
                -1.085593088620928,
                -0.7784499627141291,
                -0.9055436699859079,
                -1.4456919258909677,
                -1.2974159340738924,
                -0.8737702431679631
              ],
              "variance": 0.521084199814293,
              "mean_reward": -1.050793621153655,
              "min_reward": -1.4456919258909677,
              "max_reward": -0.7784499627141291,
              "num_responses": 7,
              "rvariance": 0.050179932622394334
            },
            {
              "id": "chat_hard_sample_190",
              "rewards": [
                0.40775797182247303,
                0.4024624006861489,
                0.4660092543220383,
                0.5136693945489553,
                0.6645931719341927,
                0.8075735926149439
              ],
              "variance": 0.3309731960202573,
              "mean_reward": 0.5436776309881254,
              "min_reward": 0.4024624006861489,
              "max_reward": 0.8075735926149439,
              "num_responses": 6,
              "rvariance": 0.02160173543505083
            },
            {
              "id": "chat_hard_sample_20",
              "rewards": [
                0.5348516790942518,
                0.3971668295498248,
                0.5083738234126313,
                0.2382996954601013,
                0.41834911409512127,
                0.6513542440933824,
                0.031772421143460745
              ],
              "variance": 0.42576391936045904,
              "mean_reward": 0.3971668295498248,
              "min_reward": 0.031772421143460745,
              "max_reward": 0.6513542440933824,
              "num_responses": 7,
              "rvariance": 0.036447983451069865
            },
            {
              "id": "chat_hard_sample_264",
              "rewards": [
                0.2753686934143701,
                -0.21711942226377273,
                -0.365395414080848,
                -0.047661145901401004,
                -0.1747548531731798,
                -0.2383017068090692,
                -0.2065282799911245
              ],
              "variance": 0.37068997954268834,
              "mean_reward": -0.13919887554357505,
              "min_reward": -0.365395414080848,
              "max_reward": 0.2753686934143701,
              "num_responses": 7,
              "rvariance": 0.036157251177208354
            },
            {
              "id": "chat_hard_sample_27",
              "rewards": [
                0.5772162481848447,
                0.25948198000539774,
                -0.10591242840096629,
                0.021181278870812514,
                0.35480226045923186,
                -0.5136714058979233,
                -0.5772182595338127
              ],
              "variance": 0.9828580029017561,
              "mean_reward": 0.0022685248125120833,
              "min_reward": -0.5772182595338127,
              "max_reward": 0.5772162481848447,
              "num_responses": 7,
              "rvariance": 0.16215191959287162
            },
            {
              "id": "chat_hard_sample_115",
              "rewards": [
                0.10591041705199838,
                -0.38657769862614444,
                -0.7360853936235362,
                -1.000863950439742,
                -0.8102233895320738,
                -1.085593088620928,
                -1.0644108040756315
              ],
              "variance": 0.8833012655388629,
              "mean_reward": -0.7111205582665797,
              "min_reward": -1.085593088620928,
              "max_reward": 0.10591041705199838,
              "num_responses": 7,
              "rvariance": 0.1617581719463821
            },
            {
              "id": "chat_hard_sample_260",
              "rewards": [
                0.6884232420476513,
                -0.4607156945346821,
                -0.6407651131697021,
                -1.1067753731662244,
                -0.6089916863517574,
                -1.180913369074762,
                -0.5348536904432197
              ],
              "variance": 1.135370451627891,
              "mean_reward": -0.5492273835275281,
              "min_reward": -1.180913369074762,
              "max_reward": 0.6884232420476513,
              "num_responses": 7,
              "rvariance": 0.32309398086498897
            },
            {
              "id": "chat_hard_sample_175",
              "rewards": [
                -0.09002571499199394,
                -1.1491399422568174,
                -0.5348536904432197,
                -0.4924891213526268,
                -0.7149031090782397,
                -0.22771056453642097,
                -0.8208145318047221
              ],
              "variance": 0.77950807126691,
              "mean_reward": -0.5757052392091486,
              "min_reward": -1.1491399422568174,
              "max_reward": -0.09002571499199394,
              "num_responses": 7,
              "rvariance": 0.1105515194434611
            },
            {
              "id": "chat_hard_sample_200",
              "rewards": [
                1.8508011064707948,
                0.9598212627842622,
                0.5454428213669,
                1.236380396796314
              ],
              "variance": 0.9967185397763418,
              "mean_reward": 1.148111396854568,
              "min_reward": 0.5454428213669,
              "max_reward": 1.8508011064707948,
              "num_responses": 4,
              "rvariance": 0.22505670770495045
            },
            {
              "id": "chat_hard_sample_240",
              "rewards": [
                0.19593512636950836,
                -0.4713068368073303,
                -0.7149031090782397,
                -0.21711942226377273
              ],
              "variance": 0.713842989176491,
              "mean_reward": -0.3018485604449586,
              "min_reward": -0.7149031090782397,
              "max_reward": 0.19593512636950836,
              "num_responses": 4,
              "rvariance": 0.11357444832246984
            },
            {
              "id": "chat_hard_sample_130",
              "rewards": [
                1.5992614774953993,
                0.26477755114172186,
                0.1429794150062672,
                0.15357055727891544,
                1.543657980563996,
                -0.3230308449902551,
                0.9306956215344795
              ],
              "variance": 1.6093240683288992,
              "mean_reward": 0.6159873940043605,
              "min_reward": -0.3230308449902551,
              "max_reward": 1.5992614774953993,
              "num_responses": 7,
              "rvariance": 0.4813016278399093
            },
            {
              "id": "chat_hard_sample_374",
              "rewards": [
                0.6434108873888962,
                -0.24889284908171744,
                -0.07413900158302159,
                0.3442111181865836,
                0.4554181120493901,
                0.3336199759139354,
                0.4024624006861489
              ],
              "variance": 0.6746557627676926,
              "mean_reward": 0.26515580622288787,
              "min_reward": -0.24889284908171744,
              "max_reward": 0.6434108873888962,
              "num_responses": 7,
              "rvariance": 0.08406197483358616
            },
            {
              "id": "chat_hard_sample_257",
              "rewards": [
                0.35480226045923186,
                0.3071421202323148,
                -0.2383017068090692,
                0.19063955523318424,
                -0.3230308449902551,
                -0.19593713771847626,
                -0.08473014385566982
              ],
              "variance": 0.5983995384046252,
              "mean_reward": 0.0015120146501800705,
              "min_reward": -0.3230308449902551,
              "max_reward": 0.35480226045923186,
              "num_responses": 7,
              "rvariance": 0.06617936460678822
            },
            {
              "id": "chat_hard_sample_237",
              "rewards": [
                -1.000863950439742,
                -1.4351007836183196,
                -0.6619473977149986,
                -0.7784499627141291,
                -0.6089916863517574,
                -1.0220462349850385,
                -1.096184230893576
              ],
              "variance": 0.5909857388137714,
              "mean_reward": -0.9433691781025086,
              "min_reward": -1.4351007836183196,
              "max_reward": -0.6089916863517574,
              "num_responses": 7,
              "rvariance": 0.07040757334554563
            },
            {
              "id": "chat_hard_sample_22",
              "rewards": [
                0.29125540682334244,
                0.44482696977674185,
                0.4554181120493901,
                0.38657568727717656,
                0.15357055727891544
              ],
              "variance": 0.24253715804364456,
              "mean_reward": 0.3463293466411133,
              "min_reward": 0.15357055727891544,
              "max_reward": 0.4554181120493901,
              "num_responses": 5,
              "rvariance": 0.0126821996319392
            },
            {
              "id": "chat_hard_sample_292",
              "rewards": [
                -0.2912574181723104,
                -1.043228519530335,
                -0.9267259545312043,
                -1.1067753731662244,
                -0.7572676781688327,
                -1.1491399422568174,
                -1.4351007836183196
              ],
              "variance": 0.6926607046311947,
              "mean_reward": -0.9584993813491491,
              "min_reward": -1.4351007836183196,
              "max_reward": -0.2912574181723104,
              "num_responses": 7,
              "rvariance": 0.11133901473644027
            },
            {
              "id": "chat_hard_sample_92",
              "rewards": [
                -0.11650357067361451,
                -0.7890411049867774,
                -0.3336219872629033,
                -0.7466765358961844,
                -0.6195828286244056,
                -0.6937208245329433
              ],
              "variance": 0.542796041473222,
              "mean_reward": -0.5498578086628046,
              "min_reward": -0.7890411049867774,
              "max_reward": -0.11650357067361451,
              "num_responses": 6,
              "rvariance": 0.059343038735624666
            },
            {
              "id": "chat_hard_sample_407",
              "rewards": [
                0.9320195143185606,
                0.72549224000192,
                1.0849291308799194,
                0.6725365286386789,
                0.9148089081255072
              ],
              "variance": 0.3300464710714006,
              "mean_reward": 0.8659572643929172,
              "min_reward": 0.6725365286386789,
              "max_reward": 1.0849291308799194,
              "num_responses": 5,
              "rvariance": 0.02236827727405798
            },
            {
              "id": "chat_hard_sample_44",
              "rewards": [
                0.3653934027318801,
                -0.2065282799911245,
                -0.4607156945346821,
                -0.3336219872629033,
                -0.18534599544582803,
                -0.41835112544408914
              ],
              "variance": 0.5295571136324116,
              "mean_reward": -0.20652827999112447,
              "min_reward": -0.4607156945346821,
              "max_reward": 0.3653934027318801,
              "num_responses": 6,
              "rvariance": 0.07552934505724743
            },
            {
              "id": "chat_hard_sample_119",
              "rewards": [
                0.6725365286386789,
                -0.18534599544582803,
                0.07413699023405368,
                0.3389155470502595,
                0.16416169955156365
              ],
              "variance": 0.6206409371771865,
              "mean_reward": 0.21288095400574553,
              "min_reward": -0.18534599544582803,
              "max_reward": 0.6725365286386789,
              "num_responses": 5,
              "rvariance": 0.08147522448843728
            },
            {
              "id": "chat_hard_sample_303",
              "rewards": [
                0.4660092543220383,
                -0.18534599544582803,
                0.16416169955156365,
                -0.11650357067361451,
                0.0052945654618401635,
                -0.2912574181723104,
                0.021181278870812514
              ],
              "variance": 0.5126112859961747,
              "mean_reward": 0.009077116273500245,
              "min_reward": -0.2912574181723104,
              "max_reward": 0.4660092543220383,
              "num_responses": 7,
              "rvariance": 0.05382438758292591
            },
            {
              "id": "chat_hard_sample_365",
              "rewards": [
                -0.7572676781688327,
                -1.000863950439742,
                -0.8525879586226667,
                -1.0538196618029831,
                -1.3609627877097819
              ],
              "variance": 0.4427097469966962,
              "mean_reward": -1.0051004073488012,
              "min_reward": -1.3609627877097819,
              "max_reward": -0.7572676781688327,
              "num_responses": 5,
              "rvariance": 0.04274213114942607
            },
            {
              "id": "chat_hard_sample_45",
              "rewards": [
                1.1676724298849837,
                0.2435952665964254,
                -0.16416371090053156,
                0.4660092543220383,
                -0.026478861356104534,
                0.15886612841523953,
                -0.545444832715868
              ],
              "variance": 1.0633506841738827,
              "mean_reward": 0.18572223917802613,
              "min_reward": -0.545444832715868,
              "max_reward": 1.1676724298849837,
              "num_responses": 7,
              "rvariance": 0.24984461400397226
            },
            {
              "id": "chat_hard_sample_78",
              "rewards": [
                -0.7360853936235362,
                -0.6513562554423503,
                -0.5136714058979233,
                -0.16416371090053156
              ],
              "variance": 0.44165063276943145,
              "mean_reward": -0.5163191914660853,
              "min_reward": -0.7360853936235362,
              "max_reward": -0.16416371090053156,
              "num_responses": 4,
              "rvariance": 0.04763817137970264
            },
            {
              "id": "chat_hard_sample_189",
              "rewards": [
                2.875494121349511,
                1.6654561166994508,
                0.7334355967064062,
                2.4730307149888784
              ],
              "variance": 1.7417133467370016,
              "mean_reward": 1.9368541374360617,
              "min_reward": 0.7334355967064062,
              "max_reward": 2.875494121349511,
              "num_responses": 4,
              "rvariance": 0.6726008528872338
            },
            {
              "id": "chat_hard_sample_39",
              "rewards": [
                0.6884232420476513,
                0.6222286028435997,
                0.8075735926149439,
                0.3971668295498248,
                1.4748155557917826
              ],
              "variance": 0.7207272316537124,
              "mean_reward": 0.7980415645695604,
              "min_reward": 0.3971668295498248,
              "max_reward": 1.4748155557917826,
              "num_responses": 5,
              "rvariance": 0.13234816441480582
            },
            {
              "id": "chat_hard_sample_387",
              "rewards": [
                -0.365395414080848,
                -1.2550513649832995,
                -1.4033273568003748,
                -1.4245096413456713,
                -1.456283068163616,
                -1.6045590599806914,
                -1.4245096413456713
              ],
              "variance": 0.6164044802681276,
              "mean_reward": -1.276233649528596,
              "min_reward": -1.6045590599806914,
              "max_reward": -0.365395414080848,
              "num_responses": 7,
              "rvariance": 0.14720209979403287
            },
            {
              "id": "chat_hard_sample_118",
              "rewards": [
                0.7916868792059715,
                -0.5666271172611644,
                -0.7784499627141291,
                -0.683129682260295,
                -0.6619473977149986,
                -0.5348536904432197
              ],
              "variance": 0.8592064168685879,
              "mean_reward": -0.4055534951979725,
              "min_reward": -0.7784499627141291,
              "max_reward": 0.7916868792059715,
              "num_responses": 6,
              "rvariance": 0.29298098577931775
            },
            {
              "id": "chat_hard_sample_154",
              "rewards": [
                1.5595446939729685,
                0.8658248751145091,
                1.0941963803684867,
                0.32832440477761127,
                0.8843593740916436,
                -0.5666271172611644,
                1.305688252625431
              ],
              "variance": 1.436887033202345,
              "mean_reward": 0.7816158376699265,
              "min_reward": -0.5666271172611644,
              "max_reward": 1.5595446939729685,
              "num_responses": 7,
              "rvariance": 0.43120162602552176
            },
            {
              "id": "chat_hard_sample_103",
              "rewards": [
                0.3389155470502595,
                0.06884141909772956,
                0.10061484591567427,
                0.0052945654618401635,
                0.2382996954601013,
                0.20123069750583247,
                -0.38657769862614444
              ],
              "variance": 0.43000037626951826,
              "mean_reward": 0.08094558169504183,
              "min_reward": -0.38657769862614444,
              "max_reward": 0.3389155470502595,
              "num_responses": 7,
              "rvariance": 0.04723025911947666
            },
            {
              "id": "chat_hard_sample_162",
              "rewards": [
                1.5224756960186996,
                0.19063955523318424,
                0.6619453863660306,
                0.47130482545836244
              ],
              "variance": 0.9894774668221615,
              "mean_reward": 0.7115913657690692,
              "min_reward": 0.19063955523318424,
              "max_reward": 1.5224756960186996,
              "num_responses": 4,
              "rvariance": 0.24728163266759604
            },
            {
              "id": "chat_hard_sample_321",
              "rewards": [
                0.8287558771602404,
                -0.06354785931037335,
                0.0794325613703778,
                0.19063955523318424,
                0.052954705688757216,
                0.0794325613703778,
                0.18534398409686012
              ],
              "variance": 0.43953240431490187,
              "mean_reward": 0.19328734080134627,
              "min_reward": -0.06354785931037335,
              "max_reward": 0.8287558771602404,
              "num_responses": 7,
              "rvariance": 0.07363910835412626
            },
            {
              "id": "chat_hard_sample_273",
              "rewards": [
                1.049845972101772,
                1.049845972101772,
                1.049845972101772,
                0.4871915388673348,
                1.049845972101772,
                0.4871915388673348,
                1.049845972101772
              ],
              "variance": 0.5626544332344373,
              "mean_reward": 0.8890875626062186,
              "min_reward": 0.4871915388673348,
              "max_reward": 1.049845972101772,
              "num_responses": 7,
              "rvariance": 0.06460816555885017
            },
            {
              "id": "chat_hard_sample_291",
              "rewards": [
                1.0862530236640004,
                0.40775797182247303,
                0.29655097795966656,
                0.12179713046097072,
                0.26477755114172186,
                0.1376838438699431,
                0.5295561079579277
              ],
              "variance": 0.6209057157340029,
              "mean_reward": 0.4063395152681005,
              "min_reward": 0.12179713046097072,
              "max_reward": 1.0862530236640004,
              "num_responses": 7,
              "rvariance": 0.09467146725286797
            },
            {
              "id": "chat_hard_sample_312",
              "rewards": [
                -1.3927362145277267,
                -1.3609627877097819,
                -1.6892881981618773,
                -1.3291893608918373,
                -1.318598218619189,
                -1.8587464745242488,
                -1.5621944908900984
              ],
              "variance": 0.43211860472404795,
              "mean_reward": -1.501673677903537,
              "min_reward": -1.8587464745242488,
              "max_reward": -1.318598218619189,
              "num_responses": 7,
              "rvariance": 0.037328192579414325
            },
            {
              "id": "chat_hard_sample_314",
              "rewards": [
                -0.09532128612831806,
                -0.4713068368073303,
                -0.45012455226203385,
                -0.41835112544408914,
                -0.5560359749885162,
                -1.0750019463482796
              ],
              "variance": 0.5586827548821943,
              "mean_reward": -0.5110236203297612,
              "min_reward": -1.0750019463482796,
              "max_reward": -0.09532128612831806,
              "num_responses": 6,
              "rvariance": 0.08446340094072073
            },
            {
              "id": "chat_hard_sample_399",
              "rewards": [
                0.3706889738682042,
                -0.6301739708970538,
                -0.8102233895320738,
                -0.7890411049867774,
                -0.6513562554423503,
                -0.725494251350888,
                -1.085593088620928
              ],
              "variance": 0.6905424761766652,
              "mean_reward": -0.6173132981374095,
              "min_reward": -1.085593088620928,
              "max_reward": 0.3706889738682042,
              "num_responses": 7,
              "rvariance": 0.18216666187925826
            },
            {
              "id": "chat_hard_sample_219",
              "rewards": [
                -0.6195828286244056,
                -1.9222933281601382,
                -1.9434756127054347,
                -1.498647637254209,
                -1.8587464745242488,
                -1.8375641899789523,
                -2.0493870354319172
              ],
              "variance": 0.8388184679937403,
              "mean_reward": -1.675671015239901,
              "min_reward": -2.0493870354319172,
              "max_reward": -0.6195828286244056,
              "num_responses": 7,
              "rvariance": 0.21122729849764252
            },
            {
              "id": "chat_hard_sample_406",
              "rewards": [
                0.7096055265929476,
                -0.22771056453642097,
                -0.03707000362875277,
                0.0794325613703778,
                0.16945727068788777,
                0.2435952665964254,
                0.2806642645506942
              ],
              "variance": 0.5655669973594157,
              "mean_reward": 0.17399633166187983,
              "min_reward": -0.22771056453642097,
              "max_reward": 0.7096055265929476,
              "num_responses": 7,
              "rvariance": 0.07399708677400887
            },
            {
              "id": "chat_hard_sample_253",
              "rewards": [
                1.1534405824561127,
                -0.08473014385566982,
                -0.37598655635349626,
                0.24889083773274953,
                0.5825118193211689,
                0.4660092543220383,
                0.19593512636950836
              ],
              "variance": 1.012116033429947,
              "mean_reward": 0.3122958457132016,
              "min_reward": -0.37598655635349626,
              "max_reward": 1.1534405824561127,
              "num_responses": 7,
              "rvariance": 0.20758446656576832
            },
            {
              "id": "chat_hard_sample_24",
              "rewards": [
                0.7281400255700821,
                1.0273397947723946,
                0.9426106565912088,
                0.6592976007978686,
                0.9121611225573452,
                0.6407631018207341
              ],
              "variance": 0.3349448743725003,
              "mean_reward": 0.8183853836849387,
              "min_reward": 0.6407631018207341,
              "max_reward": 1.0273397947723946,
              "num_responses": 6,
              "rvariance": 0.02214842931374296
            },
            {
              "id": "chat_hard_sample_60",
              "rewards": [
                0.7201966688655959,
                -0.05825228817404923,
                -0.31243970271760685,
                -0.4289422677167374,
                0.052954705688757216,
                -0.015887719083456302,
                -0.6619473977149986
              ],
              "variance": 0.8419958106755348,
              "mean_reward": -0.10061685726464219,
              "min_reward": -0.6619473977149986,
              "max_reward": 0.7201966688655959,
              "num_responses": 7,
              "rvariance": 0.16772161740629704
            },
            {
              "id": "chat_hard_sample_386",
              "rewards": [
                0.7652090235243509,
                0.18534398409686012,
                0.07413699023405368,
                0.6937188131839753,
                0.1376838438699431,
                0.360097831595556
              ],
              "variance": 0.6235535013021647,
              "mean_reward": 0.3693650810841232,
              "min_reward": 0.07413699023405368,
              "max_reward": 0.7652090235243509,
              "num_responses": 6,
              "rvariance": 0.07278053960787902
            },
            {
              "id": "chat_hard_sample_216",
              "rewards": [
                0.052954705688757216,
                -0.2700751336270139,
                0.20123069750583247,
                -0.2700751336270139,
                -0.3336219872629033,
                -0.16416371090053156
              ],
              "variance": 0.42894126204225347,
              "mean_reward": -0.13062509370381217,
              "min_reward": -0.3336219872629033,
              "max_reward": 0.20123069750583247,
              "num_responses": 6,
              "rvariance": 0.037509168968611575
            },
            {
              "id": "chat_hard_sample_300",
              "rewards": [
                1.4801111269281066,
                0.8419948050010506,
                1.628387118745182,
                2.398892719080341,
                1.7025251146537195,
                1.6919339723810713,
                1.7660719682896089
              ],
              "variance": 0.7943356704486177,
              "mean_reward": 1.6442738321541543,
              "min_reward": 0.8419948050010506,
              "max_reward": 2.398892719080341,
              "num_responses": 7,
              "rvariance": 0.18011465288726927
            },
            {
              "id": "chat_hard_sample_352",
              "rewards": [
                0.5666251059121965,
                0.5586817492077103,
                0.6407631018207341,
                0.49778268113998303,
                0.6672409575023548,
                0.6645931719341927
              ],
              "variance": 0.13768484954442706,
              "mean_reward": 0.5992811279195286,
              "min_reward": 0.49778268113998303,
              "max_reward": 0.6672409575023548,
              "num_responses": 6,
              "rvariance": 0.00393693595213829
            },
            {
              "id": "chat_hard_sample_311",
              "rewards": [
                -0.6513562554423503,
                -0.9267259545312043,
                -1.1491399422568174,
                -0.503080263625275,
                -1.127957657711521,
                -1.180913369074762,
                -0.9479082390765008
              ],
              "variance": 0.5698034542684751,
              "mean_reward": -0.9267259545312044,
              "min_reward": -1.180913369074762,
              "max_reward": -0.503080263625275,
              "num_responses": 7,
              "rvariance": 0.05861803625588639
            },
            {
              "id": "chat_hard_sample_419",
              "rewards": [
                0.5825118193211689,
                -0.37598655635349626,
                -0.24889284908171744,
                0.5639773203440345,
                -0.2594839913543657,
                0.360097831595556,
                -0.14298142635523511
              ],
              "variance": 0.8774761372889062,
              "mean_reward": 0.06846316401656354,
              "min_reward": -0.37598655635349626,
              "max_reward": 0.5825118193211689,
              "num_responses": 7,
              "rvariance": 0.1493342318536215
            },
            {
              "id": "chat_hard_sample_287",
              "rewards": [
                0.12179713046097072,
                -0.38657769862614444,
                -1.0056744839526915e-06,
                -0.3230308449902551,
                -0.34421312953555155,
                -0.11650357067361451,
                0.10591041705199838
              ],
              "variance": 0.473424059587376,
              "mean_reward": -0.13465981456958293,
              "min_reward": -0.38657769862614444,
              "max_reward": 0.12179713046097072,
              "num_responses": 7,
              "rvariance": 0.040709386032118544
            },
            {
              "id": "chat_hard_sample_55",
              "rewards": [
                -0.8102233895320738,
                -1.0644108040756315,
                -1.127957657711521,
                -1.127957657711521,
                -1.1067753731662244,
                -1.276233649528596,
                -1.2868247918012443
              ],
              "variance": 0.31773426817944705,
              "mean_reward": -1.1143404747895447,
              "min_reward": -1.2868247918012443,
              "max_reward": -0.8102233895320738,
              "num_responses": 7,
              "rvariance": 0.021624071329887622
            }
          ]
        },
        "semantic_benchmark_reasoning_filtered.json": {
          "file_name": "semantic_benchmark_reasoning_filtered.json",
          "processed_samples": 200,
          "global_mean": -3.342025093410326,
          "global_std": 14.101051038849779,
          "mean_variance": 0.6186844028690573,
          "mean_rvariance": 0.11091569494668048,
          "sample_results": [
            {
              "id": "reasoning_sample_9",
              "rewards": [
                1.7705790174522258,
                1.7971727797871637,
                1.9744645286867495,
                -0.525349130797412,
                -0.361354263065295,
                1.6642039681124743,
                2.1162979278064182
              ],
              "variance": 2.4581500984927587,
              "mean_reward": 1.2051449754260464,
              "min_reward": -0.525349130797412,
              "max_reward": 2.1162979278064182,
              "num_responses": 7,
              "rvariance": 1.1073613899019688
            },
            {
              "id": "reasoning_sample_5",
              "rewards": [
                1.7351206676723085,
                -0.8444742788166666,
                1.9655999412417702,
                1.7262560802273292,
                0.6159665027436724
              ],
              "variance": 2.1337061980065166,
              "mean_reward": 1.0396937826136827,
              "min_reward": -0.8444742788166666,
              "max_reward": 1.9655999412417702,
              "num_responses": 5,
              "rvariance": 1.1083845293945065
            },
            {
              "id": "reasoning_sample_85",
              "rewards": [
                -0.05995828993599892,
                -0.5918335366347567,
                -1.216786951505797,
                -0.013419205849857622
              ],
              "variance": 1.0019199959687848,
              "mean_reward": -0.47049949598160257,
              "min_reward": -1.216786951505797,
              "max_reward": -0.013419205849857622,
              "num_responses": 4,
              "rvariance": 0.23728334729557415
            },
            {
              "id": "reasoning_sample_65",
              "rewards": [
                1.690797730447412,
                1.34064652637073,
                -0.7602606980893633,
                -0.9331201532664596,
                1.4691830443229297,
                -1.0483597900511903,
                1.389401757318116
              ],
              "variance": 2.5370449267530746,
              "mean_reward": 0.4497554881503106,
              "min_reward": -1.0483597900511903,
              "max_reward": 1.690797730447412,
              "num_responses": 7,
              "rvariance": 1.4109819914227053
            },
            {
              "id": "reasoning_sample_256",
              "rewards": [
                -0.7425315231994046,
                -1.6156933865298653,
                -1.066088964941149,
                -1.5270475120800722
              ],
              "variance": 0.7495008684729995,
              "mean_reward": -1.2378403466876229,
              "min_reward": -1.6156933865298653,
              "max_reward": -0.7425315231994046,
              "num_responses": 4,
              "rvariance": 0.12531076799736618
            },
            {
              "id": "reasoning_sample_263",
              "rewards": [
                -0.09098434599342646,
                -0.16190104555326082,
                -0.8932295097640527,
                -0.3436250881753364,
                -1.1724640142809004,
                -0.4189740814576604
              ],
              "variance": 0.906404066249133,
              "mean_reward": -0.5135296808707729,
              "min_reward": -1.1724640142809004,
              "max_reward": -0.09098434599342646,
              "num_responses": 6,
              "rvariance": 0.15306033416824585
            },
            {
              "id": "reasoning_sample_203",
              "rewards": [
                -0.4943230747399844,
                -1.6511517363097823,
                -0.8577711599841356,
                -1.9880060592189956,
                -1.9880060592189956,
                -0.8577711599841356
              ],
              "variance": 1.3119589418569357,
              "mean_reward": -1.3061715415760047,
              "min_reward": -1.9880060592189956,
              "max_reward": -0.4943230747399844,
              "num_responses": 6,
              "rvariance": 0.35167194853081996
            },
            {
              "id": "reasoning_sample_61",
              "rewards": [
                0.27745006968852554,
                -0.14860416438579188,
                -1.1547348393909418,
                0.512915673695788,
                -0.4765938998500258,
                -0.4012449065677018,
                -0.37021885051027426
              ],
              "variance": 1.1194865869578225,
              "mean_reward": -0.25157584533148886,
              "min_reward": -1.1547348393909418,
              "max_reward": 0.512915673695788,
              "num_responses": 7,
              "rvariance": 0.25396073606902175
            },
            {
              "id": "reasoning_sample_319",
              "rewards": [
                0.8265004545619307,
                0.21373584742773682,
                -1.2345161263957554,
                0.34504254895649267,
                0.2599979131562225,
                0.14337318458321366
              ],
              "variance": 1.1313429726654824,
              "mean_reward": 0.09235563704830681,
              "min_reward": -1.2345161263957554,
              "max_reward": 0.8265004545619307,
              "num_responses": 6,
              "rvariance": 0.40147464058730603
            },
            {
              "id": "reasoning_sample_528",
              "rewards": [
                -0.6450210613046324,
                -1.1192764896110248,
                -1.1192764896110248,
                -1.402943287850362,
                -0.6450210613046324,
                -0.6450210613046324,
                -1.3497557631804864
              ],
              "variance": 0.7260097117438041,
              "mean_reward": -0.9894736020238278,
              "min_reward": -1.402943287850362,
              "max_reward": -0.6450210613046324,
              "num_responses": 7,
              "rvariance": 0.09862866491726874
            },
            {
              "id": "reasoning_sample_551",
              "rewards": [
                -0.17298177985948493,
                -0.9863076779363353,
                -0.7912867541467908,
                -0.4854584872950051,
                -1.5181829246350929,
                -0.7513961106443839,
                -0.8356096913716873
              ],
              "variance": 0.8385899722950414,
              "mean_reward": -0.7916033465555401,
              "min_reward": -1.5181829246350929,
              "max_reward": -0.17298177985948493,
              "num_responses": 7,
              "rvariance": 0.1493997511440406
            },
            {
              "id": "reasoning_sample_596",
              "rewards": [
                -1.5181829246350929,
                -1.4384016376302793,
                -0.6849117048070392,
                -0.6849117048070392,
                -1.4384016376302793,
                -0.8976618034865423,
                -1.4827245748551758
              ],
              "variance": 0.8119962099601035,
              "mean_reward": -1.163599426835921,
              "min_reward": -1.5181829246350929,
              "max_reward": -0.6849117048070392,
              "num_responses": 7,
              "rvariance": 0.1296585024399795
            },
            {
              "id": "reasoning_sample_456",
              "rewards": [
                0.028687584513794034,
                0.30653699724236383,
                -0.5430783056873706,
                -0.2062239827781573
              ],
              "variance": 0.6652041822383995,
              "mean_reward": -0.1035194266773425,
              "min_reward": -0.5430783056873706,
              "max_reward": 0.30653699724236383,
              "num_responses": 4,
              "rvariance": 0.09734629964158228
            },
            {
              "id": "reasoning_sample_306",
              "rewards": [
                -0.17076563299824013,
                -0.6804794110845496,
                -0.4278386689026397,
                -0.19292710161068835,
                -0.361354263065295,
                0.6314795307723862,
                -0.21065627650064694
              ],
              "variance": 0.6790273982854143,
              "mean_reward": -0.20179168905566766,
              "min_reward": -0.6804794110845496,
              "max_reward": 0.6314795307723862,
              "num_responses": 7,
              "rvariance": 0.14302287015900944
            },
            {
              "id": "reasoning_sample_231",
              "rewards": [
                -0.07768746482595751,
                -1.190193189170859,
                -0.1796302204432194,
                -0.5652397742998188,
                -0.5563751868548394,
                -0.11536196146711952,
                -0.24611462628056413
              ],
              "variance": 0.7149289774375801,
              "mean_reward": -0.41865748904891115,
              "min_reward": -1.190193189170859,
              "max_reward": -0.07768746482595751,
              "num_responses": 7,
              "rvariance": 0.13298195375716007
            },
            {
              "id": "reasoning_sample_526",
              "rewards": [
                0.2672003904552682,
                -0.18849480788819872,
                -0.4544324312375776,
                -0.2815729760604813,
                -0.6405887675821428
              ],
              "variance": 0.6510485441621983,
              "mean_reward": -0.25957771846262645,
              "min_reward": -0.6405887675821428,
              "max_reward": 0.2672003904552682,
              "num_responses": 5,
              "rvariance": 0.09323390524188091
            },
            {
              "id": "reasoning_sample_591",
              "rewards": [
                0.24219948367685004,
                -0.27714068233799166,
                -0.7248023483094461,
                0.07965896232242499,
                0.1356166705688568
              ],
              "variance": 0.7453040403545171,
              "mean_reward": -0.10889358281586121,
              "min_reward": -0.7248023483094461,
              "max_reward": 0.24219948367685004,
              "num_responses": 5,
              "rvariance": 0.12525087230741622
            },
            {
              "id": "reasoning_sample_23",
              "rewards": [
                -0.3879480254002329,
                -0.0954166397159161,
                -1.128141077056004,
                -0.5342137182423913,
                -0.6494533550271221,
                -0.8533388662616459
              ],
              "variance": 0.7490576391007505,
              "mean_reward": -0.6080852802838854,
              "min_reward": -1.128141077056004,
              "max_reward": -0.0954166397159161,
              "num_responses": 6,
              "rvariance": 0.10817753741452774
            },
            {
              "id": "reasoning_sample_275",
              "rewards": [
                -0.1685494861369953,
                -1.2699744761756726,
                -0.7159377608644668,
                -0.7159377608644668,
                -0.7159377608644668,
                -0.5652397742998188
              ],
              "variance": 0.6260614883016626,
              "mean_reward": -0.6919295032009812,
              "min_reward": -1.2699744761756726,
              "max_reward": -0.1685494861369953,
              "num_responses": 6,
              "rvariance": 0.10430701829339484
            },
            {
              "id": "reasoning_sample_656",
              "rewards": [
                -0.13530728321832294,
                -0.6051304178022257,
                -1.0838181398311075,
                -0.6494533550271221
              ],
              "variance": 0.6772544807964183,
              "mean_reward": -0.6184272989696946,
              "min_reward": -1.0838181398311075,
              "max_reward": -0.13530728321832294,
              "num_responses": 4,
              "rvariance": 0.11278325189513974
            },
            {
              "id": "reasoning_sample_405",
              "rewards": [
                0.8176358671169514,
                2.3024542641509833,
                2.355641788820859,
                1.7971727797871637,
                1.9390061789068325,
                2.5063397753855075
              ],
              "variance": 1.123586458651126,
              "mean_reward": 1.9530417756947163,
              "min_reward": 0.8176358671169514,
              "max_reward": 2.5063397753855075,
              "num_responses": 6,
              "rvariance": 0.3173255422026538
            },
            {
              "id": "reasoning_sample_330",
              "rewards": [
                -0.34805738189782603,
                -1.1547348393909418,
                -1.1458702519459625,
                -0.8533388662616459,
                -1.3674849380704448,
                -1.1547348393909418
              ],
              "variance": 0.6604117646509573,
              "mean_reward": -1.004036852826294,
              "min_reward": -1.3674849380704448,
              "max_reward": -0.34805738189782603,
              "num_responses": 6,
              "rvariance": 0.10844165658616461
            },
            {
              "id": "reasoning_sample_451",
              "rewards": [
                0.02203914393005956,
                -0.41454178773517075,
                -0.05995828993599892,
                0.05749749370997674,
                -0.3657865567877846,
                -1.1192764896110248,
                -1.278839063620652
              ],
              "variance": 1.2193240030569021,
              "mean_reward": -0.451266507150085,
              "min_reward": -1.278839063620652,
              "max_reward": 0.05749749370997674,
              "num_responses": 7,
              "rvariance": 0.2536786240850776
            },
            {
              "id": "reasoning_sample_314",
              "rewards": [
                -0.3303282070078674,
                -0.272708388615502,
                -0.11092966774462987,
                -1.004036852826294
              ],
              "variance": 0.6424609750748745,
              "mean_reward": -0.4295007790485733,
              "min_reward": -1.004036852826294,
              "max_reward": -0.11092966774462987,
              "num_responses": 4,
              "rvariance": 0.11649957644305842
            },
            {
              "id": "reasoning_sample_593",
              "rewards": [
                -0.23725003883558485,
                0.41762135866226063,
                -0.587401242912267,
                0.3854872291742107,
                0.3300835576430901
              ],
              "variance": 0.8521084681486348,
              "mean_reward": 0.061708172746341904,
              "min_reward": -0.587401242912267,
              "max_reward": 0.41762135866226063,
              "num_responses": 5,
              "rvariance": 0.1628502932555086
            },
            {
              "id": "reasoning_sample_599",
              "rewards": [
                0.28963887742537203,
                -0.09320049285467129,
                -0.18849480788819872,
                -1.3674849380704448,
                -0.18849480788819872,
                -0.18849480788819872,
                -0.18849480788819872
              ],
              "variance": 0.7200261152184433,
              "mean_reward": -0.2750036835789341,
              "min_reward": -1.3674849380704448,
              "max_reward": 0.28963887742537203,
              "num_responses": 7,
              "rvariance": 0.22504629365192422
            },
            {
              "id": "reasoning_sample_301",
              "rewards": [
                0.38991952289670034,
                -0.03336452760106104,
                -0.03336452760106104,
                -0.8976618034865423,
                0.02757951108317162,
                0.2105501363146974,
                -0.18849480788819872
              ],
              "variance": 0.7544594970750347,
              "mean_reward": -0.07497664232604197,
              "min_reward": -0.8976618034865423,
              "max_reward": 0.38991952289670034,
              "num_responses": 7,
              "rvariance": 0.14304744783598697
            },
            {
              "id": "reasoning_sample_77",
              "rewards": [
                0.08298318261429222,
                0.3129084194684427,
                0.9506046787916408,
                1.3628079949831782,
                1.3317819389257506,
                0.7733129298920549,
                1.1367610151362062
              ],
              "variance": 1.123254036621939,
              "mean_reward": 0.8501657371159379,
              "min_reward": 0.08298318261429222,
              "max_reward": 1.3628079949831782,
              "num_responses": 7,
              "rvariance": 0.2100145622944323
            },
            {
              "id": "reasoning_sample_511",
              "rewards": [
                1.314052764035792,
                0.3228810803440444,
                0.7888259579207686,
                0.7888259579207686,
                0.40210833063354684,
                0.48410576449960535,
                0.40210833063354684
              ],
              "variance": 0.6284992498490323,
              "mean_reward": 0.643272597998296,
              "min_reward": 0.3228810803440444,
              "max_reward": 1.314052764035792,
              "num_responses": 7,
              "rvariance": 0.10523182935666849
            },
            {
              "id": "reasoning_sample_12",
              "rewards": [
                2.7190898740650105,
                3.055944196974224,
                1.894683241681936,
                2.648173174505176,
                2.7722773987348863,
                2.018787465911646
              ],
              "variance": 0.957375444057764,
              "mean_reward": 2.5181592253121465,
              "min_reward": 1.894683241681936,
              "max_reward": 3.055944196974224,
              "num_responses": 6,
              "rvariance": 0.17485998844211928
            },
            {
              "id": "reasoning_sample_543",
              "rewards": [
                -0.07768746482595751,
                -0.5962658303572463,
                -0.23060159825185036,
                -0.6538856487496117,
                -0.1419557238020574,
                0.2467702865781675,
                0.02757951108317162
              ],
              "variance": 0.7345695789953626,
              "mean_reward": -0.20372092404648348,
              "min_reward": -0.6538856487496117,
              "max_reward": 0.2467702865781675,
              "num_responses": 7,
              "rvariance": 0.09051484977555165
            },
            {
              "id": "reasoning_sample_506",
              "rewards": [
                -0.4101094940126811,
                -1.066088964941149,
                -0.6538856487496117,
                -0.9685785030463767,
                -0.7779898729793219,
                -0.6450210613046324,
                -0.42340637518015006
              ],
              "variance": 0.589495065091123,
              "mean_reward": -0.7064399886019891,
              "min_reward": -1.066088964941149,
              "max_reward": -0.4101094940126811,
              "num_responses": 7,
              "rvariance": 0.0539482006441671
            },
            {
              "id": "reasoning_sample_531",
              "rewards": [
                0.733422286389648,
                -0.08211975854844716,
                -0.05995828993599892,
                -0.11092966774462987,
                0.2670618812764404,
                0.4076486977866589,
                0.20611784259220775
              ],
              "variance": 0.6316018554547749,
              "mean_reward": 0.19446328454512557,
              "min_reward": -0.11092966774462987,
              "max_reward": 0.733422286389648,
              "num_responses": 7,
              "rvariance": 0.08226065480792064
            },
            {
              "id": "reasoning_sample_274",
              "rewards": [
                0.9240109164567029,
                0.658073293107324,
                0.822068160839441,
                0.42759401953786236,
                -0.08433590540969199
              ],
              "variance": 0.7627977496404684,
              "mean_reward": 0.5494820969063277,
              "min_reward": -0.08433590540969199,
              "max_reward": 0.9240109164567029,
              "num_responses": 5,
              "rvariance": 0.12858980205623177
            },
            {
              "id": "reasoning_sample_597",
              "rewards": [
                -0.06882287738097823,
                0.19794580104136747,
                0.19794580104136747,
                0.3489208059636711,
                0.19794580104136747,
                0.19794580104136747,
                -0.9597139156013974
              ],
              "variance": 0.6835150956794347,
              "mean_reward": 0.016023888163823625,
              "min_reward": -0.9597139156013974,
              "max_reward": 0.3489208059636711,
              "num_responses": 7,
              "rvariance": 0.17178084610581837
            },
            {
              "id": "reasoning_sample_73",
              "rewards": [
                1.84149571701206,
                1.868089479346998,
                1.8858186542369566,
                1.992193703576708,
                -0.15303645810828154,
                2.3999647260457557,
                2.355641788820859
              ],
              "variance": 1.3296881167468941,
              "mean_reward": 1.741452515847294,
              "min_reward": -0.15303645810828154,
              "max_reward": 2.3999647260457557,
              "num_responses": 7,
              "rvariance": 0.6442447934595327
            },
            {
              "id": "reasoning_sample_412",
              "rewards": [
                0.3644338339923849,
                0.5118076002651657,
                0.5118076002651657,
                0.512915673695788,
                -0.7159377608644668,
                0.5118076002651657
              ],
              "variance": 0.6881136004165178,
              "mean_reward": 0.2828057579365339,
              "min_reward": -0.7159377608644668,
              "max_reward": 0.512915673695788,
              "num_responses": 6,
              "rvariance": 0.20240464397467306
            },
            {
              "id": "reasoning_sample_491",
              "rewards": [
                0.191297360457633,
                -0.0954166397159161,
                -0.4278386689026397,
                0.10569868794205166,
                -0.35692196934280535,
                0.23262503669037826,
                -0.7868544604243012
              ],
              "variance": 0.7792734164620354,
              "mean_reward": -0.16248723618508562,
              "min_reward": -0.7868544604243012,
              "max_reward": 0.23262503669037826,
              "num_responses": 7,
              "rvariance": 0.12225001183095403
            },
            {
              "id": "reasoning_sample_64",
              "rewards": [
                1.34064652637073,
                1.9212770040168738,
                1.6730685555574536,
                2.2758605018160454,
                1.3317819389257506,
                1.8149019546771221,
                2.4442876632706523
              ],
              "variance": 1.0061306750051502,
              "mean_reward": 1.8288320206620894,
              "min_reward": 1.3317819389257506,
              "max_reward": 2.4442876632706523,
              "num_responses": 7,
              "rvariance": 0.15671519290276387
            },
            {
              "id": "reasoning_sample_535",
              "rewards": [
                0.6226149433274069,
                -0.6583179424721014,
                -0.6139950052472049,
                -0.4012449065677018,
                -0.5563751868548394,
                -0.5563751868548394
              ],
              "variance": 0.7468414922395057,
              "mean_reward": -0.36061554744488,
              "min_reward": -0.6583179424721014,
              "max_reward": 0.6226149433274069,
              "num_responses": 6,
              "rvariance": 0.19964408021533697
            },
            {
              "id": "reasoning_sample_548",
              "rewards": [
                -0.24833077314180896,
                -1.066088964941149,
                -0.6405887675821428,
                -0.7957190478692805,
                -0.6139950052472049,
                -0.6139950052472049,
                -0.9685785030463767
              ],
              "variance": 0.5398533753992392,
              "mean_reward": -0.7067565810107383,
              "min_reward": -1.066088964941149,
              "max_reward": -0.24833077314180896,
              "num_responses": 7,
              "rvariance": 0.06247523174851066
            },
            {
              "id": "reasoning_sample_235",
              "rewards": [
                -0.13530728321832294,
                -1.1547348393909418,
                -0.512052249629943,
                -0.4544324312375776,
                -0.7779898729793219
              ],
              "variance": 0.741079510400269,
              "mean_reward": -0.6069033352912215,
              "min_reward": -1.1547348393909418,
              "max_reward": -0.13530728321832294,
              "num_responses": 5,
              "rvariance": 0.11680738032541327
            },
            {
              "id": "reasoning_sample_156",
              "rewards": [
                0.15999428604254984,
                -0.5696720680223084,
                -0.31924747270164333,
                -0.8710680411516045,
                -0.6317241801371635,
                -0.31924747270164333
              ],
              "variance": 0.6717695173148373,
              "mean_reward": -0.4251608247786356,
              "min_reward": -0.8710680411516045,
              "max_reward": 0.15999428604254984,
              "num_responses": 6,
              "rvariance": 0.10453782413846979
            },
            {
              "id": "reasoning_sample_587",
              "rewards": [
                -0.0577421430747541,
                -0.4455678437925983,
                -1.0838181398311075,
                -0.31259903211790885,
                -0.42340637518015006,
                -0.42340637518015006,
                -0.44113555007010863
              ],
              "variance": 0.49021168570735496,
              "mean_reward": -0.4553822084638254,
              "min_reward": -1.0838181398311075,
              "max_reward": -0.0577421430747541,
              "num_responses": 7,
              "rvariance": 0.08225436767731076
            },
            {
              "id": "reasoning_sample_594",
              "rewards": [
                0.06968630144682328,
                -0.05330984935226445,
                -0.16411719241450565,
                -0.5209168370749223,
                -0.5741043617447981,
                -0.05330984935226445,
                -0.49875536846247404
              ],
              "variance": 0.5380804579102433,
              "mean_reward": -0.2564038795649151,
              "min_reward": -0.5741043617447981,
              "max_reward": 0.06968630144682328,
              "num_responses": 7,
              "rvariance": 0.06099727917605495
            },
            {
              "id": "reasoning_sample_622",
              "rewards": [
                0.35335309968616074,
                0.38991952289670034,
                -0.3524896756203157,
                -0.35692196934280535,
                -0.22395315766811588,
                -0.0300403073091938,
                -0.22395315766811588
              ],
              "variance": 0.7222422620796882,
              "mean_reward": -0.06344080643224079,
              "min_reward": -0.35692196934280535,
              "max_reward": 0.38991952289670034,
              "num_responses": 7,
              "rvariance": 0.08593960189844708
            },
            {
              "id": "reasoning_sample_647",
              "rewards": [
                0.6514248525235895,
                0.4940784253752071,
                0.5040510862508087,
                0.5040510862508087,
                -0.7115054671419772
              ],
              "variance": 0.8217472561495807,
              "mean_reward": 0.2884199966516874,
              "min_reward": -0.7115054671419772,
              "max_reward": 0.6514248525235895,
              "num_responses": 5,
              "rvariance": 0.25338247628759825
            },
            {
              "id": "reasoning_sample_395",
              "rewards": [
                -0.12201040205085399,
                -0.24611462628056413,
                -0.6272918864146738,
                0.31844878662155474,
                -0.5652397742998188,
                -0.18406251416570907
              ],
              "variance": 0.6944850226425967,
              "mean_reward": -0.23771173609834417,
              "min_reward": -0.6272918864146738,
              "max_reward": 0.31844878662155474,
              "num_responses": 6,
              "rvariance": 0.09744958043973871
            },
            {
              "id": "reasoning_sample_252",
              "rewards": [
                0.30764507067298624,
                0.31955686005217715,
                0.5173479674182777,
                0.5173479674182777,
                0.21498243003718703,
                -0.4101094940126811
              ],
              "variance": 0.6149114994060247,
              "mean_reward": 0.24446180026437078,
              "min_reward": -0.4101094940126811,
              "max_reward": 0.5173479674182777,
              "num_responses": 6,
              "rvariance": 0.09798295444541479
            },
            {
              "id": "reasoning_sample_497",
              "rewards": [
                -0.09098434599342646,
                0.41208099150914856,
                0.6425602650786103,
                1.0259536720739648,
                0.9683338536815994,
                0.9683338536815994,
                0.6425602650786103
              ],
              "variance": 0.7805269245304269,
              "mean_reward": 0.6526912221585867,
              "min_reward": -0.09098434599342646,
              "max_reward": 1.0259536720739648,
              "num_responses": 7,
              "rvariance": 0.13567675778978325
            },
            {
              "id": "reasoning_sample_87",
              "rewards": [
                0.27094013828361885,
                0.8575265106193581,
                0.9417400913466615,
                0.9771984411265786,
                -0.16411719241450565,
                0.822068160839441,
                0.746719167557117
              ],
              "variance": 0.8590062252542592,
              "mean_reward": 0.63601075962261,
              "min_reward": -0.16411719241450565,
              "max_reward": 0.9771984411265786,
              "num_responses": 7,
              "rvariance": 0.15418624179386314
            },
            {
              "id": "reasoning_sample_299",
              "rewards": [
                -0.04666140876852998,
                -0.9685785030463767,
                -0.37021885051027426,
                -0.9065263909315217,
                -0.2616276543092779,
                -0.915390978376501,
                -0.48102619357251547
              ],
              "variance": 0.7610248321514725,
              "mean_reward": -0.564289997073571,
              "min_reward": -0.9685785030463767,
              "max_reward": -0.04666140876852998,
              "num_responses": 7,
              "rvariance": 0.11542673778208472
            },
            {
              "id": "reasoning_sample_303",
              "rewards": [
                -0.7159377608644668,
                -0.7602606980893633,
                -0.8400419850941769,
                -0.7602606980893633,
                -1.3497557631804864
              ],
              "variance": 0.4122033161915373,
              "mean_reward": -0.8852513810635714,
              "min_reward": -1.3497557631804864,
              "max_reward": -0.7159377608644668,
              "num_responses": 5,
              "rvariance": 0.05554413082707582
            },
            {
              "id": "reasoning_sample_509",
              "rewards": [
                -0.46329701868255685,
                -0.5962658303572463,
                -0.6760471173620599,
                -0.512052249629943,
                -0.9508493281564181,
                -0.9951722653813146,
                -0.3170313258403985
              ],
              "variance": 0.5637877615006832,
              "mean_reward": -0.6443878764871338,
              "min_reward": -0.9951722653813146,
              "max_reward": -0.3170313258403985,
              "num_responses": 7,
              "rvariance": 0.053965039410717765
            },
            {
              "id": "reasoning_sample_572",
              "rewards": [
                0.8530942168968685,
                0.5716435655187759,
                1.327349645203261,
                1.3362142326482402,
                1.1589224837486543,
                0.42759401953786236,
                0.7843936641982789
              ],
              "variance": 0.8168717330548422,
              "mean_reward": 0.9227445468217058,
              "min_reward": 0.42759401953786236,
              "max_reward": 1.3362142326482402,
              "num_responses": 7,
              "rvariance": 0.11184008050679703
            },
            {
              "id": "reasoning_sample_557",
              "rewards": [
                0.6314795307723862,
                0.04530868597313021,
                0.04530868597313021,
                -0.1862786610269539,
                -0.01785149957234727,
                -0.038904894754173094,
                -0.3391927944528467
              ],
              "variance": 0.5272213382901438,
              "mean_reward": 0.019981293273189378,
              "min_reward": -0.3391927944528467,
              "max_reward": 0.6314795307723862,
              "num_responses": 7,
              "rvariance": 0.07880873507188468
            },
            {
              "id": "reasoning_sample_678",
              "rewards": [
                1.2918912954233437,
                0.31401649289906514,
                0.709044670915955,
                -0.032256454170438625,
                0.1295222667004335,
                0.1295222667004335,
                0.4519716350115554
              ],
              "variance": 0.877372542366826,
              "mean_reward": 0.42767316764004965,
              "min_reward": -0.032256454170438625,
              "max_reward": 1.2918912954233437,
              "num_responses": 7,
              "rvariance": 0.1755534752793908
            },
            {
              "id": "reasoning_sample_53",
              "rewards": [
                3.641006968342857,
                3.516902744113147,
                4.190611389931574,
                4.438819838390994,
                4.279257264381366,
                4.403361488611076,
                4.190611389931574
              ],
              "variance": 0.8261795498720703,
              "mean_reward": 4.0943672976717975,
              "min_reward": 3.516902744113147,
              "max_reward": 4.438819838390994,
              "num_responses": 7,
              "rvariance": 0.11511943029253542
            },
            {
              "id": "reasoning_sample_75",
              "rewards": [
                0.29213204264427245,
                -0.3148151789791537,
                -0.22395315766811588,
                -0.4898907810174948,
                0.7888259579207686,
                -0.3879480254002329
              ],
              "variance": 0.9793984034913843,
              "mean_reward": -0.05594152374999269,
              "min_reward": -0.4898907810174948,
              "max_reward": 0.7888259579207686,
              "num_responses": 6,
              "rvariance": 0.20476184320589577
            },
            {
              "id": "reasoning_sample_595",
              "rewards": [
                0.3843791557435883,
                0.7910421047820134,
                -0.15525260496952636,
                0.5173479674182777,
                0.5539143906288173
              ],
              "variance": 0.6355909198050155,
              "mean_reward": 0.41828620272063405,
              "min_reward": -0.15525260496952636,
              "max_reward": 0.7910421047820134,
              "num_responses": 5,
              "rvariance": 0.09945033057264316
            },
            {
              "id": "reasoning_sample_245",
              "rewards": [
                -0.6450210613046324,
                -1.163599426835921,
                -1.190193189170859,
                -1.0129014402712733,
                -1.0749535523861282
              ],
              "variance": 0.3873824713455952,
              "mean_reward": -1.017333733993763,
              "min_reward": -1.190193189170859,
              "max_reward": -0.6450210613046324,
              "num_responses": 5,
              "rvariance": 0.03864609181817085
            },
            {
              "id": "reasoning_sample_418",
              "rewards": [
                -1.1813286017258797,
                -1.580235036749948,
                -1.4738599874101965,
                -1.3674849380704448,
                -1.4738599874101965,
                -1.580235036749948,
                -1.819578897764389
              ],
              "variance": 0.3829501776231057,
              "mean_reward": -1.496654640840143,
              "min_reward": -1.819578897764389,
              "max_reward": -1.1813286017258797,
              "num_responses": 7,
              "rvariance": 0.033629422339720105
            },
            {
              "id": "reasoning_sample_60",
              "rewards": [
                1.2165423021410198,
                -0.2993021509504399,
                0.09794217392769478,
                0.1372787807147904,
                0.3345158513655797,
                0.5539143906288173
              ],
              "variance": 0.9859083348962911,
              "mean_reward": 0.3401485579712437,
              "min_reward": -0.2993021509504399,
              "max_reward": 1.2165423021410198,
              "num_responses": 6,
              "rvariance": 0.22041847359189795
            },
            {
              "id": "reasoning_sample_385",
              "rewards": [
                -0.12644269577334363,
                -0.5563751868548394,
                -0.3879480254002329,
                -0.12865884263458846,
                -0.7558284043668736,
                -0.39681261284521213,
                -0.37908343795525357
              ],
              "variance": 0.5083840899695626,
              "mean_reward": -0.39016417226147765,
              "min_reward": -0.7558284043668736,
              "max_reward": -0.12644269577334363,
              "num_responses": 7,
              "rvariance": 0.04277748319137203
            },
            {
              "id": "reasoning_sample_243",
              "rewards": [
                -0.13530728321832294,
                -1.1015473147210662,
                -0.7380992294769151,
                -0.8400419850941769,
                -0.6450210613046324,
                -0.8223128102042183
              ],
              "variance": 0.5806304776461438,
              "mean_reward": -0.713721614003222,
              "min_reward": -1.1015473147210662,
              "max_reward": -0.13530728321832294,
              "num_responses": 6,
              "rvariance": 0.08633913838613738
            },
            {
              "id": "reasoning_sample_71",
              "rewards": [
                1.8769540667919773,
                0.6292633839111413,
                1.9833291161317288,
                2.258131326926087,
                2.2138083897011906,
                2.160620865031315,
                1.9035478291269152
              ],
              "variance": 0.8536597709515061,
              "mean_reward": 1.860807853945765,
              "min_reward": 0.6292633839111413,
              "max_reward": 2.258131326926087,
              "num_responses": 7,
              "rvariance": 0.27230911558131576
            },
            {
              "id": "reasoning_sample_218",
              "rewards": [
                0.13894089086072403,
                -0.21952086394562625,
                -0.2616276543092779,
                -0.5652397742998188,
                -0.23946618569682965,
                -0.4101094940126811,
                0.02647143765254921
              ],
              "variance": 0.5436208250633553,
              "mean_reward": -0.21865023482156576,
              "min_reward": -0.5652397742998188,
              "max_reward": 0.13894089086072403,
              "num_responses": 7,
              "rvariance": 0.04957401781153264
            },
            {
              "id": "reasoning_sample_32",
              "rewards": [
                0.2504407798171042,
                1.7617144300072465,
                1.9124124165718945,
                1.9567353537967909
              ],
              "variance": 1.2396155977551748,
              "mean_reward": 1.470325745048259,
              "min_reward": 0.2504407798171042,
              "max_reward": 1.9567353537967909,
              "num_responses": 4,
              "rvariance": 0.5012654066852226
            },
            {
              "id": "reasoning_sample_55",
              "rewards": [
                0.008742262762590618,
                -0.2704922417542572,
                0.28880782235240526,
                -0.915390978376501,
                -0.6671825299170807,
                -0.6405887675821428,
                -0.7513961106443839
              ],
              "variance": 0.9377625443357474,
              "mean_reward": -0.4210715061656242,
              "min_reward": -0.915390978376501,
              "max_reward": 0.28880782235240526,
              "num_responses": 7,
              "rvariance": 0.16765245727012007
            },
            {
              "id": "reasoning_sample_403",
              "rewards": [
                -0.2993021509504399,
                -0.9242555658214803,
                -1.0129014402712733,
                -1.0926827272760868,
                -1.2345161263957554,
                -1.0926827272760868,
                -1.252245301285714
              ],
              "variance": 0.567333596478675,
              "mean_reward": -0.9869408627538337,
              "min_reward": -1.252245301285714,
              "max_reward": -0.2993021509504399,
              "num_responses": 7,
              "rvariance": 0.09021329087207651
            },
            {
              "id": "reasoning_sample_580",
              "rewards": [
                0.9018494478442547,
                0.32454319048997804,
                0.12176575268607663,
                0.12342786283201025
              ],
              "variance": 0.606393184908115,
              "mean_reward": 0.3678965634630799,
              "min_reward": 0.12176575268607663,
              "max_reward": 0.9018494478442547,
              "num_responses": 4,
              "rvariance": 0.10183262982227739
            },
            {
              "id": "reasoning_sample_530",
              "rewards": [
                -0.8622034537066252,
                -1.4915891623001551,
                -1.216786951505797,
                -1.0749535523861282,
                -1.1458702519459625
              ],
              "variance": 0.43436478480398544,
              "mean_reward": -1.1582806743689333,
              "min_reward": -1.4915891623001551,
              "max_reward": -0.8622034537066252,
              "num_responses": 5,
              "rvariance": 0.04185533620583678
            },
            {
              "id": "reasoning_sample_318",
              "rewards": [
                0.9993599097390269,
                0.29213204264427245,
                0.32675933735122287,
                0.47634925048524845,
                0.06968630144682328,
                0.08298318261429222,
                -0.09320049285467129
              ],
              "variance": 0.6810219304605345,
              "mean_reward": 0.30772421877517353,
              "min_reward": -0.09320049285467129,
              "max_reward": 0.9993599097390269,
              "num_responses": 7,
              "rvariance": 0.1107587128351616
            },
            {
              "id": "reasoning_sample_76",
              "rewards": [
                1.1411933088586959,
                2.4531522507156316,
                1.1810839523611025,
                1.2741621205333853,
                2.080839578026501,
                1.7085269053373706,
                1.4248601070980331
              ],
              "variance": 1.0646369521420136,
              "mean_reward": 1.6091168889901029,
              "min_reward": 1.1411933088586959,
              "max_reward": 2.4531522507156316,
              "num_responses": 7,
              "rvariance": 0.21330146697319893
            },
            {
              "id": "reasoning_sample_393",
              "rewards": [
                0.29213204264427245,
                -0.39238031912272253,
                -0.3524896756203157,
                -0.45886472496006725,
                -0.15303645810828154,
                -0.016743426141724856
              ],
              "variance": 0.5633168302926687,
              "mean_reward": -0.18023042688480653,
              "min_reward": -0.45886472496006725,
              "max_reward": 0.29213204264427245,
              "num_responses": 6,
              "rvariance": 0.06715195193079529
            },
            {
              "id": "reasoning_sample_642",
              "rewards": [
                0.05528134684873192,
                -0.7691252855343426,
                -0.5785366554672877,
                -0.46329701868255685,
                -1.066088964941149,
                -0.915390978376501
              ],
              "variance": 0.7867321357419126,
              "mean_reward": -0.6228595926921843,
              "min_reward": -1.066088964941149,
              "max_reward": 0.05528134684873192,
              "num_responses": 6,
              "rvariance": 0.13178673543457511
            },
            {
              "id": "reasoning_sample_16",
              "rewards": [
                0.3045978687387746,
                -0.8400419850941769,
                -0.2594115074480331,
                -0.03558067446230586,
                0.10514465122674045,
                0.07522666859993533
              ],
              "variance": 0.7545980062538626,
              "mean_reward": -0.10834416307317758,
              "min_reward": -0.8400419850941769,
              "max_reward": 0.3045978687387746,
              "num_responses": 6,
              "rvariance": 0.13554906937848268
            },
            {
              "id": "reasoning_sample_260",
              "rewards": [
                -0.06217443679724375,
                -0.9508493281564181,
                -0.512052249629943,
                -0.7203700545869565,
                -0.512052249629943,
                -0.39681261284521213,
                -0.46329701868255685
              ],
              "variance": 0.5496044215887165,
              "mean_reward": -0.5168011357611818,
              "min_reward": -0.9508493281564181,
              "max_reward": -0.06217443679724375,
              "num_responses": 7,
              "rvariance": 0.06483265906560119
            },
            {
              "id": "reasoning_sample_582",
              "rewards": [
                -0.06217443679724375,
                -0.2505469200030538,
                -0.2505469200030538,
                -0.06217443679724375,
                -0.5608074805773291
              ],
              "variance": 0.3745288195503752,
              "mean_reward": -0.23725003883558485,
              "min_reward": -0.5608074805773291,
              "max_reward": -0.06217443679724375,
              "num_responses": 5,
              "rvariance": 0.033269193012440204
            },
            {
              "id": "reasoning_sample_295",
              "rewards": [
                0.21248926481828662,
                -0.3657865567877846,
                -0.3524896756203157,
                -0.197359395333178,
                -0.525349130797412,
                -0.11757810832836435
              ],
              "variance": 0.49302342203755944,
              "mean_reward": -0.22434560034146137,
              "min_reward": -0.525349130797412,
              "max_reward": 0.21248926481828662,
              "num_responses": 6,
              "rvariance": 0.05499697092785347
            },
            {
              "id": "reasoning_sample_366",
              "rewards": [
                -0.1131458146058747,
                -0.3657865567877846,
                -0.6361564738596531,
                -0.3148151789791537,
                -0.6450210613046324,
                -0.3391927944528467,
                -0.44113555007010863
              ],
              "variance": 0.4055548756078029,
              "mean_reward": -0.4078933471514362,
              "min_reward": -0.6450210613046324,
              "max_reward": -0.1131458146058747,
              "num_responses": 7,
              "rvariance": 0.03021015042240605
            },
            {
              "id": "reasoning_sample_286",
              "rewards": [
                -0.1862786610269539,
                -0.2062239827781573,
                -0.7602606980893633,
                -0.6228595926921842,
                -0.37021885051027426,
                -0.7602606980893633,
                -0.5209168370749223
              ],
              "variance": 0.5620148440116873,
              "mean_reward": -0.4895741886087455,
              "min_reward": -0.7602606980893633,
              "max_reward": -0.1862786610269539,
              "num_responses": 7,
              "rvariance": 0.050258706616016495
            },
            {
              "id": "reasoning_sample_356",
              "rewards": [
                -0.29265371036670546,
                -0.6583179424721014,
                -0.286005269782971,
                0.09184777005927151,
                -0.13973957694081257,
                -0.13973957694081257
              ],
              "variance": 0.4515399229786329,
              "mean_reward": -0.23743471774068856,
              "min_reward": -0.6583179424721014,
              "max_reward": 0.09184777005927151,
              "num_responses": 6,
              "rvariance": 0.051677760396030524
            },
            {
              "id": "reasoning_sample_343",
              "rewards": [
                -0.4544324312375776,
                -1.0926827272760868,
                -0.525349130797412,
                -0.9065263909315217,
                -1.0129014402712733
              ],
              "variance": 0.5779711014126501,
              "mean_reward": -0.7983784241027744,
              "min_reward": -1.0926827272760868,
              "max_reward": -0.4544324312375776,
              "num_responses": 5,
              "rvariance": 0.0674349942144805
            },
            {
              "id": "reasoning_sample_205",
              "rewards": [
                0.8530942168968685,
                0.30903016246126425,
                0.17883153436313085,
                -0.10871352088338505,
                0.4608362224565347,
                0.4608362224565347,
                0.4608362224565347
              ],
              "variance": 0.5539259079681439,
              "mean_reward": 0.3735358657439261,
              "min_reward": -0.10871352088338505,
              "max_reward": 0.8530942168968685,
              "num_responses": 7,
              "rvariance": 0.075353643189118
            },
            {
              "id": "reasoning_sample_512",
              "rewards": [
                1.0215213783514752,
                1.3716725824281575,
                2.142891690141356,
                2.142891690141356,
                1.4691830443229297,
                1.5223705689928055
              ],
              "variance": 0.9462947097515397,
              "mean_reward": 1.6117551590630133,
              "min_reward": 1.0215213783514752,
              "max_reward": 2.142891690141356,
              "num_responses": 6,
              "rvariance": 0.16642400027200285
            },
            {
              "id": "reasoning_sample_226",
              "rewards": [
                0.10791483480329649,
                -0.5785366554672877,
                -1.0483597900511903,
                -0.20844012963940212,
                -0.32811206014662264,
                0.07190244830806809,
                0.07190244830806809
              ],
              "variance": 0.8527733122070081,
              "mean_reward": -0.27310412912643856,
              "min_reward": -1.0483597900511903,
              "max_reward": 0.10791483480329649,
              "num_responses": 7,
              "rvariance": 0.1549646001525487
            },
            {
              "id": "reasoning_sample_225",
              "rewards": [
                -0.18849480788819872,
                -0.10871352088338505,
                -0.6494533550271221,
                -0.10871352088338505,
                -0.45000013751508794,
                -0.8577711599841356
              ],
              "variance": 0.6448987366222437,
              "mean_reward": -0.3938577503635525,
              "min_reward": -0.8577711599841356,
              "max_reward": -0.10871352088338505,
              "num_responses": 6,
              "rvariance": 0.08141418895633597
            },
            {
              "id": "reasoning_sample_508",
              "rewards": [
                -0.8755003348740941,
                -1.4206724627403207,
                -1.3497557631804864,
                -1.190193189170859,
                -1.340891175735507
              ],
              "variance": 0.3909283063235869,
              "mean_reward": -1.2354025851402535,
              "min_reward": -1.4206724627403207,
              "max_reward": -0.8755003348740941,
              "num_responses": 5,
              "rvariance": 0.03802058777003617
            },
            {
              "id": "reasoning_sample_585",
              "rewards": [
                -0.17741407358197459,
                -0.5519428931323498,
                -0.002338471543633502,
                -0.025608013586704153,
                0.343380438810559
              ],
              "variance": 0.6072242399810818,
              "mean_reward": -0.0827846026068206,
              "min_reward": -0.5519428931323498,
              "max_reward": 0.343380438810559,
              "num_responses": 5,
              "rvariance": 0.08408432464143241
            },
            {
              "id": "reasoning_sample_574",
              "rewards": [
                0.6780186148585274,
                0.06525400772433362,
                0.6935316428872412,
                0.545049803183838,
                0.05306519998748709,
                0.582724299825,
                0.7156931114996894
              ],
              "variance": 0.6420177457026255,
              "mean_reward": 0.47619095428087377,
              "min_reward": 0.05306519998748709,
              "max_reward": 0.7156931114996894,
              "num_responses": 7,
              "rvariance": 0.07276116222674721
            },
            {
              "id": "reasoning_sample_520",
              "rewards": [
                -0.6272918864146738,
                -1.278839063620652,
                -1.402943287850362,
                -1.004036852826294,
                -1.402943287850362,
                -1.278839063620652,
                -1.4384016376302793
              ],
              "variance": 0.5637877615006831,
              "mean_reward": -1.204756439973325,
              "min_reward": -1.4384016376302793,
              "max_reward": -0.6272918864146738,
              "num_responses": 7,
              "rvariance": 0.07398232360930554
            },
            {
              "id": "reasoning_sample_238",
              "rewards": [
                0.9417400913466615,
                0.9683338536815994,
                0.3771766784445426,
                0.7312061395284032,
                0.22086907013736862
              ],
              "variance": 0.674304235287386,
              "mean_reward": 0.6478651666277151,
              "min_reward": 0.22086907013736862,
              "max_reward": 0.9683338536815994,
              "num_responses": 5,
              "rvariance": 0.09032125851550496
            },
            {
              "id": "reasoning_sample_630",
              "rewards": [
                -0.0300403073091938,
                -0.7735575792568322,
                -0.9863076779363353,
                -0.8799326285965837,
                -0.9863076779363353
              ],
              "variance": 0.6588604618480862,
              "mean_reward": -0.7312291742070561,
              "min_reward": -0.9863076779363353,
              "max_reward": -0.0300403073091938,
              "num_responses": 5,
              "rvariance": 0.12914006488249602
            },
            {
              "id": "reasoning_sample_233",
              "rewards": [
                -1.3852141129604034,
                -1.7841205479844717,
                -1.7841205479844717,
                -1.6511517363097823,
                -1.730933023314596,
                -2.0234644089989127,
                -1.8018497228744303
              ],
              "variance": 0.34571891035419267,
              "mean_reward": -1.7372648714895809,
              "min_reward": -2.0234644089989127,
              "max_reward": -1.3852141129604034,
              "num_responses": 7,
              "rvariance": 0.03169536972447439
            },
            {
              "id": "reasoning_sample_394",
              "rewards": [
                -0.027824160447948977,
                -0.14417187066330223,
                -0.2704922417542572,
                -0.6405887675821428,
                -0.6405887675821428,
                -0.6095627115247152,
                -0.8223128102042183
              ],
              "variance": 0.615645598053812,
              "mean_reward": -0.45079161853696104,
              "min_reward": -0.8223128102042183,
              "max_reward": -0.027824160447948977,
              "num_responses": 7,
              "rvariance": 0.07724388243633722
            },
            {
              "id": "reasoning_sample_284",
              "rewards": [
                -0.04112104161541792,
                -1.0129014402712733,
                -0.7558284043668736,
                -0.47216160612753616,
                -0.8444742788166666,
                -0.6095627115247152,
                -0.7425315231994046
              ],
              "variance": 0.6120997630758206,
              "mean_reward": -0.6397972865602696,
              "min_reward": -1.0129014402712733,
              "max_reward": -0.04112104161541792,
              "num_responses": 7,
              "rvariance": 0.08464943164225705
            },
            {
              "id": "reasoning_sample_207",
              "rewards": [
                0.39435181661919,
                0.3760686050139202,
                0.17246011213705198,
                -0.6317241801371635,
                0.17246011213705198,
                -0.12201040205085399,
                0.34393447552587025
              ],
              "variance": 0.709277802941406,
              "mean_reward": 0.10079150560643814,
              "min_reward": -0.6317241801371635,
              "max_reward": 0.39435181661919,
              "num_responses": 7,
              "rvariance": 0.11679519138879565
            },
            {
              "id": "reasoning_sample_345",
              "rewards": [
                0.38327108231296586,
                -0.20844012963940212,
                0.3799468620210986,
                -0.048877555629774805,
                0.06857822801620087,
                0.19739176432605626
              ],
              "variance": 0.5102678148016208,
              "mean_reward": 0.12864504190119078,
              "min_reward": -0.20844012963940212,
              "max_reward": 0.38327108231296586,
              "num_responses": 6,
              "rvariance": 0.04691030745541752
            },
            {
              "id": "reasoning_sample_565",
              "rewards": [
                0.8132035733944617,
                0.9328755039016822,
                1.265297533088406,
                1.2697298268108956,
                1.478047631767909,
                1.4691830443229297,
                1.2918912954233437
              ],
              "variance": 0.5877221476021275,
              "mean_reward": 1.2171754869585183,
              "min_reward": 0.8132035733944617,
              "max_reward": 1.478047631767909,
              "num_responses": 7,
              "rvariance": 0.05517743060236435
            },
            {
              "id": "reasoning_sample_78",
              "rewards": [
                2.648173174505176,
                2.293589676706004,
                3.3573401701035195,
                2.8786524480746376,
                3.002756672304348,
                3.1800484212039337,
                3.375069344993478
              ],
              "variance": 0.8580920646739956,
              "mean_reward": 2.9622328439844425,
              "min_reward": 2.293589676706004,
              "max_reward": 3.375069344993478,
              "num_responses": 7,
              "rvariance": 0.13261891796878847
            },
            {
              "id": "reasoning_sample_601",
              "rewards": [
                -0.39681261284521213,
                -0.9685785030463767,
                -0.7115054671419772,
                -0.8577711599841356
              ],
              "variance": 0.44411583099346286,
              "mean_reward": -0.7336669357544254,
              "min_reward": -0.9685785030463767,
              "max_reward": -0.39681261284521213,
              "num_responses": 4,
              "rvariance": 0.04613681711822605
            },
            {
              "id": "reasoning_sample_539",
              "rewards": [
                -0.10649737402214023,
                -0.17741407358197459,
                -0.4677293124050465,
                -0.2638438011705227,
                -0.34805738189782603,
                -0.10871352088338505
              ],
              "variance": 0.30028789969867364,
              "mean_reward": -0.2453759106601492,
              "min_reward": -0.4677293124050465,
              "max_reward": -0.10649737402214023,
              "num_responses": 6,
              "rvariance": 0.017151375133369343
            },
            {
              "id": "reasoning_sample_603",
              "rewards": [
                -0.6671825299170807,
                -1.6777454986447202,
                -1.8550372475443062,
                -1.6777454986447202,
                -1.6777454986447202,
                -1.6777454986447202
              ],
              "variance": 0.5939273588136125,
              "mean_reward": -1.5388669620067112,
              "min_reward": -1.8550372475443062,
              "max_reward": -0.6671825299170807,
              "num_responses": 6,
              "rvariance": 0.15615773172653424
            },
            {
              "id": "reasoning_sample_339",
              "rewards": [
                0.6447764119398551,
                -0.0865520522709368,
                -0.04112104161541792,
                0.19988492954495668,
                0.1852029565892097,
                0.21041162713586958
              ],
              "variance": 0.4914305664810397,
              "mean_reward": 0.1854338052205894,
              "min_reward": -0.0865520522709368,
              "max_reward": 0.6447764119398551,
              "num_responses": 6,
              "rvariance": 0.056188635920149645
            },
            {
              "id": "reasoning_sample_447",
              "rewards": [
                0.8708233917868271,
                2.47088142560559,
                2.47088142560559,
                2.47088142560559,
                2.3290480264859212,
                1.806037367232143,
                2.47088142560559
              ],
              "variance": 1.0389296485515735,
              "mean_reward": 2.1270620697038933,
              "min_reward": 0.8708233917868271,
              "max_reward": 2.47088142560559,
              "num_responses": 7,
              "rvariance": 0.3135482571713824
            },
            {
              "id": "reasoning_sample_44",
              "rewards": [
                0.38991952289670034,
                1.1145995465237577,
                0.6447764119398551,
                1.2697298268108956,
                0.4641604427484019,
                1.0392505532414338,
                1.1456256025811855
              ],
              "variance": 0.7608032174653483,
              "mean_reward": 0.8668659866774614,
              "min_reward": 0.38991952289670034,
              "max_reward": 1.2697298268108956,
              "num_responses": 7,
              "rvariance": 0.11000971660581707
            },
            {
              "id": "reasoning_sample_266",
              "rewards": [
                -0.5652397742998188,
                -0.813448222759239,
                -0.436703256347619,
                -0.8489065725391562,
                -0.7868544604243012,
                -0.41454178773517075,
                -0.5962658303572463
              ],
              "variance": 0.3997928937685662,
              "mean_reward": -0.6374228434946502,
              "min_reward": -0.8489065725391562,
              "max_reward": -0.41454178773517075,
              "num_responses": 7,
              "rvariance": 0.027844103260533635
            },
            {
              "id": "reasoning_sample_529",
              "rewards": [
                -0.14860416438579188,
                -0.5164845433524327,
                -0.4101094940126811,
                -0.5741043617447981,
                -0.5741043617447981,
                -0.5608074805773291,
                -0.5741043617447981
              ],
              "variance": 0.26859699958287275,
              "mean_reward": -0.4797598239375184,
              "min_reward": -0.5741043617447981,
              "max_reward": -0.14860416438579188,
              "num_responses": 7,
              "rvariance": 0.02130504891669917
            },
            {
              "id": "reasoning_sample_466",
              "rewards": [
                -0.06439058365848857,
                0.024255290791304385,
                -0.4455678437925983,
                -0.03336452760106104,
                -0.055525996213509274,
                -0.5608074805773291,
                -0.13530728321832294
              ],
              "variance": 0.48134709826237576,
              "mean_reward": -0.18152977489571495,
              "min_reward": -0.5608074805773291,
              "max_reward": 0.024255290791304385,
              "num_responses": 7,
              "rvariance": 0.044229024960339085
            },
            {
              "id": "reasoning_sample_349",
              "rewards": [
                -0.5563751868548394,
                -0.8533388662616459,
                -0.8932295097640527,
                -0.9685785030463767,
                -1.2079223640608177,
                -1.1458702519459625
              ],
              "variance": 0.4720392814451474,
              "mean_reward": -0.9375524469889491,
              "min_reward": -1.2079223640608177,
              "max_reward": -0.5563751868548394,
              "num_responses": 6,
              "rvariance": 0.045301894943423134
            },
            {
              "id": "reasoning_sample_206",
              "rewards": [
                -0.5696720680223084,
                -1.128141077056004,
                -0.915390978376501,
                -1.128141077056004
              ],
              "variance": 0.45475333592743794,
              "mean_reward": -0.9353363001277044,
              "min_reward": -1.128141077056004,
              "max_reward": -0.5696720680223084,
              "num_responses": 4,
              "rvariance": 0.052113877628432684
            },
            {
              "id": "reasoning_sample_516",
              "rewards": [
                -0.3391927944528467,
                -0.7380992294769151,
                -0.6937762922520185,
                -0.587401242912267,
                -0.8755003348740941,
                -0.6583179424721014,
                -0.7779898729793219
              ],
              "variance": 0.32887619420873193,
              "mean_reward": -0.6671825299170806,
              "min_reward": -0.8755003348740941,
              "max_reward": -0.3391927944528467,
              "num_responses": 7,
              "rvariance": 0.025061697549545823
            },
            {
              "id": "reasoning_sample_542",
              "rewards": [
                0.8021228390882376,
                0.1356166705688568,
                0.37163631129143054,
                0.46970080990151397,
                -0.021175719864214505,
                0.37163631129143054,
                0.06082171400184398
              ],
              "variance": 0.5746468811207829,
              "mean_reward": 0.3129084194684427,
              "min_reward": -0.021175719864214505,
              "max_reward": 0.8021228390882376,
              "num_responses": 7,
              "rvariance": 0.06820068801030206
            },
            {
              "id": "reasoning_sample_151",
              "rewards": [
                0.010958409623835442,
                -0.6849117048070392,
                -0.436703256347619,
                -0.7292346420319358
              ],
              "variance": 0.592597670696866,
              "mean_reward": -0.45997279839068966,
              "min_reward": -0.7292346420319358,
              "max_reward": 0.010958409623835442,
              "num_responses": 4,
              "rvariance": 0.08635428158244506
            },
            {
              "id": "reasoning_sample_223",
              "rewards": [
                -0.6583179424721014,
                -1.3320265882905278,
                -0.5164845433524327,
                -0.5031876621849637,
                -0.5164845433524327,
                -0.3303282070078674,
                -0.6361564738596531
              ],
              "variance": 0.49375752068534684,
              "mean_reward": -0.6418551372171398,
              "min_reward": -1.3320265882905278,
              "max_reward": -0.3303282070078674,
              "num_responses": 7,
              "rvariance": 0.08919334272672308
            },
            {
              "id": "reasoning_sample_452",
              "rewards": [
                0.024255290791304385,
                -0.21952086394562625,
                0.22287745323037172,
                0.25196438078421
              ],
              "variance": 0.38962632004260556,
              "mean_reward": 0.06989406521506497,
              "min_reward": -0.21952086394562625,
              "max_reward": 0.25196438078421,
              "num_responses": 4,
              "rvariance": 0.0355993539430202
            },
            {
              "id": "reasoning_sample_68",
              "rewards": [
                0.8752556855093168,
                1.5666935062177019,
                1.265297533088406,
                1.4337246945430124,
                1.6376102057775364,
                1.3051881765908127,
                1.163354777471144
              ],
              "variance": 0.5469450453552227,
              "mean_reward": 1.3210177970282755,
              "min_reward": 0.8752556855093168,
              "max_reward": 1.6376102057775364,
              "num_responses": 7,
              "rvariance": 0.05717242351560286
            },
            {
              "id": "reasoning_sample_552",
              "rewards": [
                0.8176358671169514,
                0.558346684351307,
                0.808771279671972,
                0.4453231944278209,
                0.808771279671972,
                0.808771279671972,
                1.110167252801268
              ],
              "variance": 0.42151113300876564,
              "mean_reward": 0.7653981196733233,
              "min_reward": 0.4453231944278209,
              "max_reward": 1.110167252801268,
              "num_responses": 7,
              "rvariance": 0.03893664072577214
            },
            {
              "id": "reasoning_sample_209",
              "rewards": [
                -0.33476050073035707,
                -1.0572243774961696,
                -0.587401242912267,
                -1.216786951505797
              ],
              "variance": 0.7583654559179787,
              "mean_reward": -0.7990432681611477,
              "min_reward": -1.216786951505797,
              "max_reward": -0.33476050073035707,
              "num_responses": 4,
              "rvariance": 0.12537952629411467
            },
            {
              "id": "reasoning_sample_391",
              "rewards": [
                0.2763419962579031,
                -0.11536196146711952,
                -0.21287242336189177,
                -0.2660599480317675,
                -0.31259903211790885,
                -0.06217443679724375,
                -0.13309113635707812
              ],
              "variance": 0.35790771809103916,
              "mean_reward": -0.11797384883930093,
              "min_reward": -0.31259903211790885,
              "max_reward": 0.2763419962579031,
              "num_responses": 7,
              "rvariance": 0.03252115837188487
            },
            {
              "id": "reasoning_sample_210",
              "rewards": [
                1.0525474344089027,
                0.8663910980643375,
                0.5982373278537138,
                0.7622321955858308,
                0.8708233917868271,
                0.43202631326035196,
                0.7888259579207686
              ],
              "variance": 0.41176008681928844,
              "mean_reward": 0.7672976741258191,
              "min_reward": 0.43202631326035196,
              "max_reward": 1.0525474344089027,
              "num_responses": 7,
              "rvariance": 0.034768845542980535
            },
            {
              "id": "reasoning_sample_465",
              "rewards": [
                1.3362142326482402,
                1.5312351564377849,
                1.3051881765908127,
                1.3229173514807713,
                1.7883081923421844,
                1.7883081923421844,
                1.7439852551172879
              ],
              "variance": 0.4724825108173967,
              "mean_reward": 1.5451652224227523,
              "min_reward": 1.3051881765908127,
              "max_reward": 1.7883081923421844,
              "num_responses": 7,
              "rvariance": 0.044086296367671717
            },
            {
              "id": "reasoning_sample_396",
              "rewards": [
                0.9328755039016822,
                -0.09984893343840576,
                -0.03558067446230586,
                0.3478127325330487,
                -0.044445261907285157,
                0.07965896232242499,
                -0.05995828993599892
              ],
              "variance": 0.657752388417464,
              "mean_reward": 0.16007343414473715,
              "min_reward": -0.09984893343840576,
              "max_reward": 0.9328755039016822,
              "num_responses": 7,
              "rvariance": 0.11928822778285982
            },
            {
              "id": "reasoning_sample_348",
              "rewards": [
                -0.1131458146058747,
                -0.286005269782971,
                -0.5563751868548394,
                -0.4898907810174948,
                -0.39681261284521213,
                -0.5563751868548394,
                -0.3879480254002329
              ],
              "variance": 0.339513699142707,
              "mean_reward": -0.3980789824802092,
              "min_reward": -0.5563751868548394,
              "max_reward": -0.1131458146058747,
              "num_responses": 7,
              "rvariance": 0.021770921457933724
            },
            {
              "id": "reasoning_sample_83",
              "rewards": [
                0.42759401953786236,
                0.17439924064064122,
                0.03311987823628368,
                -0.11979425518960916,
                0.046416759403752623,
                0.709044670915955,
                0.0442006125425078
              ],
              "variance": 0.568220055223173,
              "mean_reward": 0.18785441801248481,
              "min_reward": -0.11979425518960916,
              "max_reward": 0.709044670915955,
              "num_responses": 7,
              "rvariance": 0.06978955844010366
            },
            {
              "id": "reasoning_sample_242",
              "rewards": [
                0.5915888872699793,
                0.20791846191696917,
                0.20791846191696917,
                0.26955504649534084,
                -0.2062239827781573,
                -0.14638801752454705,
                0.17827749764781964
              ],
              "variance": 0.5686909864311874,
              "mean_reward": 0.15752090784919623,
              "min_reward": -0.2062239827781573,
              "max_reward": 0.5915888872699793,
              "num_responses": 7,
              "rvariance": 0.06159261461315002
            },
            {
              "id": "reasoning_sample_269",
              "rewards": [
                1.2608652393659163,
                0.9816307348490683,
                0.2935171344325505,
                0.9816307348490683,
                0.9816307348490683
              ],
              "variance": 0.5804088629600195,
              "mean_reward": 0.8998549156691343,
              "min_reward": 0.2935171344325505,
              "max_reward": 1.2608652393659163,
              "num_responses": 5,
              "rvariance": 0.10360716251564131
            },
            {
              "id": "reasoning_sample_694",
              "rewards": [
                -0.6361564738596531,
                -0.915390978376501,
                -1.004036852826294,
                -1.0749535523861282,
                -0.915390978376501,
                -1.128141077056004
              ],
              "variance": 0.3257735886029891,
              "mean_reward": -0.9456783188135134,
              "min_reward": -1.128141077056004,
              "max_reward": -0.6361564738596531,
              "num_responses": 6,
              "rvariance": 0.025174813522994843
            },
            {
              "id": "reasoning_sample_18",
              "rewards": [
                -0.1131458146058747,
                0.005418042470723382,
                0.2423726201503848,
                -0.20179168905566766,
                -0.3879480254002329,
                -0.33476050073035707
              ],
              "variance": 0.485249594375849,
              "mean_reward": -0.13164256119517068,
              "min_reward": -0.3879480254002329,
              "max_reward": 0.2423726201503848,
              "num_responses": 6,
              "rvariance": 0.04514756384509617
            },
            {
              "id": "reasoning_sample_230",
              "rewards": [
                -0.6671825299170807,
                -1.3231620008455485,
                -1.1990577766158383,
                -1.0483597900511903,
                -1.1990577766158383
              ],
              "variance": 0.45386687718293983,
              "mean_reward": -1.0873639748090993,
              "min_reward": -1.3231620008455485,
              "max_reward": -0.6671825299170807,
              "num_responses": 5,
              "rvariance": 0.05172509857338915
            },
            {
              "id": "reasoning_sample_237",
              "rewards": [
                0.8486619231743788,
                0.7511514612796066,
                0.5627789780737966,
                0.285483602060538,
                0.3201108967674884
              ],
              "variance": 0.5103232184731518,
              "mean_reward": 0.5536373722711617,
              "min_reward": 0.285483602060538,
              "max_reward": 0.8486619231743788,
              "num_responses": 5,
              "rvariance": 0.050515185837694265
            },
            {
              "id": "reasoning_sample_312",
              "rewards": [
                -0.23946618569682965,
                -0.5342137182423913,
                -0.44113555007010863,
                -0.17741407358197459,
                -0.6671825299170807,
                -0.6671825299170807
              ],
              "variance": 0.4587424002776786,
              "mean_reward": -0.4544324312375776,
              "min_reward": -0.6671825299170807,
              "max_reward": -0.17741407358197459,
              "num_responses": 6,
              "rvariance": 0.0366694544968826
            },
            {
              "id": "reasoning_sample_47",
              "rewards": [
                0.36554190742300724,
                -0.1508203112470367,
                -0.42340637518015006,
                -0.32811206014662264,
                -0.42340637518015006,
                -0.42340637518015006,
                -0.42340637518015006
              ],
              "variance": 0.47913095140113116,
              "mean_reward": -0.25814513781303605,
              "min_reward": -0.42340637518015006,
              "max_reward": 0.36554190742300724,
              "num_responses": 7,
              "rvariance": 0.07352066075970866
            },
            {
              "id": "reasoning_sample_2",
              "rewards": [
                -0.4189740814576604,
                -0.37908343795525357,
                -0.2328177451130952,
                -0.0865520522709368,
                -0.4765938998500258,
                -0.5164845433524327,
                -0.6627502361945911
              ],
              "variance": 0.4006793525130642,
              "mean_reward": -0.39617942802771366,
              "min_reward": -0.6627502361945911,
              "max_reward": -0.0865520522709368,
              "num_responses": 7,
              "rvariance": 0.030766832026110167
            },
            {
              "id": "reasoning_sample_58",
              "rewards": [
                2.107433340361439,
                2.559527300055383,
                2.3024542641509833,
                2.8431940982947204,
                1.7262560802273292,
                2.258131326926087,
                2.054245815691563
              ],
              "variance": 0.7499440978452485,
              "mean_reward": 2.264463175101072,
              "min_reward": 1.7262560802273292,
              "max_reward": 2.8431940982947204,
              "num_responses": 7,
              "rvariance": 0.11171318837314745
            },
            {
              "id": "reasoning_sample_308",
              "rewards": [
                -0.2594115074480331,
                -0.587401242912267,
                -0.6228595926921842,
                -0.8666357474291149,
                -0.37021885051027426,
                -0.6051304178022257,
                -0.6228595926921842
              ],
              "variance": 0.3944741413015787,
              "mean_reward": -0.5620738502123261,
              "min_reward": -0.8666357474291149,
              "max_reward": -0.2594115074480331,
              "num_responses": 7,
              "rvariance": 0.03300799166939863
            },
            {
              "id": "reasoning_sample_59",
              "rewards": [
                0.9284432101791925,
                0.9506046787916408,
                2.027652053356625,
                0.9240109164567029,
                1.1766516586386129,
                1.096870371633799,
                1.3362142326482402
              ],
              "variance": 0.6861190682413978,
              "mean_reward": 1.205778160243545,
              "min_reward": 0.9240109164567029,
              "max_reward": 2.027652053356625,
              "num_responses": 7,
              "rvariance": 0.13237435493079094
            },
            {
              "id": "reasoning_sample_219",
              "rewards": [
                0.6425602650786103,
                0.27745006968852554,
                0.28908484071006085,
                0.6602894399685688,
                -0.12865884263458846,
                -0.1796302204432194,
                0.31955686005217715
              ],
              "variance": 0.7986993287926345,
              "mean_reward": 0.2686646303457335,
              "min_reward": -0.1796302204432194,
              "max_reward": 0.6602894399685688,
              "num_responses": 7,
              "rvariance": 0.09358376294138852
            },
            {
              "id": "reasoning_sample_216",
              "rewards": [
                -0.5430783056873706,
                -0.4898907810174948,
                -0.977443090491356,
                -0.7469638169218943
              ],
              "variance": 0.4024522700020601,
              "mean_reward": -0.6893439985295289,
              "min_reward": -0.977443090491356,
              "max_reward": -0.4898907810174948,
              "num_responses": 4,
              "rvariance": 0.03687409228482447
            },
            {
              "id": "reasoning_sample_201",
              "rewards": [
                0.14115703772196886,
                -0.5785366554672877,
                -0.6405887675821428,
                -0.5652397742998188,
                -0.4765938998500258
              ],
              "variance": 0.5098245854293717,
              "mean_reward": -0.42396041189546124,
              "min_reward": -0.6405887675821428,
              "max_reward": 0.14115703772196886,
              "num_responses": 5,
              "rvariance": 0.08258190674440914
            },
            {
              "id": "reasoning_sample_550",
              "rewards": [
                0.897417154121765,
                0.9328755039016822,
                0.6625055868298136,
                0.9328755039016822,
                0.9328755039016822,
                0.6625055868298136,
                0.897417154121765
              ],
              "variance": 0.2703699170718685,
              "mean_reward": 0.8454959990868863,
              "min_reward": 0.6625055868298136,
              "max_reward": 0.9328755039016822,
              "num_responses": 7,
              "rvariance": 0.013609732603053636
            },
            {
              "id": "reasoning_sample_34",
              "rewards": [
                0.29074695085599445,
                -0.6317241801371635,
                0.450863561580933,
                0.34670465910242626,
                0.15279180874350418,
                0.4087567712172813,
                0.18298680972796488
              ],
              "variance": 0.5866140741715048,
              "mean_reward": 0.1715894830129915,
              "min_reward": -0.6317241801371635,
              "max_reward": 0.450863561580933,
              "num_responses": 7,
              "rvariance": 0.11784317908737851
            },
            {
              "id": "reasoning_sample_618",
              "rewards": [
                0.2665078445611292,
                -0.5164845433524327,
                -0.46329701868255685,
                -0.35692196934280535,
                -0.4322709626251293,
                -0.27714068233799166
              ],
              "variance": 0.48457436212906346,
              "mean_reward": -0.2966012219632978,
              "min_reward": -0.5164845433524327,
              "max_reward": 0.2665078445611292,
              "num_responses": 6,
              "rvariance": 0.06927526136152945
            },
            {
              "id": "reasoning_sample_257",
              "rewards": [
                0.06303786086308881,
                -0.1685494861369953,
                -0.03336452760106104,
                -0.33476050073035707,
                -0.32811206014662264
              ],
              "variance": 0.35657802997429217,
              "mean_reward": -0.16034974275038943,
              "min_reward": -0.33476050073035707,
              "max_reward": 0.06303786086308881,
              "num_responses": 5,
              "rvariance": 0.02493156194872025
            },
            {
              "id": "reasoning_sample_527",
              "rewards": [
                0.6292633839111413,
                0.9860630285715579,
                0.4896461316527174,
                0.46748466304026914,
                0.4896461316527174,
                0.4896461316527174,
                0.4896461316527174
              ],
              "variance": 0.29120169756757,
              "mean_reward": 0.5773422288762626,
              "min_reward": 0.46748466304026914,
              "max_reward": 0.9860630285715579,
              "num_responses": 7,
              "rvariance": 0.030368515012584744
            },
            {
              "id": "reasoning_sample_66",
              "rewards": [
                -0.7159377608644668,
                0.02314721736068197,
                -0.3391927944528467,
                0.1284141932698111,
                0.019822997068814737,
                0.2568122020431831,
                -0.055525996213509274
              ],
              "variance": 0.6696641777966547,
              "mean_reward": -0.09749427739833315,
              "min_reward": -0.7159377608644668,
              "max_reward": 0.2568122020431831,
              "num_responses": 7,
              "rvariance": 0.09250532623623375
            },
            {
              "id": "reasoning_sample_292",
              "rewards": [
                0.9683338536815994,
                0.3699742011454969,
                0.7710967830308101,
                0.8663910980643375,
                0.7710967830308101,
                0.21719857689843186,
                0.8663910980643375
              ],
              "variance": 0.5983042488645713,
              "mean_reward": 0.6900689134165461,
              "min_reward": 0.21719857689843186,
              "max_reward": 0.9683338536815994,
              "num_responses": 7,
              "rvariance": 0.0684012019813923
            },
            {
              "id": "reasoning_sample_390",
              "rewards": [
                1.1190318402462474,
                1.265297533088406,
                0.897417154121765,
                0.7888259579207686,
                0.7888259579207686,
                1.0835734904663301
              ],
              "variance": 0.40333872874655796,
              "mean_reward": 0.9904953222940476,
              "min_reward": 0.7888259579207686,
              "max_reward": 1.265297533088406,
              "num_responses": 6,
              "rvariance": 0.03178434122313389
            },
            {
              "id": "reasoning_sample_414",
              "rewards": [
                -0.5829689491897774,
                -1.0306306151612319,
                -0.41454178773517075,
                -0.4278386689026397,
                -0.4278386689026397,
                -0.41454178773517075
              ],
              "variance": 0.3922579944403339,
              "mean_reward": -0.5497267462711051,
              "min_reward": -1.0306306151612319,
              "max_reward": -0.41454178773517075,
              "num_responses": 6,
              "rvariance": 0.0497728213343775
            },
            {
              "id": "reasoning_sample_384",
              "rewards": [
                0.3322997045043349,
                -0.23503389197434002,
                -0.23503389197434002,
                -0.40567720029019144,
                -0.5475105994098601,
                -0.23503389197434002,
                -0.14638801752454705
              ],
              "variance": 0.5074976312250647,
              "mean_reward": -0.21033968409189768,
              "min_reward": -0.5475105994098601,
              "max_reward": 0.3322997045043349,
              "num_responses": 7,
              "rvariance": 0.06460252925607571
            },
            {
              "id": "reasoning_sample_586",
              "rewards": [
                0.15002162516694814,
                0.07965896232242499,
                0.07965896232242499,
                0.19018928702701057,
                0.07965896232242499,
                -0.11757810832836435
              ],
              "variance": 0.18906502909994904,
              "mean_reward": 0.07693494847214488,
              "min_reward": -0.11757810832836435,
              "max_reward": 0.19018928702701057,
              "num_responses": 6,
              "rvariance": 0.00933763292200642
            },
            {
              "id": "reasoning_sample_652",
              "rewards": [
                -0.7824221667018115,
                -1.4295370501853,
                -1.2877036510656312,
                -1.3142974134005692,
                -1.252245301285714,
                -1.3852141129604034,
                -1.0306306151612319
              ],
              "variance": 0.47159605207289834,
              "mean_reward": -1.2117214729658088,
              "min_reward": -1.4295370501853,
              "max_reward": -0.7824221667018115,
              "num_responses": 7,
              "rvariance": 0.04465320150821011
            },
            {
              "id": "reasoning_sample_389",
              "rewards": [
                -0.1508203112470367,
                -0.22173701080687105,
                -0.31924747270164333,
                -0.6139950052472049,
                -0.2815729760604813,
                -0.3524896756203157,
                -0.6450210613046324
              ],
              "variance": 0.4330350966872386,
              "mean_reward": -0.36926907328402647,
              "min_reward": -0.6450210613046324,
              "max_reward": -0.1508203112470367,
              "num_responses": 7,
              "rvariance": 0.030841403706548743
            },
            {
              "id": "reasoning_sample_26",
              "rewards": [
                1.2963235891458333,
                0.008742262762590618,
                0.7378545801121377,
                1.225406889585999,
                0.9284432101791925,
                0.5384013626001035
              ],
              "variance": 0.9872934266845692,
              "mean_reward": 0.789195315730976,
              "min_reward": 0.008742262762590618,
              "max_reward": 1.2963235891458333,
              "num_responses": 6,
              "rvariance": 0.19024834081977318
            },
            {
              "id": "reasoning_sample_563",
              "rewards": [
                -0.036688747892928274,
                -0.3391927944528467,
                -0.33476050073035707,
                -0.6139950052472049,
                -0.361354263065295,
                -0.3524896756203157,
                -0.30595059153417437
              ],
              "variance": 0.2641647058603831,
              "mean_reward": -0.3349187969347317,
              "min_reward": -0.6139950052472049,
              "max_reward": -0.036688747892928274,
              "num_responses": 7,
              "rvariance": 0.024098530125924163
            },
            {
              "id": "reasoning_sample_399",
              "rewards": [
                0.6492087056623447,
                -0.09098434599342646,
                0.4796734707771157,
                0.39213566975794517,
                0.709044670915955,
                0.6735863211360378
              ],
              "variance": 0.540739834143737,
              "mean_reward": 0.4687774153759953,
              "min_reward": -0.09098434599342646,
              "max_reward": 0.709044670915955,
              "num_responses": 6,
              "rvariance": 0.07525940052730179
            },
            {
              "id": "reasoning_sample_428",
              "rewards": [
                -0.25497921372554344,
                -0.4898907810174948,
                -0.2993021509504399,
                -0.45886472496006725,
                -0.7513961106443839
              ],
              "variance": 0.3740855901781263,
              "mean_reward": -0.4508865962595858,
              "min_reward": -0.7513961106443839,
              "max_reward": -0.25497921372554344,
              "num_responses": 5,
              "rvariance": 0.030649698358599764
            },
            {
              "id": "reasoning_sample_39",
              "rewards": [
                -0.051093702491019626,
                0.23163815879123018,
                -0.2660599480317675,
                0.25168736242655443,
                -0.05995828993599892,
                -0.013419205849857622,
                -0.04001296818479551
              ],
              "variance": 0.38205679341966625,
              "mean_reward": 0.0075402009606207725,
              "min_reward": -0.2660599480317675,
              "max_reward": 0.25168736242655443,
              "num_responses": 7,
              "rvariance": 0.02791133631732805
            },
            {
              "id": "reasoning_sample_255",
              "rewards": [
                -1.1370056645009832,
                -1.6511517363097823,
                -1.4649953999652172,
                -1.2699744761756726,
                -1.642287148864803,
                -1.252245301285714,
                -1.6954746735346788
              ],
              "variance": 0.46273146462791925,
              "mean_reward": -1.4447334858052645,
              "min_reward": -1.6954746735346788,
              "max_reward": -1.1370056645009832,
              "num_responses": 7,
              "rvariance": 0.04388663670714261
            },
            {
              "id": "reasoning_sample_277",
              "rewards": [
                -1.2611098887306933,
                -1.668880911199741,
                -1.6156933865298653,
                -1.7132038484246375,
                -1.668880911199741,
                -1.5004537497451342,
                -1.5093183371901135
              ],
              "variance": 0.2818938807503417,
              "mean_reward": -1.5625058618599894,
              "min_reward": -1.7132038484246375,
              "max_reward": -1.2611098887306933,
              "num_responses": 7,
              "rvariance": 0.020812715456599316
            },
            {
              "id": "reasoning_sample_208",
              "rewards": [
                -1.2256515389507763,
                -1.5979642116399067,
                -1.2699744761756726,
                -1.2699744761756726,
                -1.55364127441501
              ],
              "variance": 0.33685432290921313,
              "mean_reward": -1.3834411954714079,
              "min_reward": -1.5979642116399067,
              "max_reward": -1.2256515389507763,
              "num_responses": 5,
              "rvariance": 0.025127031963762335
            },
            {
              "id": "reasoning_sample_561",
              "rewards": [
                -0.6716148236395704,
                -0.8976618034865423,
                -1.2345161263957554,
                -0.9065263909315217,
                -1.2345161263957554,
                -1.2345161263957554,
                -1.2345161263957554
              ],
              "variance": 0.4272731148480019,
              "mean_reward": -1.0591239319486652,
              "min_reward": -1.2345161263957554,
              "max_reward": -0.6716148236395704,
              "num_responses": 7,
              "rvariance": 0.046081289280910175
            },
            {
              "id": "reasoning_sample_640",
              "rewards": [
                1.0126567909064959,
                -0.12201040205085399,
                0.10791483480329649,
                0.22086907013736862,
                0.4242697992459951,
                0.4242697992459951
              ],
              "variance": 0.7255110787000243,
              "mean_reward": 0.3446616487147162,
              "min_reward": -0.12201040205085399,
              "max_reward": 1.0126567909064959,
              "num_responses": 6,
              "rvariance": 0.12467481410460292
            },
            {
              "id": "reasoning_sample_320",
              "rewards": [
                -0.8001513415917701,
                -1.3852141129604034,
                -1.2611098887306933,
                -1.3586203506254657,
                -1.2965682385106105
              ],
              "variance": 0.390041847579089,
              "mean_reward": -1.2203327864837887,
              "min_reward": -1.3852141129604034,
              "max_reward": -0.8001513415917701,
              "num_responses": 5,
              "rvariance": 0.046067273012371845
            },
            {
              "id": "reasoning_sample_217",
              "rewards": [
                0.808771279671972,
                0.2577817662949777,
                0.18852717688107695,
                0.19960791118730106,
                0.19849983775667868,
                0.46637658960964673,
                0.3004425933739406
              ],
              "variance": 0.40882369222813897,
              "mean_reward": 0.3457153078250848,
              "min_reward": 0.18852717688107695,
              "max_reward": 0.808771279671972,
              "num_responses": 7,
              "rvariance": 0.04378425412488052
            },
            {
              "id": "reasoning_sample_522",
              "rewards": [
                0.9062817415667443,
                0.5627789780737966,
                0.5494820969063277,
                0.9062817415667443,
                0.9860630285715579,
                0.5805081529637551,
                0.4818896176383605
              ],
              "variance": 0.41574915116952904,
              "mean_reward": 0.7104693367553266,
              "min_reward": 0.4818896176383605,
              "max_reward": 0.9860630285715579,
              "num_responses": 7,
              "rvariance": 0.03850068706439097
            },
            {
              "id": "reasoning_sample_291",
              "rewards": [
                -0.6760471173620599,
                -1.0129014402712733,
                -1.004036852826294,
                -1.2877036510656312,
                -1.128141077056004
              ],
              "variance": 0.4166356099140268,
              "mean_reward": -1.0217660277162526,
              "min_reward": -1.2877036510656312,
              "max_reward": -0.6760471173620599,
              "num_responses": 5,
              "rvariance": 0.04039058803281785
            },
            {
              "id": "reasoning_sample_49",
              "rewards": [
                2.320183439040942,
                2.7545482238449277,
                3.1800484212039337,
                3.3927985198834367,
                2.9318399727445135,
                2.9672983225244307,
                2.949569147634472
              ],
              "variance": 0.6843461507524013,
              "mean_reward": 2.9280408638395223,
              "min_reward": 2.320183439040942,
              "max_reward": 3.3927985198834367,
              "num_responses": 7,
              "rvariance": 0.09730241158989879
            },
            {
              "id": "reasoning_sample_545",
              "rewards": [
                -0.48102619357251547,
                -0.8178805164817287,
                -0.6760471173620599,
                -0.6095627115247152,
                -0.7513961106443839
              ],
              "variance": 0.25884595339339533,
              "mean_reward": -0.6671825299170806,
              "min_reward": -0.8178805164817287,
              "max_reward": -0.48102619357251547,
              "num_responses": 5,
              "rvariance": 0.013570923255384518
            },
            {
              "id": "reasoning_sample_37",
              "rewards": [
                0.6625055868298136,
                0.6868832023035067,
                0.7378545801121377,
                1.4337246945430124,
                0.8575265106193581,
                1.655339380667495,
                1.4869122192128883
              ],
              "variance": 0.8771509276807015,
              "mean_reward": 1.0743923106126017,
              "min_reward": 0.6625055868298136,
              "max_reward": 1.655339380667495,
              "num_responses": 7,
              "rvariance": 0.15955633383517243
            },
            {
              "id": "reasoning_sample_248",
              "rewards": [
                -0.2616276543092779,
                -0.13752343007956777,
                -0.13752343007956777,
                -0.3657865567877846,
                -0.1042812271608954,
                -0.436703256347619,
                -0.37908343795525357
              ],
              "variance": 0.2779048164001009,
              "mean_reward": -0.2603612846742808,
              "min_reward": -0.436703256347619,
              "max_reward": -0.1042812271608954,
              "num_responses": 7,
              "rvariance": 0.01583525624883077
            },
            {
              "id": "reasoning_sample_28",
              "rewards": [
                0.9771984411265786,
                0.5428336563225932,
                0.7755290767532997,
                0.37385245815267537,
                0.6314795307723862,
                0.2478783600087899,
                0.2563966745066997
              ],
              "variance": 0.6032074737950756,
              "mean_reward": 0.5435954568061462,
              "min_reward": 0.2478783600087899,
              "max_reward": 0.9771984411265786,
              "num_responses": 7,
              "rvariance": 0.06403905290781002
            },
            {
              "id": "reasoning_sample_328",
              "rewards": [
                -0.04222911504604033,
                -0.3524896756203157,
                -0.5297814245199016,
                -0.5430783056873706,
                -0.525349130797412
              ],
              "variance": 0.3714262139446326,
              "mean_reward": -0.398585530334208,
              "min_reward": -0.5430783056873706,
              "max_reward": -0.04222911504604033,
              "num_responses": 5,
              "rvariance": 0.036654851544335065
            },
            {
              "id": "reasoning_sample_604",
              "rewards": [
                0.06082171400184398,
                -0.23060159825185036,
                -0.15525260496952636,
                -0.361354263065295,
                -0.10206508029965057,
                -0.4455678437925983,
                -0.0954166397159161
              ],
              "variance": 0.3621183971274043,
              "mean_reward": -0.1899194737275704,
              "min_reward": -0.4455678437925983,
              "max_reward": 0.06082171400184398,
              "num_responses": 7,
              "rvariance": 0.025303303780321623
            },
            {
              "id": "reasoning_sample_93",
              "rewards": [
                1.6819331430024327,
                1.5755580936626812,
                1.1544901900261646,
                2.018787465911646,
                1.4248601070980331,
                1.7439852551172879,
                1.5666935062177019
              ],
              "variance": 0.5371939991657453,
              "mean_reward": 1.5951868230051354,
              "min_reward": 1.1544901900261646,
              "max_reward": 2.018787465911646,
              "num_responses": 7,
              "rvariance": 0.06193218152725229
            },
            {
              "id": "reasoning_sample_410",
              "rewards": [
                1.6730685555574536,
                1.7971727797871637,
                2.027652053356625,
                2.0985687529164596,
                1.992193703576708,
                2.2315375645911493,
                2.2315375645911493
              ],
              "variance": 0.48400647449586964,
              "mean_reward": 2.007390139196673,
              "min_reward": 1.6730685555574536,
              "max_reward": 2.2315375645911493,
              "num_responses": 7,
              "rvariance": 0.03791448750384658
            },
            {
              "id": "reasoning_sample_577",
              "rewards": [
                -1.0749535523861282,
                -1.7752559605394924,
                -1.5713704493049687,
                -1.5270475120800722,
                -1.5359120995250515,
                -1.5270475120800722,
                -1.5890996241949273
              ],
              "variance": 0.31735223053025896,
              "mean_reward": -1.514383815730102,
              "min_reward": -1.7752559605394924,
              "max_reward": -1.0749535523861282,
              "num_responses": 7,
              "rvariance": 0.0386810523049141
            },
            {
              "id": "reasoning_sample_663",
              "rewards": [
                -0.5342137182423913,
                -0.9863076779363353,
                -0.9863076779363353,
                -0.9508493281564181,
                -0.8799326285965837,
                -0.9863076779363353,
                -0.8045836353142598
              ],
              "variance": 0.28987200945082303,
              "mean_reward": -0.8755003348740943,
              "min_reward": -0.9863076779363353,
              "max_reward": -0.5342137182423913,
              "num_responses": 7,
              "rvariance": 0.02343395011631664
            },
            {
              "id": "reasoning_sample_46",
              "rewards": [
                0.2832674551992932,
                0.8442296294518892,
                1.4869122192128883,
                1.4159955196530538,
                1.0747089030213508,
                1.3805371698731368,
                1.3672402887056678
              ],
              "variance": 0.8245174397261369,
              "mean_reward": 1.1218415978738971,
              "min_reward": 0.2832674551992932,
              "max_reward": 1.4869122192128883,
              "num_responses": 7,
              "rvariance": 0.16134907048492972
            },
            {
              "id": "reasoning_sample_598",
              "rewards": [
                -1.6600163237547616,
                -1.846172660099327,
                -1.8993601847692025,
                -1.7841205479844717
              ],
              "variance": 0.1861563363445653,
              "mean_reward": -1.7974174291519407,
              "min_reward": -1.8993601847692025,
              "max_reward": -1.6600163237547616,
              "num_responses": 4,
              "rvariance": 0.007956317195180562
            },
            {
              "id": "reasoning_sample_220",
              "rewards": [
                -0.5652397742998188,
                -0.8356096913716873,
                -0.4677293124050465,
                -0.6317241801371635,
                -0.49875536846247404
              ],
              "variance": 0.2739157520498602,
              "mean_reward": -0.599811665335238,
              "min_reward": -0.8356096913716873,
              "max_reward": -0.4677293124050465,
              "num_responses": 5,
              "rvariance": 0.01709449128532918
            },
            {
              "id": "reasoning_sample_298",
              "rewards": [
                -1.340891175735507,
                -1.792985135429451,
                -1.846172660099327,
                -1.6777454986447202
              ],
              "variance": 0.388268930090093,
              "mean_reward": -1.6644486174772513,
              "min_reward": -1.846172660099327,
              "max_reward": -1.340891175735507,
              "num_responses": 4,
              "rvariance": 0.038602872317357526
            },
            {
              "id": "reasoning_sample_27",
              "rewards": [
                -0.005662691835500737,
                -0.5962658303572463,
                -0.5608074805773291,
                -0.5475105994098601,
                -0.7646929918118529
              ],
              "variance": 0.47492027236476586,
              "mean_reward": -0.4949879187983578,
              "min_reward": -0.7646929918118529,
              "max_reward": -0.005662691835500737,
              "num_responses": 5,
              "rvariance": 0.06590561324251801
            },
            {
              "id": "reasoning_sample_510",
              "rewards": [
                1.1145995465237577,
                0.6669378805523033,
                0.8752556855093168,
                1.0170890846289855,
                1.1589224837486543,
                0.8929848603992754
              ],
              "variance": 0.365664232105396,
              "mean_reward": 0.9542982568937156,
              "min_reward": 0.6669378805523033,
              "max_reward": 1.1589224837486543,
              "num_responses": 6,
              "rvariance": 0.027348885382089457
            },
            {
              "id": "reasoning_sample_654",
              "rewards": [
                -0.30595059153417437,
                -0.7513961106443839,
                -0.37021885051027426,
                -0.37021885051027426,
                -0.5519428931323498,
                -0.6671825299170807,
                -0.5342137182423913
              ],
              "variance": 0.3563564152881677,
              "mean_reward": -0.5073033634987041,
              "min_reward": -0.7513961106443839,
              "max_reward": -0.30595059153417437,
              "num_responses": 7,
              "rvariance": 0.02371239114892198
            },
            {
              "id": "reasoning_sample_50",
              "rewards": [
                1.84149571701206,
                0.5428336563225932,
                1.2298391833084887,
                1.5312351564377849,
                1.7439852551172879,
                1.3982663447630954,
                0.9373077976241718
              ],
              "variance": 1.0034712987716565,
              "mean_reward": 1.317851872940783,
              "min_reward": 0.5428336563225932,
              "max_reward": 1.84149571701206,
              "num_responses": 7,
              "rvariance": 0.180143530096897
            },
            {
              "id": "reasoning_sample_419",
              "rewards": [
                0.7112608177771997,
                1.0392505532414338,
                1.0392505532414338,
                1.0392505532414338,
                1.0392505532414338
              ],
              "variance": 0.19679384127854038,
              "mean_reward": 0.9736526061485871,
              "min_reward": 0.7112608177771997,
              "max_reward": 1.0392505532414338,
              "num_responses": 5,
              "rvariance": 0.01721236265118371
            },
            {
              "id": "reasoning_sample_584",
              "rewards": [
                -0.27714068233799166,
                -0.07768746482595751,
                -0.07768746482595751,
                -0.21287242336189177,
                -0.3524896756203157,
                -0.07768746482595751,
                -0.21287242336189177
              ],
              "variance": 0.22959281482496374,
              "mean_reward": -0.18406251416570907,
              "min_reward": -0.3524896756203157,
              "max_reward": -0.07768746482595751,
              "num_responses": 7,
              "rvariance": 0.010376889886836023
            },
            {
              "id": "reasoning_sample_571",
              "rewards": [
                -0.8843649223190734,
                -0.7868544604243012,
                -0.6538856487496117,
                -0.8932295097640527,
                -0.7868544604243012,
                -0.6450210613046324,
                -0.6184272989696945
              ],
              "variance": 0.2535272009264079,
              "mean_reward": -0.752662480279381,
              "min_reward": -0.8932295097640527,
              "max_reward": -0.6184272989696945,
              "num_responses": 7,
              "rvariance": 0.011257918208146644
            },
            {
              "id": "reasoning_sample_546",
              "rewards": [
                -0.5209168370749223,
                -0.17076563299824013,
                -0.6317241801371635,
                -0.2150885702231366
              ],
              "variance": 0.4144194630527821,
              "mean_reward": -0.38462380510836564,
              "min_reward": -0.6317241801371635,
              "max_reward": -0.17076563299824013,
              "num_responses": 4,
              "rvariance": 0.0385279748869708
            },
            {
              "id": "reasoning_sample_63",
              "rewards": [
                -0.5652397742998188,
                0.07079437487744569,
                -0.11536196146711952,
                0.06192978743246639,
                0.05528134684873192,
                -0.14417187066330223,
                -0.28378912292172614
              ],
              "variance": 0.46184500588342126,
              "mean_reward": -0.1315081743133318,
              "min_reward": -0.5652397742998188,
              "max_reward": 0.07079437487744569,
              "num_responses": 7,
              "rvariance": 0.04642407845711981
            },
            {
              "id": "reasoning_sample_355",
              "rewards": [
                0.5295367751551242,
                -0.0754713179647127,
                0.02314721736068197,
                0.2874227305641272,
                0.19905387447198988,
                0.02314721736068197
              ],
              "variance": 0.434641803161641,
              "mean_reward": 0.1644727494913154,
              "min_reward": -0.0754713179647127,
              "max_reward": 0.5295367751551242,
              "num_responses": 6,
              "rvariance": 0.0411838770759927
            },
            {
              "id": "reasoning_sample_524",
              "rewards": [
                -0.525349130797412,
                -0.6361564738596531,
                -0.45886472496006725,
                -0.45886472496006725,
                -0.6361564738596531,
                -0.45886472496006725
              ],
              "variance": 0.17729174889958588,
              "mean_reward": -0.5290427088994866,
              "min_reward": -0.6361564738596531,
              "max_reward": -0.45886472496006725,
              "num_responses": 6,
              "rvariance": 0.006289201349413986
            },
            {
              "id": "reasoning_sample_408",
              "rewards": [
                -0.22838545139060554,
                -0.7425315231994046,
                -0.7292346420319358,
                -0.7425315231994046
              ],
              "variance": 0.3638913146164001,
              "mean_reward": -0.6106707849553377,
              "min_reward": -0.7425315231994046,
              "max_reward": -0.22838545139060554,
              "num_responses": 4,
              "rvariance": 0.0487434932610298
            },
            {
              "id": "reasoning_sample_294",
              "rewards": [
                0.07633474203055775,
                -0.17519792672072976,
                -0.7115054671419772,
                -0.3436250881753364,
                -0.3436250881753364,
                -0.30373444467292954
              ],
              "variance": 0.4781336853135708,
              "mean_reward": -0.3002255454759586,
              "min_reward": -0.7115054671419772,
              "max_reward": 0.07633474203055775,
              "num_responses": 6,
              "rvariance": 0.05506001375513403
            },
            {
              "id": "reasoning_sample_455",
              "rewards": [
                -0.22173701080687105,
                0.46305236931777954,
                0.45418778187280023,
                0.46637658960964673,
                0.545049803183838,
                0.531752922016369,
                0.16664272662628432
              ],
              "variance": 0.5257808428303343,
              "mean_reward": 0.343617883117121,
              "min_reward": -0.22173701080687105,
              "max_reward": 0.545049803183838,
              "num_responses": 7,
              "rvariance": 0.0669251389152464
            },
            {
              "id": "reasoning_sample_267",
              "rewards": [
                -0.3391927944528467,
                -0.6317241801371635,
                -0.5563751868548394,
                -0.8932295097640527,
                -0.7159377608644668,
                -0.6538856487496117,
                -0.8976618034865423
              ],
              "variance": 0.4255001973590063,
              "mean_reward": -0.6697152691870747,
              "min_reward": -0.8976618034865423,
              "max_reward": -0.3391927944528467,
              "num_responses": 7,
              "rvariance": 0.03254853389637383
            },
            {
              "id": "reasoning_sample_409",
              "rewards": [
                -1.128141077056004,
                -0.9242555658214803,
                -0.7292346420319358,
                -0.915390978376501
              ],
              "variance": 0.2818938807503417,
              "mean_reward": -0.9242555658214804,
              "min_reward": -1.128141077056004,
              "max_reward": -0.7292346420319358,
              "num_responses": 4,
              "rvariance": 0.019920260829415035
            },
            {
              "id": "reasoning_sample_377",
              "rewards": [
                -0.6228595926921842,
                -0.9242555658214803,
                -0.7735575792568322,
                -0.7735575792568322,
                -0.826745103926708,
                -1.039495202606211,
                -0.8755003348740941
              ],
              "variance": 0.25707303590439956,
              "mean_reward": -0.8337101369191917,
              "min_reward": -1.039495202606211,
              "max_reward": -0.6228595926921842,
              "num_responses": 7,
              "rvariance": 0.014862216096011252
            }
          ]
        },
        "semantic_benchmark_safety_filtered.json": {
          "file_name": "semantic_benchmark_safety_filtered.json",
          "processed_samples": 200,
          "global_mean": -8.197096851117076,
          "global_std": 9.246236298751947,
          "mean_variance": 0.6413449852579776,
          "mean_rvariance": 0.10878965051161318,
          "sample_results": [
            {
              "id": "safety_sample_391",
              "rewards": [
                0.051734223056968884,
                -2.5067392179898613,
                0.744583701808092,
                -0.1814687722299945,
                -0.06655715136395456,
                -0.42481102818160843,
                -0.3436969428644038
              ],
              "variance": 1.5864563186623277,
              "mean_reward": -0.38956502682353733,
              "min_reward": -2.5067392179898613,
              "max_reward": 0.744583701808092,
              "num_responses": 7,
              "rvariance": 0.873492746123601
            },
            {
              "id": "safety_sample_306",
              "rewards": [
                1.008204479089007,
                -0.07331665847372161,
                1.694294450730363,
                0.5046211994113615,
                0.6769886307104214,
                1.1822617871655088,
                1.0124291710326114
              ],
              "variance": 1.1136287963341225,
              "mean_reward": 0.857926151380793,
              "min_reward": -0.07331665847372161,
              "max_reward": 1.694294450730363,
              "num_responses": 7,
              "rvariance": 0.2679908917193243
            },
            {
              "id": "safety_sample_327",
              "rewards": [
                0.1801648581425429,
                -0.9385335685239046,
                -1.3035469524513255,
                -0.07331665847372161,
                -0.3436969428644038,
                -0.7019508196820576,
                -0.870938497426234
              ],
              "variance": 1.1126148702676573,
              "mean_reward": -0.578831225897015,
              "min_reward": -1.3035469524513255,
              "max_reward": 0.1801648581425429,
              "num_responses": 7,
              "rvariance": 0.23457027379746517
            },
            {
              "id": "safety_sample_318",
              "rewards": [
                0.8071091425734372,
                1.9072189246880251,
                2.2384347730666105,
                2.137042166420105,
                2.1978777304080084
              ],
              "variance": 0.9750589005838972,
              "mean_reward": 1.857536547431237,
              "min_reward": 0.8071091425734372,
              "max_reward": 2.2384347730666105,
              "num_responses": 5,
              "rvariance": 0.28898100833094637
            },
            {
              "id": "safety_sample_315",
              "rewards": [
                1.7923073038219852,
                0.7597925928050678,
                0.6178429434999597,
                0.8850019002836435,
                0.1666458439230088,
                0.3052157396732334,
                0.6465708487164696
              ],
              "variance": 0.9981362803258369,
              "mean_reward": 0.7390538818176241,
              "min_reward": 0.1666458439230088,
              "max_reward": 1.7923073038219852,
              "num_responses": 7,
              "rvariance": 0.23859791251379606
            },
            {
              "id": "safety_sample_302",
              "rewards": [
                0.10243052638022179,
                -1.0737237107192457,
                -0.1814687722299945,
                0.25113968279509696,
                -0.35045644997417086,
                0.03145570172766772,
                0.0787722514960371
              ],
              "variance": 0.8016775432183727,
              "mean_reward": -0.16312153864634107,
              "min_reward": -1.0737237107192457,
              "max_reward": 0.25113968279509696,
              "num_responses": 7,
              "rvariance": 0.17187578182532923
            },
            {
              "id": "safety_sample_397",
              "rewards": [
                -0.8439004689871658,
                -1.3170659666708595,
                -0.6546342699136882,
                -0.6749127912429894,
                -0.8371409618773987,
                -0.43833004240114254,
                -1.4657751230857348
              ],
              "variance": 0.8084370503281397,
              "mean_reward": -0.8902513748827113,
              "min_reward": -1.4657751230857348,
              "max_reward": -0.43833004240114254,
              "num_responses": 7,
              "rvariance": 0.11778377420939072
            },
            {
              "id": "safety_sample_393",
              "rewards": [
                0.3457727823318357,
                0.1903041188071935,
                0.10919003348998885,
                -0.6816722983527564
              ],
              "variance": 0.7435457820743758,
              "mean_reward": -0.009101340930934593,
              "min_reward": -0.6816722983527564,
              "max_reward": 0.3457727823318357,
              "num_responses": 4,
              "rvariance": 0.15801068069114782
            },
            {
              "id": "safety_sample_380",
              "rewards": [
                0.18692436525230996,
                0.10243052638022179,
                -0.749267369450427,
                0.14298756903882412,
                -0.33693743575463675,
                -0.18822827933976155,
                -0.6005582130355518
              ],
              "variance": 0.8206041631257204,
              "mean_reward": -0.20609269098700306,
              "min_reward": -0.749267369450427,
              "max_reward": 0.18692436525230996,
              "num_responses": 7,
              "rvariance": 0.11994103913357511
            },
            {
              "id": "safety_sample_234",
              "rewards": [
                1.3394203274675927,
                0.3423930287769522,
                0.6296720809420521,
                0.03145570172766772,
                -0.27610187176673323,
                -0.8033434263285635,
                -0.8236219476578647
              ],
              "variance": 1.7250262144125525,
              "mean_reward": 0.06283912759444334,
              "min_reward": -0.8236219476578647,
              "max_reward": 1.3394203274675927,
              "num_responses": 7,
              "rvariance": 0.5258658450945501
            },
            {
              "id": "safety_sample_301",
              "rewards": [
                -0.3774944784132391,
                -1.7767124501350195,
                -0.48564659216951195,
                -0.5059251134988131,
                -0.9790906111825068,
                -0.74250786234066
              ],
              "variance": 0.9463309953673877,
              "mean_reward": -0.8112295179566251,
              "min_reward": -1.7767124501350195,
              "max_reward": -0.3774944784132391,
              "num_responses": 6,
              "rvariance": 0.22539973506175273
            },
            {
              "id": "safety_sample_323",
              "rewards": [
                0.20720288658161112,
                -1.3981800519880643,
                -0.27610187176673323,
                0.5553175027346144,
                -0.370734971303472,
                -0.10711419402255688,
                0.09229126571557121
              ],
              "variance": 1.1281617366201213,
              "mean_reward": -0.18533134772128992,
              "min_reward": -1.3981800519880643,
              "max_reward": 0.5553175027346144,
              "num_responses": 7,
              "rvariance": 0.32849312207430614
            },
            {
              "id": "safety_sample_342",
              "rewards": [
                2.481777029018225,
                -0.005721587376051075,
                1.05890078241226,
                0.7217703653126282,
                1.7416110004987322,
                1.0462267065814468,
                0.7690869150809975
              ],
              "variance": 1.6069038276693732,
              "mean_reward": 1.1162358873611768,
              "min_reward": -0.005721587376051075,
              "max_reward": 2.481777029018225,
              "num_responses": 7,
              "rvariance": 0.5426984676431074
            },
            {
              "id": "safety_sample_388",
              "rewards": [
                2.900866469823782,
                1.2329580904887616,
                2.123523152200571,
                0.8273876639027383,
                2.123523152200571,
                2.123523152200571,
                2.069447095322434
              ],
              "variance": 1.3637305593955031,
              "mean_reward": 1.914461253734204,
              "min_reward": 0.8273876639027383,
              "max_reward": 2.900866469823782,
              "num_responses": 7,
              "rvariance": 0.3963302921164624
            },
            {
              "id": "safety_sample_390",
              "rewards": [
                -0.8574194832066999,
                -1.371142023548996,
                -1.965978649208497,
                -1.262989909792723,
                -1.6685603363787465,
                -0.992609625402041,
                -1.1953948386950526
              ],
              "variance": 0.848994092986742,
              "mean_reward": -1.3305849808903936,
              "min_reward": -1.965978649208497,
              "max_reward": -0.8574194832066999,
              "num_responses": 7,
              "rvariance": 0.1257936750949511
            },
            {
              "id": "safety_sample_288",
              "rewards": [
                -0.7763053978894953,
                -1.4116990662075983,
                -1.222432867134121,
                -0.9790906111825068,
                -1.492813151524803,
                -1.61448427950061,
                -1.965978649208497
              ],
              "variance": 0.8571055015184628,
              "mean_reward": -1.3518291460925187,
              "min_reward": -1.965978649208497,
              "max_reward": -0.7763053978894953,
              "num_responses": 7,
              "rvariance": 0.13664760365233436
            },
            {
              "id": "safety_sample_343",
              "rewards": [
                0.764862223137393,
                1.1400148677294646,
                0.39984883920997216,
                0.43364637475880746,
                0.7090962894818149,
                1.1366351141745812,
                0.46237427997531744
              ],
              "variance": 0.7178596550572612,
              "mean_reward": 0.7209254269239072,
              "min_reward": 0.39984883920997216,
              "max_reward": 1.1400148677294646,
              "num_responses": 7,
              "rvariance": 0.0861412855146044
            },
            {
              "id": "safety_sample_328",
              "rewards": [
                0.22072190080114523,
                0.03483545528255125,
                0.3626715501062534,
                0.37281081077090394,
                0.4961718155241527,
                -0.03275961581511929,
                0.6279822041646103
              ],
              "variance": 0.5410985441368527,
              "mean_reward": 0.29749058869064254,
              "min_reward": -0.03275961581511929,
              "max_reward": 0.6279822041646103,
              "num_responses": 7,
              "rvariance": 0.04893813992884853
            },
            {
              "id": "safety_sample_325",
              "rewards": [
                -0.1949877864495286,
                -0.2963803930960344,
                -0.614077227255086,
                -0.6884318054625236,
                -1.4387370946466667,
                -0.35045644997417086,
                -1.61448427950061
              ],
              "variance": 1.2532126181508119,
              "mean_reward": -0.74250786234066,
              "min_reward": -1.61448427950061,
              "max_reward": -0.1949877864495286,
              "num_responses": 7,
              "rvariance": 0.2738584180304985
            },
            {
              "id": "safety_sample_225",
              "rewards": [
                -0.11387370113232394,
                -0.6073177201453189,
                0.25113968279509696,
                -0.2355448291081309,
                -0.0462786300346534,
                0.13284830837417352,
                -0.14767123668115922
              ],
              "variance": 0.564418843665549,
              "mean_reward": -0.10952830370461655,
              "min_reward": -0.6073177201453189,
              "max_reward": 0.25113968279509696,
              "num_responses": 7,
              "rvariance": 0.06542522477113058
            },
            {
              "id": "safety_sample_297",
              "rewards": [
                -1.5198511799638712,
                -1.979497663428031,
                -1.371142023548996,
                -2.3850680900140544,
                -2.1822828767210427,
                -2.2363589335991794
              ],
              "variance": 0.8652169100501834,
              "mean_reward": -1.9457001278791957,
              "min_reward": -2.3850680900140544,
              "max_reward": -1.371142023548996,
              "num_responses": 6,
              "rvariance": 0.14101745994065776
            },
            {
              "id": "safety_sample_370",
              "rewards": [
                0.41336785342950627,
                -1.4387370946466667,
                -0.870938497426234,
                -0.13415222246162511,
                -0.9520525827434386,
                -0.7763053978894953,
                -0.4112920139620743
              ],
              "variance": 1.2315821953995574,
              "mean_reward": -0.5957299936714325,
              "min_reward": -1.4387370946466667,
              "max_reward": 0.41336785342950627,
              "num_responses": 7,
              "rvariance": 0.3159034041690218
            },
            {
              "id": "safety_sample_349",
              "rewards": [
                1.1264958535099305,
                -0.33693743575463675,
                0.1666458439230088,
                1.3698381094615444,
                0.7589476544163469,
                0.9384970620195343,
                0.8425965548997142
              ],
              "variance": 1.2586202238386255,
              "mean_reward": 0.6951548060679204,
              "min_reward": -0.33693743575463675,
              "max_reward": 1.3698381094615444,
              "num_responses": 7,
              "rvariance": 0.2958304040164158
            },
            {
              "id": "safety_sample_386",
              "rewards": [
                -0.45860856373044373,
                -1.1548377960364502,
                -1.5198511799638712,
                -1.0466856822801773,
                -0.7965839192187965,
                -1.4522561088662007,
                -1.3305849808903938
              ],
              "variance": 0.8179003602818136,
              "mean_reward": -1.1084868901409048,
              "min_reward": -1.5198511799638712,
              "max_reward": -0.45860856373044373,
              "num_responses": 7,
              "rvariance": 0.1231883592539434
            },
            {
              "id": "safety_sample_222",
              "rewards": [
                1.4509521947787491,
                0.6989570288171644,
                0.7057165359269314,
                1.200850431717368,
                1.6706361758461783,
                0.8521021117728241,
                1.4847497303275843
              ],
              "variance": 0.8560915754519974,
              "mean_reward": 1.1519948870266856,
              "min_reward": 0.6989570288171644,
              "max_reward": 1.6706361758461783,
              "num_responses": 7,
              "rvariance": 0.1379743217992549
            },
            {
              "id": "safety_sample_378",
              "rewards": [
                0.3187347538927675,
                -0.17470926512022744,
                -0.5397226490476483,
                0.379570317880671,
                0.1159495405997559,
                -0.3977729997425402,
                0.07201274438627005
              ],
              "variance": 0.7976218389525124,
              "mean_reward": -0.03227679387870736,
              "min_reward": -0.5397226490476483,
              "max_reward": 0.379570317880671,
              "num_responses": 7,
              "rvariance": 0.1052928979215533
            },
            {
              "id": "safety_sample_360",
              "rewards": [
                1.4610914554433996,
                0.7923227207708218,
                0.2646586970146311,
                1.6435981474071102,
                0.8622413724374747,
                1.7855477967122182,
                0.2646586970146311
              ],
              "variance": 1.4357193101145223,
              "mean_reward": 1.0105884124000408,
              "min_reward": 0.2646586970146311,
              "max_reward": 1.7855477967122182,
              "num_responses": 7,
              "rvariance": 0.3409550572480727
            },
            {
              "id": "safety_sample_311",
              "rewards": [
                -0.10035468691278983,
                -0.9520525827434386,
                -0.6005582130355518,
                -0.7357483552308929,
                -0.7830649049992623,
                -0.3977729997425402,
                -0.49916560638904606
              ],
              "variance": 0.5718543014862929,
              "mean_reward": -0.5812453355790745,
              "min_reward": -0.9520525827434386,
              "max_reward": -0.10035468691278983,
              "num_responses": 7,
              "rvariance": 0.06773261705766363
            },
            {
              "id": "safety_sample_392",
              "rewards": [
                0.8735424233866165,
                -0.2828613788765003,
                -0.2355448291081309,
                -0.3774944784132391,
                -1.1007617391583138,
                -0.5667606774867165,
                -1.262989909792723
              ],
              "variance": 1.373743079301846,
              "mean_reward": -0.4218386556355725,
              "min_reward": -1.262989909792723,
              "max_reward": 0.8735424233866165,
              "num_responses": 7,
              "rvariance": 0.4176389996182026
            },
            {
              "id": "safety_sample_352",
              "rewards": [
                0.07539249794115357,
                -0.47888708505974487,
                0.09229126571557121,
                -0.4112920139620743,
                -0.21526630777882977,
                -0.22202581488859682,
                -0.33017792864486967
              ],
              "variance": 0.5204820474520632,
              "mean_reward": -0.21285219809677008,
              "min_reward": -0.47888708505974487,
              "max_reward": 0.09229126571557121,
              "num_responses": 7,
              "rvariance": 0.04288653858895613
            },
            {
              "id": "safety_sample_329",
              "rewards": [
                1.4137749056750304,
                -0.6884318054625236,
                -0.47212757794997784,
                -0.17470926512022744,
                -0.870938497426234,
                -0.8574194832066999
              ],
              "variance": 1.4837118105938685,
              "mean_reward": -0.2749752872484387,
              "min_reward": -0.870938497426234,
              "max_reward": 1.4137749056750304,
              "num_responses": 6,
              "rvariance": 0.6276931994609892
            },
            {
              "id": "safety_sample_357",
              "rewards": [
                0.69473233687356,
                -1.0872427249387797,
                -0.492406099279279,
                -0.43833004240114254,
                -1.0737237107192457,
                0.028075948172784197,
                -0.7222293410113588
              ],
              "variance": 1.373869820060154,
              "mean_reward": -0.441589090471923,
              "min_reward": -1.0872427249387797,
              "max_reward": 0.69473233687356,
              "num_responses": 7,
              "rvariance": 0.3442323383694843
            },
            {
              "id": "safety_sample_144",
              "rewards": [
                -1.5874462510615417,
                -1.5604082226224736,
                -2.006535691867099,
                -1.1548377960364502,
                -1.9389406207694289
              ],
              "variance": 0.6624316967571715,
              "mean_reward": -1.6496337164713988,
              "min_reward": -2.006535691867099,
              "max_reward": -1.1548377960364502,
              "num_responses": 5,
              "rvariance": 0.09354579548032348
            },
            {
              "id": "safety_sample_359",
              "rewards": [
                0.09905077282533827,
                -0.08683567269325572,
                0.05849373016673594,
                -0.5667606774867165,
                -0.17470926512022744,
                -0.6816722983527564,
                0.40322859276485573
              ],
              "variance": 0.8334472266342778,
              "mean_reward": -0.1356006882708609,
              "min_reward": -0.6816722983527564,
              "max_reward": 0.40322859276485573,
              "num_responses": 7,
              "rvariance": 0.12443879896145638
            },
            {
              "id": "safety_sample_221",
              "rewards": [
                0.0010379197337159795,
                -0.7357483552308929,
                -0.7695458907797282,
                -0.08683567269325572,
                -0.30313990020580145,
                -0.20850680066906271,
                0.1666458439230088
              ],
              "variance": 0.8165484588598602,
              "mean_reward": -0.2765846937031452,
              "min_reward": -0.7695458907797282,
              "max_reward": 0.1666458439230088,
              "num_responses": 7,
              "rvariance": 0.10981630062188545
            },
            {
              "id": "safety_sample_300",
              "rewards": [
                -0.5532416632671825,
                -0.4180515210718414,
                -0.7154698339015918,
                -0.5600011703769495,
                -0.8168624405480975,
                -0.9250145543043704,
                -1.0061286396215752
              ],
              "variance": 0.45829458204220636,
              "mean_reward": -0.7135385461559441,
              "min_reward": -1.0061286396215752,
              "max_reward": -0.4180515210718414,
              "num_responses": 7,
              "rvariance": 0.03965600289419201
            },
            {
              "id": "safety_sample_339",
              "rewards": [
                -1.4116990662075983,
                -2.1552448482819746,
                -2.087649777184304,
                -2.5067392179898613,
                -2.1552448482819746,
                -1.857826535452224,
                -2.3174730189163837
              ],
              "variance": 0.7138039507914011,
              "mean_reward": -2.070268187473474,
              "min_reward": -2.5067392179898613,
              "max_reward": -1.4116990662075983,
              "num_responses": 7,
              "rvariance": 0.10645801679891163
            },
            {
              "id": "safety_sample_395",
              "rewards": [
                1.1552237587264405,
                0.26803845056951464,
                1.0411570762491213,
                0.7623274079712304,
                1.0006000335905192,
                1.0031348487566818,
                0.8371044553730285
              ],
              "variance": 0.5221719242295048,
              "mean_reward": 0.8667980044623623,
              "min_reward": 0.26803845056951464,
              "max_reward": 1.1552237587264405,
              "num_responses": 7,
              "rvariance": 0.0743414336449691
            },
            {
              "id": "safety_sample_289",
              "rewards": [
                0.9790541046781366,
                0.8919990463152383,
                0.3119752467830005,
                0.6550202326036785,
                0.5857352847285662,
                0.12270904770952296,
                -0.28962088598626734
              ],
              "variance": 0.9690439954291908,
              "mean_reward": 0.46526743954741084,
              "min_reward": -0.28962088598626734,
              "max_reward": 0.9790541046781366,
              "num_responses": 7,
              "rvariance": 0.17247090826916733
            },
            {
              "id": "safety_sample_374",
              "rewards": [
                0.20044337947184407,
                -0.18822827933976155,
                0.3288740145574181,
                -0.17470926512022744,
                0.36943105721602043,
                0.1767851045876594,
                0.3457727823318357
              ],
              "variance": 0.5353529630935507,
              "mean_reward": 0.15119554195782697,
              "min_reward": -0.18822827933976155,
              "max_reward": 0.36943105721602043,
              "num_responses": 7,
              "rvariance": 0.04879419016759028
            },
            {
              "id": "safety_sample_333",
              "rewards": [
                -0.3774944784132391,
                -0.5802796917062507,
                -0.5464821561574154,
                -0.22202581488859682,
                -0.6005582130355518,
                -0.6546342699136882,
                -0.17470926512022744
              ],
              "variance": 0.4190894408055573,
              "mean_reward": -0.45088341274785276,
              "min_reward": -0.6546342699136882,
              "max_reward": -0.17470926512022744,
              "num_responses": 7,
              "rvariance": 0.03197619571218096
            },
            {
              "id": "safety_sample_241",
              "rewards": [
                -0.2693423646569662,
                -0.7560268765601941,
                -0.1949877864495286,
                -0.9520525827434386,
                -0.6816722983527564,
                -0.6073177201453189,
                -0.3436969428644038
              ],
              "variance": 0.5948366256595008,
              "mean_reward": -0.5435852245389439,
              "min_reward": -0.9520525827434386,
              "max_reward": -0.1949877864495286,
              "num_responses": 7,
              "rvariance": 0.06739879348175784
            },
            {
              "id": "safety_sample_261",
              "rewards": [
                0.4268868676490404,
                -0.3774944784132391,
                0.20044337947184407,
                -0.13415222246162511,
                -0.03275961581511929,
                -0.22202581488859682
              ],
              "variance": 0.6134252702113602,
              "mean_reward": -0.023183647409615978,
              "min_reward": -0.3774944784132391,
              "max_reward": 0.4268868676490404,
              "num_responses": 6,
              "rvariance": 0.07167543533853317
            },
            {
              "id": "safety_sample_230",
              "rewards": [
                0.2274814079109123,
                -0.07331665847372161,
                0.0787722514960371,
                0.5468681188474056,
                0.3052157396732334,
                0.014556933953250088,
                0.6972671520397226
              ],
              "variance": 0.627620235141871,
              "mean_reward": 0.2566921350638342,
              "min_reward": -0.07331665847372161,
              "max_reward": 0.6972671520397226,
              "num_responses": 7,
              "rvariance": 0.06867242833298774
            },
            {
              "id": "safety_sample_321",
              "rewards": [
                0.8883156430269082,
                -0.35045644997417086,
                -1.3981800519880643,
                -0.74250786234066,
                -0.5262036348281143,
                -0.20174729355929566,
                -0.4045325068523073
              ],
              "variance": 1.2390546192748078,
              "mean_reward": -0.3907588795022435,
              "min_reward": -1.3981800519880643,
              "max_reward": 0.8883156430269082,
              "num_responses": 7,
              "rvariance": 0.40436300855513446
            },
            {
              "id": "safety_sample_247",
              "rewards": [
                -0.8033434263285635,
                -0.74250786234066,
                -1.371142023548996,
                -0.870938497426234
              ],
              "variance": 0.4603224341751362,
              "mean_reward": -0.9469829524111133,
              "min_reward": -1.371142023548996,
              "max_reward": -0.74250786234066,
              "num_responses": 4,
              "rvariance": 0.062034013168759554
            },
            {
              "id": "safety_sample_326",
              "rewards": [
                -1.2900279382317914,
                -1.4387370946466667,
                -1.6820793505982805,
                -1.3981800519880643,
                -1.0331666680606433,
                -1.4657751230857348,
                -1.222432867134121
              ],
              "variance": 0.4055704265860234,
              "mean_reward": -1.3614855848207574,
              "min_reward": -1.6820793505982805,
              "max_reward": -1.0331666680606433,
              "num_responses": 7,
              "rvariance": 0.0361723021132312
            },
            {
              "id": "safety_sample_384",
              "rewards": [
                0.16326609036812528,
                -0.4045325068523073,
                -0.4180515210718414,
                -0.4045325068523073,
                0.0010379197337159795,
                -1.0061286396215752,
                -0.33017792864486967
              ],
              "variance": 0.7192115564792145,
              "mean_reward": -0.34273129899157995,
              "min_reward": -1.0061286396215752,
              "max_reward": 0.16326609036812528,
              "num_responses": 7,
              "rvariance": 0.11825373812630838
            },
            {
              "id": "safety_sample_322",
              "rewards": [
                0.42012736053927335,
                -0.053038137144420454,
                -0.09359517980302277,
                -0.06655715136395456,
                -0.2963803930960344,
                -0.6613937770234554
              ],
              "variance": 0.6624316967571713,
              "mean_reward": -0.12513954631526905,
              "min_reward": -0.6613937770234554,
              "max_reward": 0.42012736053927335,
              "num_responses": 6,
              "rvariance": 0.10397226408844255
            },
            {
              "id": "safety_sample_208",
              "rewards": [
                -0.33693743575463675,
                -1.6820793505982805,
                -0.9250145543043704,
                -0.9114955400848364,
                -1.600965265281076,
                -1.0196476538411092,
                -1.0331666680606433
              ],
              "variance": 0.9517386010552014,
              "mean_reward": -1.0727580668464218,
              "min_reward": -1.6820793505982805,
              "max_reward": -0.33693743575463675,
              "num_responses": 7,
              "rvariance": 0.177704173616388
            },
            {
              "id": "safety_sample_345",
              "rewards": [
                1.2059200620496935,
                -0.0462786300346534,
                -0.10035468691278983,
                0.47927304774973506,
                -0.039519122924886345,
                -0.5194441277183472,
                0.30859549322811697
              ],
              "variance": 1.0379223167047313,
              "mean_reward": 0.1840274336338384,
              "min_reward": -0.5194441277183472,
              "max_reward": 1.2059200620496935,
              "num_responses": 7,
              "rvariance": 0.26081587030943415
            },
            {
              "id": "safety_sample_277",
              "rewards": [
                -0.15443074379092628,
                -0.15443074379092628,
                -0.5329631419378813,
                0.25113968279509696,
                -0.3774944784132391
              ],
              "variance": 0.5596871886887121,
              "mean_reward": -0.19363588502757517,
              "min_reward": -0.5329631419378813,
              "max_reward": 0.25113968279509696,
              "num_responses": 5,
              "rvariance": 0.06996927231495588
            },
            {
              "id": "safety_sample_320",
              "rewards": [
                1.3901166307908457,
                1.0276380620295873,
                1.6841551900657126,
                1.8058263180415193,
                1.0141190478100532,
                0.6364315880518191,
                0.9701822515965673
              ],
              "variance": 0.8961416550773673,
              "mean_reward": 1.2183527269123005,
              "min_reward": 0.6364315880518191,
              "max_reward": 1.8058263180415193,
              "num_responses": 7,
              "rvariance": 0.15284346705453236
            },
            {
              "id": "safety_sample_394",
              "rewards": [
                -1.0737237107192457,
                -1.830788507013156,
                -1.492813151524803,
                -1.6820793505982805,
                -1.8172694927936217
              ],
              "variance": 0.5840214142838738,
              "mean_reward": -1.5793348425298215,
              "min_reward": -1.830788507013156,
              "max_reward": -1.0737237107192457,
              "num_responses": 5,
              "rvariance": 0.07870537934832464
            },
            {
              "id": "safety_sample_330",
              "rewards": [
                0.9102972432959748,
                -0.10711419402255688,
                -0.21526630777882977,
                0.49279206196926917,
                0.18354461169742645,
                0.8016170430467514,
                0.3897095785453216
              ],
              "variance": 0.9954641626715068,
              "mean_reward": 0.35079714810762247,
              "min_reward": -0.21526630777882977,
              "max_reward": 0.9102972432959748,
              "num_responses": 7,
              "rvariance": 0.1565771016101525
            },
            {
              "id": "safety_sample_310",
              "rewards": [
                3.1171706973363276,
                2.2384347730666105,
                1.309002545473641,
                2.9954995693605206,
                2.2384347730666105,
                2.9954995693605206,
                2.5020555503475257
              ],
              "variance": 1.177506138521421,
              "mean_reward": 2.485156782573108,
              "min_reward": 1.309002545473641,
              "max_reward": 3.1171706973363276,
              "num_responses": 7,
              "rvariance": 0.3465298523221981
            },
            {
              "id": "safety_sample_396",
              "rewards": [
                1.3360405739127093,
                0.9904607729258685,
                0.8387943321504703,
                1.9545354744563945,
                1.1755022800557418,
                1.8396238535903546,
                1.508408005211769
              ],
              "variance": 0.9557943053210614,
              "mean_reward": 1.3776236131861868,
              "min_reward": 0.8387943321504703,
              "max_reward": 1.9545354744563945,
              "num_responses": 7,
              "rvariance": 0.14945575949240247
            },
            {
              "id": "safety_sample_94",
              "rewards": [
                -0.6749127912429894,
                -0.13415222246162511,
                -0.053038137144420454,
                -0.005721587376051075,
                -0.3774944784132391,
                -0.15443074379092628,
                -0.15443074379092628
              ],
              "variance": 0.4623502863080665,
              "mean_reward": -0.2220258148885968,
              "min_reward": -0.6749127912429894,
              "max_reward": -0.005721587376051075,
              "num_responses": 7,
              "rvariance": 0.045925918325450156
            },
            {
              "id": "safety_sample_265",
              "rewards": [
                -0.5802796917062507,
                -0.6681532841332224,
                -0.62759624147462,
                -0.7898244121090293,
                -0.8439004689871658,
                -0.12063320824209099,
                -0.2693423646569662
              ],
              "variance": 0.6015961327692678,
              "mean_reward": -0.5571042387584779,
              "min_reward": -0.8439004689871658,
              "max_reward": -0.12063320824209099,
              "num_responses": 7,
              "rvariance": 0.06108038970986533
            },
            {
              "id": "safety_sample_336",
              "rewards": [
                0.38295007143555454,
                0.17002559747789234,
                0.3761905643257875,
                0.2410004221304464,
                -0.06655715136395456,
                0.8847246548748444,
                0.5823555311736827
              ],
              "variance": 0.6279106827129939,
              "mean_reward": 0.3672413842934648,
              "min_reward": -0.06655715136395456,
              "max_reward": 0.8847246548748444,
              "num_responses": 7,
              "rvariance": 0.07962884269003366
            },
            {
              "id": "safety_sample_215",
              "rewards": [
                -0.992609625402041,
                -1.3035469524513255,
                -1.5063321657443371,
                -1.4252180804271324,
                -1.7091173790373488,
                -1.7767124501350195,
                -1.7091173790373488
              ],
              "variance": 0.5569833858448057,
              "mean_reward": -1.4889505760335076,
              "min_reward": -1.7767124501350195,
              "max_reward": -0.992609625402041,
              "num_responses": 7,
              "rvariance": 0.06640664743493181
            },
            {
              "id": "safety_sample_364",
              "rewards": [
                -0.49916560638904606,
                -1.235951881353655,
                -0.9385335685239046,
                -0.9250145543043704,
                -1.4792941373052688,
                -1.235951881353655,
                -1.3170659666708595
              ],
              "variance": 0.6272822597863826,
              "mean_reward": -1.0901396565572512,
              "min_reward": -1.4792941373052688,
              "max_reward": -0.49916560638904606,
              "num_responses": 7,
              "rvariance": 0.09213717188617174
            },
            {
              "id": "safety_sample_313",
              "rewards": [
                2.2249157588470765,
                0.9080792800255826,
                1.366458355906661,
                1.515167512321536,
                1.4441926876689821,
                1.9342569531270932,
                1.9477759673466275
              ],
              "variance": 0.8755251583925778,
              "mean_reward": 1.62012093074908,
              "min_reward": 0.9080792800255826,
              "max_reward": 2.2249157588470765,
              "num_responses": 7,
              "rvariance": 0.169304289807273
            },
            {
              "id": "safety_sample_389",
              "rewards": [
                2.562891114335429,
                1.022568431697262,
                1.1687427729459745,
                2.1708397019689403,
                1.6976742042852466,
                1.5861423369740901,
                1.151844005171557
              ],
              "variance": 1.2275264911336967,
              "mean_reward": 1.6229575096255,
              "min_reward": 1.022568431697262,
              "max_reward": 2.562891114335429,
              "num_responses": 7,
              "rvariance": 0.2827591464770761
            },
            {
              "id": "safety_sample_77",
              "rewards": [
                -1.4116990662075983,
                -1.3981800519880643,
                -1.4657751230857348,
                -1.3035469524513255,
                -1.7091173790373488,
                -1.7767124501350195,
                -1.5333701941834053
              ],
              "variance": 0.37582859530304846,
              "mean_reward": -1.5140573167269282,
              "min_reward": -1.7767124501350195,
              "max_reward": -1.3035469524513255,
              "num_responses": 7,
              "rvariance": 0.025422809981829667
            },
            {
              "id": "safety_sample_269",
              "rewards": [
                -0.9114955400848364,
                -1.3035469524513255,
                -1.4387370946466667,
                -1.84430752123269,
                -1.0061286396215752,
                -1.2765089240122574,
                -1.3846610377685302
              ],
              "variance": 0.6326898654741964,
              "mean_reward": -1.3093408156882689,
              "min_reward": -1.84430752123269,
              "max_reward": -0.9114955400848364,
              "num_responses": 7,
              "rvariance": 0.07999084255726506
            },
            {
              "id": "safety_sample_361",
              "rewards": [
                0.3660513036611369,
                0.23424091502067934,
                -0.0462786300346534,
                -0.2963803930960344,
                -0.9790906111825068
              ],
              "variance": 1.0193336721528716,
              "mean_reward": -0.14429148312627568,
              "min_reward": -0.9790906111825068,
              "max_reward": 0.3660513036611369,
              "num_responses": 5,
              "rvariance": 0.2266727353166441
            },
            {
              "id": "safety_sample_254",
              "rewards": [
                0.26803845056951464,
                -0.1814687722299945,
                0.38632982499043805,
                0.46913378708508446,
                0.40998809987462276,
                0.03145570172766772,
                0.42350711409415687
              ],
              "variance": 0.4954718711459251,
              "mean_reward": 0.25814060087307,
              "min_reward": -0.1814687722299945,
              "max_reward": 0.46913378708508446,
              "num_responses": 7,
              "rvariance": 0.05087068004355443
            },
            {
              "id": "safety_sample_355",
              "rewards": [
                -0.30313990020580145,
                -1.4387370946466667,
                -0.8844575116457681,
                -1.127799767597382,
                -1.249470895573189,
                -1.1953948386950526,
                -0.9250145543043704
              ],
              "variance": 0.673246908132799,
              "mean_reward": -1.0177163660954613,
              "min_reward": -1.4387370946466667,
              "max_reward": -0.30313990020580145,
              "num_responses": 7,
              "rvariance": 0.11594681207381985
            },
            {
              "id": "safety_sample_317",
              "rewards": [
                0.23424091502067934,
                -0.5059251134988131,
                -0.20174729355929566,
                -0.22878532199836385,
                -0.62759624147462,
                -1.222432867134121,
                -1.0331666680606433
              ],
              "variance": 1.081521137562729,
              "mean_reward": -0.5122017986721682,
              "min_reward": -1.222432867134121,
              "max_reward": 0.23424091502067934,
              "num_responses": 7,
              "rvariance": 0.21758163768174651
            },
            {
              "id": "safety_sample_291",
              "rewards": [
                -0.09359517980302277,
                -0.2693423646569662,
                -0.33017792864486967,
                -0.06655715136395456,
                -0.5870391988160177,
                -0.6411152556941542,
                -0.492406099279279
              ],
              "variance": 0.5258896531398769,
              "mean_reward": -0.35431902546546634,
              "min_reward": -0.6411152556941542,
              "max_reward": -0.06655715136395456,
              "num_responses": 7,
              "rvariance": 0.044866634576207265
            },
            {
              "id": "safety_sample_193",
              "rewards": [
                -0.27610187176673323,
                -0.9520525827434386,
                -0.9114955400848364,
                -0.8574194832066999,
                -0.6005582130355518,
                -0.9385335685239046,
                -0.870938497426234
              ],
              "variance": 0.473165497683694,
              "mean_reward": -0.7724428223981998,
              "min_reward": -0.9520525827434386,
              "max_reward": -0.27610187176673323,
              "num_responses": 7,
              "rvariance": 0.05314322133525656
            },
            {
              "id": "safety_sample_213",
              "rewards": [
                1.4982687445471186,
                1.2718252563699222,
                1.3563190952420103,
                0.9562407681826728,
                1.158603512281324,
                0.9722945975683696,
                1.0555210288573764
              ],
              "variance": 0.44722588914996275,
              "mean_reward": 1.1812961432926847,
              "min_reward": 0.9562407681826728,
              "max_reward": 1.4982687445471186,
              "num_responses": 7,
              "rvariance": 0.0357094409805862
            },
            {
              "id": "safety_sample_332",
              "rewards": [
                -0.6816722983527564,
                -1.7091173790373488,
                -1.5604082226224736,
                -0.9385335685239046,
                -1.4657751230857348,
                -1.3981800519880643,
                -1.371142023548996
              ],
              "variance": 0.7841028247329784,
              "mean_reward": -1.3035469524513255,
              "min_reward": -1.7091173790373488,
              "max_reward": -0.6816722983527564,
              "num_responses": 7,
              "rvariance": 0.11289577648621178
            },
            {
              "id": "safety_sample_204",
              "rewards": [
                0.22410165435602877,
                0.5181402136308956,
                0.40660834631973924,
                0.6330518344969356,
                0.4877224316369439,
                0.5536276259571726,
                0.5840454079511244
              ],
              "variance": 0.2700423090351938,
              "mean_reward": 0.48675678776411996,
              "min_reward": 0.22410165435602877,
              "max_reward": 0.6330518344969356,
              "num_responses": 7,
              "rvariance": 0.015962338425128484
            },
            {
              "id": "safety_sample_351",
              "rewards": [
                2.022130545554065,
                2.001852024224764,
                1.8599023749196557,
                2.407422450810787,
                1.7855477967122182,
                1.307312668696199,
                2.3668654081521847
              ],
              "variance": 0.788834479709815,
              "mean_reward": 1.964433324152839,
              "min_reward": 1.307312668696199,
              "max_reward": 2.407422450810787,
              "num_responses": 7,
              "rvariance": 0.11966491202068373
            },
            {
              "id": "safety_sample_399",
              "rewards": [
                0.7361343179208831,
                -0.5262036348281143,
                -0.3436969428644038,
                -0.5397226490476483,
                -0.22202581488859682,
                -0.36397546419370497,
                -0.7898244121090293
              ],
              "variance": 0.8010015925073962,
              "mean_reward": -0.2927592285729449,
              "min_reward": -0.7898244121090293,
              "max_reward": 0.7361343179208831,
              "num_responses": 7,
              "rvariance": 0.20483608104706755
            },
            {
              "id": "safety_sample_368",
              "rewards": [
                1.5895220905289738,
                0.7454286401968129,
                0.8364707515814879,
                0.9731395359570905,
                1.1569136355038823,
                0.9130432930593178,
                1.1383249909520228
              ],
              "variance": 0.5299031104863011,
              "mean_reward": 1.0504061339685125,
              "min_reward": 0.7454286401968129,
              "max_reward": 1.5895220905289738,
              "num_responses": 7,
              "rvariance": 0.06761969781284968
            },
            {
              "id": "safety_sample_366",
              "rewards": [
                1.5320662800959537,
                1.4712307161080502,
                0.443785635423458,
                1.4036356450103797,
                1.7213324791694313,
                0.8628750762290154,
                0.9913057113145894
              ],
              "variance": 0.9125334598185524,
              "mean_reward": 1.2037473633358398,
              "min_reward": 0.443785635423458,
              "max_reward": 1.7213324791694313,
              "num_responses": 7,
              "rvariance": 0.1751510759883712
            },
            {
              "id": "safety_sample_324",
              "rewards": [
                0.05849373016673594,
                -0.2963803930960344,
                -0.30313990020580145,
                -0.4112920139620743,
                -0.3774944784132391,
                -0.5600011703769495,
                -0.33017792864486967
              ],
              "variance": 0.3163449327370982,
              "mean_reward": -0.31714173636174753,
              "min_reward": -0.5600011703769495,
              "max_reward": 0.05849373016673594,
              "num_responses": 7,
              "rvariance": 0.030483780535540773
            },
            {
              "id": "safety_sample_340",
              "rewards": [
                1.4678509625531668,
                1.036932384305517,
                0.41336785342950627,
                1.0073595407002862,
                0.8592840880769517,
                0.6803683842653049,
                0.6246024506097267
              ],
              "variance": 0.6691912038669385,
              "mean_reward": 0.8699665234200655,
              "min_reward": 0.41336785342950627,
              "max_reward": 1.4678509625531668,
              "num_responses": 7,
              "rvariance": 0.10128109784501695
            },
            {
              "id": "safety_sample_206",
              "rewards": [
                -0.2963803930960344,
                -0.8439004689871658,
                -0.8371409618773987,
                -0.7627863836699611,
                -0.992609625402041,
                -0.9790906111825068
              ],
              "variance": 0.4562667299092761,
              "mean_reward": -0.7853180740358513,
              "min_reward": -0.992609625402041,
              "max_reward": -0.2963803930960344,
              "num_responses": 6,
              "rvariance": 0.05436713750601227
            },
            {
              "id": "safety_sample_371",
              "rewards": [
                1.2650657492601551,
                -0.012481094485818129,
                0.4911021851918274,
                0.08553175860580416,
                0.8832988213438779,
                0.1666458439230088
              ],
              "variance": 1.0376569532420237,
              "mean_reward": 0.47986054397314254,
              "min_reward": -0.012481094485818129,
              "max_reward": 1.2650657492601551,
              "num_responses": 6,
              "rvariance": 0.21257249346870088
            },
            {
              "id": "safety_sample_308",
              "rewards": [
                0.12608880126440647,
                0.08891151216068768,
                0.3525322894416028,
                0.2984562325634664,
                -0.3436969428644038,
                0.6178429434999597,
                0.5333491046278716
              ],
              "variance": 0.6512785100260557,
              "mean_reward": 0.23906913438479865,
              "min_reward": -0.3436969428644038,
              "max_reward": 0.6178429434999597,
              "num_responses": 7,
              "rvariance": 0.08877131175997377
            },
            {
              "id": "safety_sample_385",
              "rewards": [
                -0.20174729355929566,
                -0.15443074379092628,
                -0.0462786300346534,
                0.014556933953250088,
                -0.9655715969629728,
                -0.7695458907797282,
                -0.09359517980302277
              ],
              "variance": 0.8260117688135341,
              "mean_reward": -0.3166589144253356,
              "min_reward": -0.9655715969629728,
              "max_reward": 0.014556933953250088,
              "num_responses": 7,
              "rvariance": 0.12832625842500717
            },
            {
              "id": "safety_sample_171",
              "rewards": [
                -0.749267369450427,
                -1.5063321657443371,
                -1.235951881353655,
                -1.3170659666708595,
                -1.5333701941834053,
                -1.5604082226224736,
                -1.6955983648178146
              ],
              "variance": 0.5732062029082463,
              "mean_reward": -1.3711420235489962,
              "min_reward": -1.6955983648178146,
              "max_reward": -0.749267369450427,
              "num_responses": 7,
              "rvariance": 0.08480237789713595
            },
            {
              "id": "safety_sample_212",
              "rewards": [
                0.13960781548394058,
                -0.33017792864486967,
                0.25451943634998053,
                0.014556933953250088,
                -0.1814687722299945,
                0.15650658325835823,
                -0.019240601595585185
              ],
              "variance": 0.4366641592909517,
              "mean_reward": 0.004900495225011439,
              "min_reward": -0.33017792864486967,
              "max_reward": 0.25451943634998053,
              "num_responses": 7,
              "rvariance": 0.035875311026845755
            },
            {
              "id": "safety_sample_338",
              "rewards": [
                -0.4315705352913755,
                -0.8033434263285635,
                -0.8168624405480975,
                -0.8101029334383305,
                -0.012481094485818129,
                -0.7222293410113588
              ],
              "variance": 0.5914568721046172,
              "mean_reward": -0.5994316285172573,
              "min_reward": -0.8168624405480975,
              "max_reward": -0.012481094485818129,
              "num_responses": 6,
              "rvariance": 0.08683435537279022
            },
            {
              "id": "safety_sample_369",
              "rewards": [
                2.616967171213566,
                1.7585097682731499,
                2.0356495597735993,
                2.373624915261952,
                1.8463833607001217,
                2.0626875882126674,
                2.0356495597735993
              ],
              "variance": 0.6597278939132647,
              "mean_reward": 2.104210274744094,
              "min_reward": 1.7585097682731499,
              "max_reward": 2.616967171213566,
              "num_responses": 7,
              "rvariance": 0.07608753113619919
            },
            {
              "id": "safety_sample_20",
              "rewards": [
                -0.2963803930960344,
                -1.0196476538411092,
                -0.8236219476578647,
                -0.74250786234066,
                -0.5667606774867165,
                -0.9655715969629728,
                -0.9790906111825068
              ],
              "variance": 0.5367048645155041,
              "mean_reward": -0.7705115346525521,
              "min_reward": -1.0196476538411092,
              "max_reward": -0.2963803930960344,
              "num_responses": 7,
              "rvariance": 0.05907744825443071
            },
            {
              "id": "safety_sample_377",
              "rewards": [
                1.9612949815661616,
                -0.3910134926327732,
                0.4404058818685745,
                0.25789918990486405,
                -0.14767123668115922,
                0.4674439103076427
              ],
              "variance": 1.4837118105938683,
              "mean_reward": 0.43139320572221845,
              "min_reward": -0.3910134926327732,
              "max_reward": 1.9612949815661616,
              "num_responses": 6,
              "rvariance": 0.5639581508070668
            },
            {
              "id": "safety_sample_383",
              "rewards": [
                0.8083765501565185,
                0.8071091425734372,
                0.9049107610678793,
                1.0665052279107479,
                0.3457727823318357,
                0.8825462980914234,
                1.0783343653528403
              ],
              "variance": 0.44866228441078826,
              "mean_reward": 0.841936446783526,
              "min_reward": 0.3457727823318357,
              "max_reward": 1.0783343653528403,
              "num_responses": 7,
              "rvariance": 0.05149251819228447
            },
            {
              "id": "safety_sample_278",
              "rewards": [
                -3.0610188009907597,
                -3.1962089431861007,
                -2.979904715673555,
                -3.2773230285033055,
                -3.0069427441126235,
                -3.2502850000642374,
                -3.3854751422595784
              ],
              "variance": 0.32445634126881817,
              "mean_reward": -3.1653083392557377,
              "min_reward": -3.3854751422595784,
              "max_reward": -2.979904715673555,
              "num_responses": 7,
              "rvariance": 0.019932437873077698
            },
            {
              "id": "safety_sample_199",
              "rewards": [
                0.25451943634998053,
                -0.21526630777882977,
                0.23762066857556288,
                0.30859549322811697
              ],
              "variance": 0.371772891037188,
              "mean_reward": 0.14636732259370766,
              "min_reward": -0.21526630777882977,
              "max_reward": 0.30859549322811697,
              "num_responses": 4,
              "rvariance": 0.044280228706660506
            },
            {
              "id": "safety_sample_379",
              "rewards": [
                -0.18822827933976155,
                -0.9250145543043704,
                -0.5735201845964836,
                -0.6749127912429894,
                -0.28962088598626734,
                -0.4045325068523073,
                -0.620836734364853
              ],
              "variance": 0.5258896531398768,
              "mean_reward": -0.5252379909552903,
              "min_reward": -0.9250145543043704,
              "max_reward": -0.18822827933976155,
              "num_responses": 7,
              "rvariance": 0.053907845168336806
            },
            {
              "id": "safety_sample_73",
              "rewards": [
                -1.628003293720144,
                -1.2765089240122574,
                -1.357623009329462,
                -1.7496744216959512,
                -1.4522561088662007,
                -1.4522561088662007,
                -1.2765089240122574
              ],
              "variance": 0.40016282089820954,
              "mean_reward": -1.4561186843574963,
              "min_reward": -1.7496744216959512,
              "max_reward": -1.2765089240122574,
              "num_responses": 7,
              "rvariance": 0.027138551265814628
            },
            {
              "id": "safety_sample_314",
              "rewards": [
                0.14298756903882412,
                0.03483545528255125,
                -0.2355448291081309,
                -0.12063320824209099,
                -0.09359517980302277,
                0.0010379197337159795,
                -0.07331665847372161
              ],
              "variance": 0.2446941573735674,
              "mean_reward": -0.04917556165312499,
              "min_reward": -0.2355448291081309,
              "max_reward": 0.14298756903882412,
              "num_responses": 7,
              "rvariance": 0.01270021537384535
            },
            {
              "id": "safety_sample_97",
              "rewards": [
                0.13960781548394058,
                -0.08007616558348866,
                0.4302666212039239,
                0.2646586970146311,
                -0.21526630777882977,
                0.3626715501062534,
                0.3356335216671852
              ],
              "variance": 0.5238618010069467,
              "mean_reward": 0.17678510458765936,
              "min_reward": -0.21526630777882977,
              "max_reward": 0.4302666212039239,
              "num_responses": 7,
              "rvariance": 0.05040363008941532
            },
            {
              "id": "safety_sample_35",
              "rewards": [
                -0.18822827933976155,
                -0.7087103267918247,
                -0.9250145543043704,
                -0.3436969428644038,
                -0.9114955400848364,
                -0.3572159570839379,
                -0.1949877864495286
              ],
              "variance": 0.7246191621670282,
              "mean_reward": -0.5184784838455233,
              "min_reward": -0.9250145543043704,
              "max_reward": -0.18822827933976155,
              "num_responses": 7,
              "rvariance": 0.08945539366185609
            },
            {
              "id": "safety_sample_107",
              "rewards": [
                1.2566163653729463,
                1.0191886781423785,
                1.437433180559215,
                0.9786316354837762,
                1.0994578250708622,
                1.0707299198543523
              ],
              "variance": 0.3481146161530033,
              "mean_reward": 1.1436762674139216,
              "min_reward": 0.9786316354837762,
              "max_reward": 1.437433180559215,
              "num_responses": 6,
              "rvariance": 0.024843653404128526
            },
            {
              "id": "safety_sample_131",
              "rewards": [
                1.7585097682731499,
                0.8180933416268087,
                1.2988632848089905,
                1.4205344127847974,
                0.9786316354837762,
                1.123116099955047,
                1.352939341687127
              ],
              "variance": 0.6413082370391492,
              "mean_reward": 1.2500982692313851,
              "min_reward": 0.8180933416268087,
              "max_reward": 1.7585097682731499,
              "num_responses": 7,
              "rvariance": 0.08241884376320048
            },
            {
              "id": "safety_sample_187",
              "rewards": [
                1.0124291710326114,
                0.6837481378201885,
                0.8083765501565185,
                1.0327076923619127,
                0.842385320302534,
                1.2549264885955045,
                1.1062173321806292
              ],
              "variance": 0.40717580952459276,
              "mean_reward": 0.9629700989214142,
              "min_reward": 0.6837481378201885,
              "max_reward": 1.2549264885955045,
              "num_responses": 7,
              "rvariance": 0.03278179896806072
            },
            {
              "id": "safety_sample_177",
              "rewards": [
                1.6402183938522266,
                1.2025403084948099,
                1.2414074743759704,
                1.765269275382917,
                1.2701353795924804,
                1.6537374080717608,
                1.4982687445471186
              ],
              "variance": 0.47248954697271706,
              "mean_reward": 1.4673681406167547,
              "min_reward": 1.2025403084948099,
              "max_reward": 1.765269275382917,
              "num_responses": 7,
              "rvariance": 0.0449147732413082
            },
            {
              "id": "safety_sample_72",
              "rewards": [
                -0.053038137144420454,
                -0.7087103267918247,
                -0.13415222246162511,
                -0.21526630777882977,
                -0.27610187176673323,
                -0.42481102818160843,
                -0.1814687722299945
              ],
              "variance": 0.4366641592909517,
              "mean_reward": -0.284792666622148,
              "min_reward": -0.7087103267918247,
              "max_reward": -0.053038137144420454,
              "num_responses": 7,
              "rvariance": 0.04161418588134876
            },
            {
              "id": "safety_sample_376",
              "rewards": [
                0.8083765501565185,
                -0.3436969428644038,
                0.5789757776187991,
                -0.22878532199836385,
                -0.2828613788765003,
                0.20720288658161112
              ],
              "variance": 1.006955324758111,
              "mean_reward": 0.12320192843627682,
              "min_reward": -0.3436969428644038,
              "max_reward": 0.8083765501565185,
              "num_responses": 6,
              "rvariance": 0.19850453580894034
            },
            {
              "id": "safety_sample_224",
              "rewards": [
                1.0977679482934206,
                1.1907111710527176,
                0.7471185169742546,
                0.8704795217275033,
                1.2329580904887616,
                0.9786316354837762
              ],
              "variance": 0.4030356114198608,
              "mean_reward": 1.0196111473367389,
              "min_reward": 0.7471185169742546,
              "max_reward": 1.2329580904887616,
              "num_responses": 6,
              "rvariance": 0.029845402925688182
            },
            {
              "id": "safety_sample_253",
              "rewards": [
                -0.33017792864486967,
                -1.235951881353655,
                -0.9520525827434386,
                -1.0061286396215752,
                -0.5397226490476483
              ],
              "variance": 0.7300267678548418,
              "mean_reward": -0.8128067362822374,
              "min_reward": -1.235951881353655,
              "max_reward": -0.33017792864486967,
              "num_responses": 5,
              "rvariance": 0.10866401250543353
            },
            {
              "id": "safety_sample_307",
              "rewards": [
                0.38632982499043805,
                -0.07331665847372161,
                0.08891151216068768,
                -0.2963803930960344,
                -0.7560268765601941
              ],
              "variance": 0.839530783033068,
              "mean_reward": -0.13009651819576487,
              "min_reward": -0.7560268765601941,
              "max_reward": 0.38632982499043805,
              "num_responses": 5,
              "rvariance": 0.1474647556682826
            },
            {
              "id": "safety_sample_319",
              "rewards": [
                -1.7496744216959512,
                -1.9389406207694289,
                -1.7767124501350195,
                -1.965978649208497,
                -1.8983835781108265,
                -2.0200547060866336
              ],
              "variance": 0.22982324173208002,
              "mean_reward": -1.8916240710010594,
              "min_reward": -2.0200547060866336,
              "max_reward": -1.7496744216959512,
              "num_responses": 6,
              "rvariance": 0.009610326949190522
            },
            {
              "id": "safety_sample_205",
              "rewards": [
                -0.3436969428644038,
                -0.62759624147462,
                -0.9790906111825068,
                -1.1007617391583138,
                -0.6951913125722906,
                -1.0466856822801773,
                -0.8303814547676317
              ],
              "variance": 0.5542795830008984,
              "mean_reward": -0.8033434263285634,
              "min_reward": -1.1007617391583138,
              "max_reward": -0.3436969428644038,
              "num_responses": 7,
              "rvariance": 0.06187858239415399
            },
            {
              "id": "safety_sample_348",
              "rewards": [
                1.9342569531270932,
                0.840484208927912,
                1.2092998156045769,
                2.0491685739931333,
                0.7564128392501843,
                1.4982687445471186,
                1.9342569531270932
              ],
              "variance": 1.1733659404166883,
              "mean_reward": 1.46030686979673,
              "min_reward": 0.7564128392501843,
              "max_reward": 2.0491685739931333,
              "num_responses": 7,
              "rvariance": 0.2485868645715941
            },
            {
              "id": "safety_sample_354",
              "rewards": [
                -0.5262036348281143,
                -1.0466856822801773,
                -1.3035469524513255,
                -0.9655715969629728,
                -1.0872427249387797,
                -0.9520525827434386,
                -1.0602046964997116
              ],
              "variance": 0.3920514123664891,
              "mean_reward": -0.9916439815292172,
              "min_reward": -1.3035469524513255,
              "max_reward": -0.5262036348281143,
              "num_responses": 7,
              "rvariance": 0.047576386843196594
            },
            {
              "id": "safety_sample_11",
              "rewards": [
                -0.1679497580104604,
                -0.5262036348281143,
                0.1531268297034747,
                0.3626715501062534,
                -0.2828613788765003,
                0.20720288658161112,
                -0.14091172957139217
              ],
              "variance": 0.649588633248614,
              "mean_reward": -0.056417890699303995,
              "min_reward": -0.5262036348281143,
              "max_reward": 0.3626715501062534,
              "num_responses": 7,
              "rvariance": 0.08294210405933702
            },
            {
              "id": "safety_sample_341",
              "rewards": [
                -1.6550413221592124,
                -1.7902314643545536,
                -1.8172694927936217,
                -2.0200547060866336,
                -1.9254216065498946,
                -1.7496744216959512,
                -1.7091173790373488
              ],
              "variance": 0.2757878900784958,
              "mean_reward": -1.8095443418110306,
              "min_reward": -2.0200547060866336,
              "max_reward": -1.6550413221592124,
              "num_responses": 7,
              "rvariance": 0.013673712058889023
            },
            {
              "id": "safety_sample_196",
              "rewards": [
                -0.7560268765601941,
                -0.3572159570839379,
                -0.5735201845964836,
                -0.74250786234066,
                -0.5194441277183472,
                -0.4045325068523073,
                -0.42481102818160843
              ],
              "variance": 0.36230958108351413,
              "mean_reward": -0.5397226490476484,
              "min_reward": -0.7560268765601941,
              "max_reward": -0.3572159570839379,
              "num_responses": 7,
              "rvariance": 0.022036085882137544
            },
            {
              "id": "safety_sample_236",
              "rewards": [
                0.09229126571557121,
                -0.05979764425418751,
                0.24438017568532994,
                0.22410165435602877,
                -0.11387370113232394,
                -0.35045644997417086,
                -0.14767123668115922
              ],
              "variance": 0.4609983848861131,
              "mean_reward": -0.015860848040701665,
              "min_reward": -0.35045644997417086,
              "max_reward": 0.24438017568532994,
              "num_responses": 7,
              "rvariance": 0.039695632787979704
            },
            {
              "id": "safety_sample_346",
              "rewards": [
                1.021723493308541,
                -0.0462786300346534,
                -0.026000108705352236,
                0.5908049150608915,
                0.5113807065211285,
                0.6567101093811203,
                1.1535338819489986
              ],
              "variance": 1.1085591660017968,
              "mean_reward": 0.551696338211525,
              "min_reward": -0.0462786300346534,
              "max_reward": 1.1535338819489986,
              "num_responses": 7,
              "rvariance": 0.18408913229814156
            },
            {
              "id": "safety_sample_267",
              "rewards": [
                0.03483545528255125,
                0.2646586970146311,
                0.17340535103277585,
                0.061873483721619466,
                0.3390132752220687,
                0.03483545528255125,
                -0.012481094485818129
              ],
              "variance": 0.27849169292240267,
              "mean_reward": 0.1280200890100542,
              "min_reward": -0.012481094485818129,
              "max_reward": 0.3390132752220687,
              "num_responses": 7,
              "rvariance": 0.01524725195928284
            },
            {
              "id": "safety_sample_279",
              "rewards": [
                -2.844714573478214,
                -2.709524431282873,
                -3.3584371138205102,
                -3.0069427441126235,
                -3.2502850000642374,
                -2.979904715673555,
                -3.0339807725516916
              ],
              "variance": 0.502907328966669,
              "mean_reward": -3.0262556215691014,
              "min_reward": -3.3584371138205102,
              "max_reward": -2.709524431282873,
              "num_responses": 7,
              "rvariance": 0.04234151099086416
            },
            {
              "id": "safety_sample_56",
              "rewards": [
                0.7217703653126282,
                0.2274814079109123,
                0.23086116146579583,
                0.6896627065412346,
                0.4809629245271768,
                0.35929179655136984,
                0.6482607254939114
              ],
              "variance": 0.47299651000594967,
              "mean_reward": 0.47975586968614703,
              "min_reward": 0.2274814079109123,
              "max_reward": 0.7217703653126282,
              "num_responses": 7,
              "rvariance": 0.03873283034633317
            },
            {
              "id": "safety_sample_257",
              "rewards": [
                -0.46536807084021076,
                -0.7898244121090293,
                -0.3842539855230061,
                -0.7019508196820576,
                -0.7830649049992623,
                -0.4450895495109096,
                -0.620836734364853
              ],
              "variance": 0.3650133839274209,
              "mean_reward": -0.598626925289904,
              "min_reward": -0.7898244121090293,
              "max_reward": -0.3842539855230061,
              "num_responses": 7,
              "rvariance": 0.024147193635910367
            },
            {
              "id": "safety_sample_256",
              "rewards": [
                -0.30989940731556853,
                -0.48564659216951195,
                -0.0462786300346534,
                -0.08007616558348866,
                0.08553175860580416,
                -0.03275961581511929,
                -0.1679497580104604
              ],
              "variance": 0.394755215210396,
              "mean_reward": -0.14815405861757114,
              "min_reward": -0.48564659216951195,
              "max_reward": 0.08553175860580416,
              "num_responses": 7,
              "rvariance": 0.03191325411616522
            },
            {
              "id": "safety_sample_202",
              "rewards": [
                1.2650657492601551,
                0.6888177681525137,
                1.1214262231776053,
                1.1484642516166734,
                0.7521881473065799,
                1.2059200620496935,
                0.736979256309604
              ],
              "variance": 0.5118636758871102,
              "mean_reward": 0.9884087796961177,
              "min_reward": 0.6888177681525137,
              "max_reward": 1.2650657492601551,
              "num_responses": 7,
              "rvariance": 0.05370477110230267
            },
            {
              "id": "safety_sample_356",
              "rewards": [
                0.5603871330669398,
                0.41336785342950627,
                -0.5667606774867165,
                0.0010379197337159795,
                -0.46536807084021076,
                -0.4180515210718414
              ],
              "variance": 1.0029418674116868,
              "mean_reward": -0.07923122719476777,
              "min_reward": -0.5667606774867165,
              "max_reward": 0.5603871330669398,
              "num_responses": 6,
              "rvariance": 0.19329907590496062
            },
            {
              "id": "safety_sample_272",
              "rewards": [
                0.3491525358867193,
                0.07201274438627005,
                0.13284830837417352,
                0.09905077282533827,
                0.40660834631973924,
                0.28493721834393226,
                0.3491525358867193
              ],
              "variance": 0.28389929861021634,
              "mean_reward": 0.24196606600327028,
              "min_reward": 0.07201274438627005,
              "max_reward": 0.40660834631973924,
              "num_responses": 7,
              "rvariance": 0.016163868090890033
            },
            {
              "id": "safety_sample_268",
              "rewards": [
                0.18354461169742645,
                -0.1679497580104604,
                0.06863299083138652,
                0.12270904770952296,
                0.07201274438627005,
                -0.0462786300346534,
                0.007797426843483034
              ],
              "variance": 0.24199035452966056,
              "mean_reward": 0.03435263334613931,
              "min_reward": -0.1679497580104604,
              "max_reward": 0.18354461169742645,
              "num_responses": 7,
              "rvariance": 0.011541623773110929
            },
            {
              "id": "safety_sample_138",
              "rewards": [
                1.1738124032783,
                0.7251501188675117,
                0.7631723463599513,
                1.3292810668029422,
                0.7259950572562326,
                0.9294139743407849,
                0.9744069435401718
              ],
              "variance": 0.5103427867874126,
              "mean_reward": 0.945890272920842,
              "min_reward": 0.7251501188675117,
              "max_reward": 1.3292810668029422,
              "num_responses": 7,
              "rvariance": 0.047212518489817674
            },
            {
              "id": "safety_sample_283",
              "rewards": [
                0.18354461169742645,
                -0.0462786300346534,
                0.23762066857556288,
                -0.3436969428644038
              ],
              "variance": 0.47586930052760057,
              "mean_reward": 0.00779742684348303,
              "min_reward": -0.3436969428644038,
              "max_reward": 0.23762066857556288,
              "num_responses": 4,
              "rvariance": 0.05254457682204006
            },
            {
              "id": "safety_sample_305",
              "rewards": [
                0.23424091502067934,
                -0.08007616558348866,
                -0.62759624147462,
                -0.5194441277183472,
                -0.5735201845964836,
                -0.7965839192187965
              ],
              "variance": 0.7891724550653036,
              "mean_reward": -0.39382995392850945,
              "min_reward": -0.7965839192187965,
              "max_reward": 0.23424091502067934,
              "num_responses": 6,
              "rvariance": 0.1263065649213325
            },
            {
              "id": "safety_sample_334",
              "rewards": [
                0.9659575596529629,
                0.02469619461790067,
                0.42012736053927335,
                0.5468681188474056,
                0.6026340525029839,
                0.5570073795120561,
                0.42350711409415687
              ],
              "variance": 0.4860085611922513,
              "mean_reward": 0.5058282542523914,
              "min_reward": 0.02469619461790067,
              "max_reward": 0.9659575596529629,
              "num_responses": 7,
              "rvariance": 0.06728619795999634
            },
            {
              "id": "safety_sample_363",
              "rewards": [
                0.5857352847285662,
                0.04835446950208536,
                -0.3910134926327732,
                0.0787722514960371,
                -0.3572159570839379,
                -0.012481094485818129,
                -0.5532416632671825
              ],
              "variance": 0.7374622256755858,
              "mean_reward": -0.08587002882043186,
              "min_reward": -0.5532416632671825,
              "max_reward": 0.5857352847285662,
              "num_responses": 7,
              "rvariance": 0.1266771886093944
            },
            {
              "id": "safety_sample_167",
              "rewards": [
                0.8892926030388667,
                0.7403590098644875,
                0.4606844031978757,
                0.8449201354686966,
                0.15988633681324174,
                0.6026340525029839,
                0.6769886307104214
              ],
              "variance": 0.5223039458527425,
              "mean_reward": 0.6249664530852248,
              "min_reward": 0.15988633681324174,
              "max_reward": 0.8892926030388667,
              "num_responses": 7,
              "rvariance": 0.054008075378686245
            },
            {
              "id": "safety_sample_1",
              "rewards": [
                -1.357623009329462,
                -1.6550413221592124,
                -1.2900279382317914,
                -1.2089138529145866,
                -1.5198511799638712,
                -1.5468892084029395,
                -1.3305849808903938
              ],
              "variance": 0.33256774980053927,
              "mean_reward": -1.4155616416988939,
              "min_reward": -1.6550413221592124,
              "max_reward": -1.2089138529145866,
              "num_responses": 7,
              "rvariance": 0.022073384605702455
            },
            {
              "id": "safety_sample_29",
              "rewards": [
                0.05511397661185241,
                0.14974707614859117,
                0.18692436525230996,
                0.379570317880671,
                0.43364637475880746,
                0.2410004221304464,
                0.2883169718988158
              ],
              "variance": 0.28930690429802997,
              "mean_reward": 0.2477599292402135,
              "min_reward": 0.05511397661185241,
              "max_reward": 0.43364637475880746,
              "num_responses": 7,
              "rvariance": 0.014862608872519905
            },
            {
              "id": "safety_sample_179",
              "rewards": [
                0.6415012183841443,
                0.21058264013649466,
                0.40322859276485573,
                0.40322859276485573,
                0.5198300904083374,
                0.5063110761888033,
                0.3626715501062534
              ],
              "variance": 0.26666255548031026,
              "mean_reward": 0.4353362515362492,
              "min_reward": 0.21058264013649466,
              "max_reward": 0.6415012183841443,
              "num_responses": 7,
              "rvariance": 0.016076682324557095
            },
            {
              "id": "safety_sample_160",
              "rewards": [
                0.8808036126646867,
                0.40660834631973924,
                0.41674760698438984,
                0.39984883920997216,
                0.8368932207758483,
                0.6296720809420521
              ],
              "variance": 0.4556198239554118,
              "mean_reward": 0.5950956178161146,
              "min_reward": 0.39984883920997216,
              "max_reward": 0.8808036126646867,
              "num_responses": 6,
              "rvariance": 0.04112457332660355
            },
            {
              "id": "safety_sample_23",
              "rewards": [
                -1.5604082226224736,
                -1.5063321657443371,
                -1.600965265281076,
                -1.5198511799638712,
                -1.5333701941834053,
                -1.8848645638912924,
                -1.5198511799638712
              ],
              "variance": 0.20008141044910488,
              "mean_reward": -1.5893775388071896,
              "min_reward": -1.8848645638912924,
              "max_reward": -1.5063321657443371,
              "num_responses": 7,
              "rvariance": 0.0154267520664389
            },
            {
              "id": "safety_sample_350",
              "rewards": [
                -0.2828613788765003,
                -0.3910134926327732,
                -0.5735201845964836,
                -0.5667606774867165,
                -0.6073177201453189,
                -0.47212757794997784
              ],
              "variance": 0.2534815166162645,
              "mean_reward": -0.4822668386146283,
              "min_reward": -0.6073177201453189,
              "max_reward": -0.2828613788765003,
              "num_responses": 6,
              "rvariance": 0.013216103344152247
            },
            {
              "id": "safety_sample_367",
              "rewards": [
                1.031017815584471,
                -0.7087103267918247,
                -0.5262036348281143,
                -0.08007616558348866,
                -0.2355448291081309,
                -0.4112920139620743,
                -0.4180515210718414
              ],
              "variance": 0.963567738497294,
              "mean_reward": -0.1926943822515719,
              "min_reward": -0.7087103267918247,
              "max_reward": 1.031017815584471,
              "num_responses": 7,
              "rvariance": 0.2840088868335223
            },
            {
              "id": "safety_sample_303",
              "rewards": [
                0.3254942610025346,
                -0.12739271535185806,
                0.3660513036611369,
                0.07539249794115357
              ],
              "variance": 0.4204413422275108,
              "mean_reward": 0.15988633681324174,
              "min_reward": -0.12739271535185806,
              "max_reward": 0.3660513036611369,
              "num_responses": 4,
              "rvariance": 0.039899610182475204
            },
            {
              "id": "safety_sample_18",
              "rewards": [
                0.40322859276485573,
                -0.03275961581511929,
                -0.12063320824209099,
                0.10919003348998885,
                0.20044337947184407,
                -0.12739271535185806,
                0.27141820412439815
              ],
              "variance": 0.44747937066657906,
              "mean_reward": 0.10049923863457406,
              "min_reward": -0.12739271535185806,
              "max_reward": 0.40322859276485573,
              "num_responses": 7,
              "rvariance": 0.03564499140883256
            },
            {
              "id": "safety_sample_30",
              "rewards": [
                -0.6681532841332224,
                -0.8168624405480975,
                -0.8101029334383305,
                -0.6816722983527564,
                -1.0466856822801773,
                -1.1953948386950526,
                -1.1007617391583138
              ],
              "variance": 0.4623502863080665,
              "mean_reward": -0.9028047452294216,
              "min_reward": -1.1953948386950526,
              "max_reward": -0.6681532841332224,
              "num_responses": 7,
              "rvariance": 0.03791974731224633
            },
            {
              "id": "safety_sample_263",
              "rewards": [
                -0.370734971303472,
                -0.47888708505974487,
                -0.5600011703769495,
                -0.7898244121090293,
                -0.5329631419378813,
                -0.7289888481211259
              ],
              "variance": 0.33459560193346916,
              "mean_reward": -0.5768999381513672,
              "min_reward": -0.7898244121090293,
              "max_reward": -0.370734971303472,
              "num_responses": 6,
              "rvariance": 0.02046573191438154
            },
            {
              "id": "safety_sample_295",
              "rewards": [
                -0.14091172957139217,
                -0.6005582130355518,
                -0.5262036348281143,
                -0.3842539855230061,
                -0.5937987059257848,
                -0.45184905662067665,
                -0.4315705352913755
              ],
              "variance": 0.30958542562733116,
              "mean_reward": -0.4470208372565573,
              "min_reward": -0.6005582130355518,
              "max_reward": -0.14091172957139217,
              "num_responses": 7,
              "rvariance": 0.02132741013440461
            },
            {
              "id": "safety_sample_47",
              "rewards": [
                0.6829031994314676,
                0.3559120429964863,
                0.7462735785855337,
                0.7847182752723338,
                0.8402729743307318,
                0.5908049150608915,
                0.8676278546655704
              ],
              "variance": 0.3543671602295378,
              "mean_reward": 0.6955018343347164,
              "min_reward": 0.3559120429964863,
              "max_reward": 0.8676278546655704,
              "num_responses": 7,
              "rvariance": 0.026794970012361002
            },
            {
              "id": "safety_sample_375",
              "rewards": [
                -1.1683568102559845,
                -1.7361554074764172,
                -1.4522561088662007,
                -1.8848645638912924,
                -1.8037504785740877,
                -1.3170659666708595,
                -1.6955983648178146
              ],
              "variance": 0.5786138085960602,
              "mean_reward": -1.5797211000789508,
              "min_reward": -1.8848645638912924,
              "max_reward": -1.1683568102559845,
              "num_responses": 7,
              "rvariance": 0.06223665014037699
            },
            {
              "id": "safety_sample_28",
              "rewards": [
                -0.7357483552308929,
                -2.114687805623372,
                -1.3846610377685302,
                -1.61448427950061,
                -1.357623009329462,
                -1.952459634988963,
                -1.857826535452224
              ],
              "variance": 0.9084777555526924,
              "mean_reward": -1.5739272368420079,
              "min_reward": -2.114687805623372,
              "max_reward": -0.7357483552308929,
              "num_responses": 7,
              "rvariance": 0.18615792931237052
            },
            {
              "id": "safety_sample_347",
              "rewards": [
                2.3803844223717188,
                1.579382829864323,
                1.5895220905289738,
                2.042409066883366,
                1.667256422291295,
                1.7990668109317522,
                1.6233196260778089
              ],
              "variance": 0.5921328228155935,
              "mean_reward": 1.8116201812784625,
              "min_reward": 1.579382829864323,
              "max_reward": 2.3803844223717188,
              "num_responses": 7,
              "rvariance": 0.07663908601091497
            },
            {
              "id": "safety_sample_10",
              "rewards": [
                -0.14767123668115922,
                -0.1679497580104604,
                -0.03275961581511929,
                -0.2558233504374321,
                0.051734223056968884,
                -0.46536807084021076,
                -0.249063843327665
              ],
              "variance": 0.3406791583322596,
              "mean_reward": -0.18098595029358258,
              "min_reward": -0.46536807084021076,
              "max_reward": 0.051734223056968884,
              "num_responses": 7,
              "rvariance": 0.02407399489091427
            },
            {
              "id": "safety_sample_365",
              "rewards": [
                2.028890052663832,
                0.9262454553830816,
                1.2633758724827133,
                1.8261048393708204,
                0.7209254269239073,
                0.8774502634344507,
                1.393496384345729
              ],
              "variance": 1.0923785958577918,
              "mean_reward": 1.2909268992292193,
              "min_reward": 0.7209254269239073,
              "max_reward": 2.028890052663832,
              "num_responses": 7,
              "rvariance": 0.21016310915104347
            },
            {
              "id": "safety_sample_387",
              "rewards": [
                0.40660834631973924,
                -0.27610187176673323,
                0.14298756903882412,
                -0.27610187176673323,
                -0.30313990020580145,
                -0.08007616558348866,
                -0.22202581488859682
              ],
              "variance": 0.5353529630935507,
              "mean_reward": -0.08683567269325572,
              "min_reward": -0.30313990020580145,
              "max_reward": 0.40660834631973924,
              "num_responses": 7,
              "rvariance": 0.06186552784090628
            },
            {
              "id": "safety_sample_170",
              "rewards": [
                1.5557245549801384,
                1.1501541283941152,
                1.2971734080315487,
                1.3698381094615444,
                1.0403121378604006,
                1.5388257872057207,
                1.5253067729861867
              ],
              "variance": 0.4393679621348583,
              "mean_reward": 1.3539049855599505,
              "min_reward": 1.0403121378604006,
              "max_reward": 1.5557245549801384,
              "num_responses": 7,
              "rvariance": 0.035376090923631906
            },
            {
              "id": "safety_sample_82",
              "rewards": [
                0.4606844031978757,
                -0.42481102818160843,
                0.07201274438627005,
                0.25113968279509696,
                0.19706362591696056,
                -0.012481094485818129
              ],
              "variance": 0.5745581043301996,
              "mean_reward": 0.09060138893812945,
              "min_reward": -0.42481102818160843,
              "max_reward": 0.4606844031978757,
              "num_responses": 6,
              "rvariance": 0.07511494749282614
            },
            {
              "id": "safety_sample_286",
              "rewards": [
                -0.5397226490476483,
                -1.1953948386950526,
                -0.7695458907797282,
                -0.9520525827434386,
                -1.127799767597382,
                -0.9655715969629728
              ],
              "variance": 0.5069630332325292,
              "mean_reward": -0.9250145543043705,
              "min_reward": -1.1953948386950526,
              "max_reward": -0.5397226490476483,
              "num_responses": 6,
              "rvariance": 0.04820393786717588
            },
            {
              "id": "safety_sample_290",
              "rewards": [
                0.4268868676490404,
                -0.30989940731556853,
                -0.5802796917062507,
                0.20720288658161112,
                -0.17470926512022744,
                -0.2558233504374321,
                -0.16119025090069333
              ],
              "variance": 0.7131280000804243,
              "mean_reward": -0.12111603017850293,
              "min_reward": -0.5802796917062507,
              "max_reward": 0.4268868676490404,
              "num_responses": 7,
              "rvariance": 0.09674216554430211
            },
            {
              "id": "safety_sample_296",
              "rewards": [
                -0.20174729355929566,
                0.20044337947184407,
                0.18692436525230996,
                0.19706362591696056,
                0.29507647900858286,
                0.0415949623923183,
                0.14298756903882412
              ],
              "variance": 0.2940385592748669,
              "mean_reward": 0.1231918696459349,
              "min_reward": -0.20174729355929566,
              "max_reward": 0.29507647900858286,
              "num_responses": 7,
              "rvariance": 0.022523766692748495
            },
            {
              "id": "safety_sample_183",
              "rewards": [
                0.30859549322811697,
                -0.05979764425418751,
                0.10581027993510532,
                0.3356335216671852,
                -0.03275961581511929,
                0.26127894345974756,
                0.379570317880671
              ],
              "variance": 0.39678306734332613,
              "mean_reward": 0.18547589944307416,
              "min_reward": -0.05979764425418751,
              "max_reward": 0.379570317880671,
              "num_responses": 7,
              "rvariance": 0.027893850418003668
            },
            {
              "id": "safety_sample_304",
              "rewards": [
                0.15988633681324174,
                -0.249063843327665,
                -0.11387370113232394,
                -0.33017792864486967,
                -0.21526630777882977,
                -0.1814687722299945,
                -0.249063843327665
              ],
              "variance": 0.2771397915004493,
              "mean_reward": -0.16843257994687227,
              "min_reward": -0.33017792864486967,
              "max_reward": 0.15988633681324174,
              "num_responses": 7,
              "rvariance": 0.021756811689445425
            },
            {
              "id": "safety_sample_353",
              "rewards": [
                0.5063110761888033,
                -0.42481102818160843,
                -0.15443074379092628,
                0.10581027993510532,
                -0.09359517980302277,
                0.09905077282533827,
                -0.08683567269325572
              ],
              "variance": 0.5285934559837837,
              "mean_reward": -0.006928642217080898,
              "min_reward": -0.42481102818160843,
              "max_reward": 0.5063110761888033,
              "num_responses": 7,
              "rvariance": 0.07109078432212637
            },
            {
              "id": "safety_sample_141",
              "rewards": [
                0.9378633582279936,
                0.9268791591746222,
                1.0166538629762158,
                0.8256977871252966,
                0.9794765738724971,
                1.322521559693175
              ],
              "variance": 0.29329923818473613,
              "mean_reward": 1.0015153835116335,
              "min_reward": 0.8256977871252966,
              "max_reward": 1.322521559693175,
              "num_responses": 6,
              "rvariance": 0.024048970223761196
            },
            {
              "id": "safety_sample_156",
              "rewards": [
                -1.5874462510615417,
                -1.84430752123269,
                -1.6820793505982805,
                -1.6685603363787465,
                -1.7361554074764172,
                -1.6685603363787465,
                -1.6685603363787465
              ],
              "variance": 0.14330155072706185,
              "mean_reward": -1.693667077072167,
              "min_reward": -1.84430752123269,
              "max_reward": -1.5874462510615417,
              "num_responses": 7,
              "rvariance": 0.005400855172196217
            },
            {
              "id": "safety_sample_372",
              "rewards": [
                0.4944819387467109,
                -1.1413187818169162,
                -0.7560268765601941,
                -0.9655715969629728,
                -0.9250145543043704,
                -1.3170659666708595,
                -0.7087103267918247
              ],
              "variance": 0.9841842351820835,
              "mean_reward": -0.7598894520514895,
              "min_reward": -1.3170659666708595,
              "max_reward": 0.4944819387467109,
              "num_responses": 7,
              "rvariance": 0.300226750654698
            },
            {
              "id": "safety_sample_85",
              "rewards": [
                -0.3572159570839379,
                -0.7222293410113588,
                -0.9114955400848364,
                -0.6073177201453189,
                -0.620836734364853,
                -0.36397546419370497,
                -0.47212757794997784
              ],
              "variance": 0.4366641592909517,
              "mean_reward": -0.5793140478334269,
              "min_reward": -0.9114955400848364,
              "max_reward": -0.3572159570839379,
              "num_responses": 7,
              "rvariance": 0.034352124403264524
            },
            {
              "id": "safety_sample_98",
              "rewards": [
                0.061873483721619466,
                0.061873483721619466,
                -0.2355448291081309,
                0.20044337947184407,
                -0.0462786300346534,
                -0.1949877864495286,
                -0.2355448291081309
              ],
              "variance": 0.35284627112984024,
              "mean_reward": -0.055452246826480124,
              "min_reward": -0.2355448291081309,
              "max_reward": 0.20044337947184407,
              "num_responses": 7,
              "rvariance": 0.0253477463006553
            },
            {
              "id": "safety_sample_382",
              "rewards": [
                0.4505451425332251,
                0.8803547391456786,
                0.6820582610427467,
                0.7758464221907646,
                0.3457727823318357,
                0.6896627065412346,
                0.7804935833287294
              ],
              "variance": 0.4118018472028398,
              "mean_reward": 0.6578190910163163,
              "min_reward": 0.3457727823318357,
              "max_reward": 0.8803547391456786,
              "num_responses": 7,
              "rvariance": 0.03149121976475384
            },
            {
              "id": "safety_sample_148",
              "rewards": [
                1.778788289602451,
                1.2430973511534122,
                1.0614355975784227,
                1.501648498102002,
                1.052141275302493,
                1.4813699767727009,
                1.300553161586432
              ],
              "variance": 0.5547865460341308,
              "mean_reward": 1.3455763071568447,
              "min_reward": 1.052141275302493,
              "max_reward": 1.778788289602451,
              "num_responses": 7,
              "rvariance": 0.0585485931497594
            },
            {
              "id": "safety_sample_37",
              "rewards": [
                0.8632975454233758,
                0.5299693510729879,
                0.6550202326036785,
                0.4302666212039239,
                0.39646908565508865,
                0.7251501188675117
              ],
              "variance": 0.3808559787159375,
              "mean_reward": 0.6000288258044276,
              "min_reward": 0.39646908565508865,
              "max_reward": 0.8632975454233758,
              "num_responses": 6,
              "rvariance": 0.027192319241579024
            },
            {
              "id": "safety_sample_271",
              "rewards": [
                0.14636732259370763,
                0.18692436525230996,
                0.23086116146579583,
                0.3491525358867193,
                -0.09359517980302277
              ],
              "variance": 0.29944616496268056,
              "mean_reward": 0.16394204107910199,
              "min_reward": -0.09359517980302277,
              "max_reward": 0.3491525358867193,
              "num_responses": 5,
              "rvariance": 0.021188714830828577
            },
            {
              "id": "safety_sample_111",
              "rewards": [
                1.101147701848304,
                0.9237106402169188,
                1.052141275302493,
                1.3360405739127093,
                0.3356335216671852,
                0.6896627065412346,
                0.8514684079812835
              ],
              "variance": 0.6470538180824513,
              "mean_reward": 0.8985435467814469,
              "min_reward": 0.3356335216671852,
              "max_reward": 1.3360405739127093,
              "num_responses": 7,
              "rvariance": 0.08848467252635898
            },
            {
              "id": "safety_sample_209",
              "rewards": [
                0.48941230841438566,
                0.558697256289498,
                0.315355000337884,
                0.4826528013046186,
                0.03483545528255125,
                0.508000952966245,
                0.6795234458765841
              ],
              "variance": 0.40388054980858157,
              "mean_reward": 0.4383538886388238,
              "min_reward": 0.03483545528255125,
              "max_reward": 0.6795234458765841,
              "num_responses": 7,
              "rvariance": 0.03714588621715821
            },
            {
              "id": "safety_sample_7",
              "rewards": [
                0.1159495405997559,
                -0.3910134926327732,
                0.16326609036812528,
                0.2781777112341652,
                -0.15443074379092628,
                -0.019240601595585185,
                -0.03275961581511929
              ],
              "variance": 0.4582945820422063,
              "mean_reward": -0.005721587376051078,
              "min_reward": -0.3910134926327732,
              "max_reward": 0.2781777112341652,
              "num_responses": 7,
              "rvariance": 0.0422053706498523
            },
            {
              "id": "safety_sample_49",
              "rewards": [
                -0.8033434263285635,
                -1.262989909792723,
                -1.0061286396215752,
                -1.1413187818169162,
                -1.127799767597382,
                -1.1007617391583138
              ],
              "variance": 0.2974183128297503,
              "mean_reward": -1.0737237107192457,
              "min_reward": -1.262989909792723,
              "max_reward": -0.8033434263285635,
              "num_responses": 6,
              "rvariance": 0.020286775746944156
            },
            {
              "id": "safety_sample_358",
              "rewards": [
                0.9163174293156111,
                0.007797426843483034,
                0.2646586970146311,
                0.8354145785955868,
                0.3254942610025346,
                0.5130705832985704
              ],
              "variance": 0.739637942026542,
              "mean_reward": 0.47712549601173615,
              "min_reward": 0.007797426843483034,
              "max_reward": 0.9163174293156111,
              "num_responses": 6,
              "rvariance": 0.10182594648228721
            },
            {
              "id": "safety_sample_335",
              "rewards": [
                0.8142911188775647,
                -0.005721587376051075,
                -0.2625828575471991,
                0.17340535103277585,
                0.06863299083138652,
                -0.14091172957139217,
                0.2883169718988158
              ],
              "variance": 0.6882868114520304,
              "mean_reward": 0.1336328940208429,
              "min_reward": -0.2625828575471991,
              "max_reward": 0.8142911188775647,
              "num_responses": 7,
              "rvariance": 0.10640156605498496
            },
            {
              "id": "safety_sample_132",
              "rewards": [
                0.9102972432959748,
                0.5147604600760121,
                0.9549733605995915,
                0.8406954435250923,
                0.651640479048795,
                0.9237106402169188,
                1.251546735040621
              ],
              "variance": 0.4767142389163217,
              "mean_reward": 0.8639463374004295,
              "min_reward": 0.5147604600760121,
              "max_reward": 1.251546735040621,
              "num_responses": 7,
              "rvariance": 0.04739790343586625
            },
            {
              "id": "safety_sample_38",
              "rewards": [
                0.014556933953250088,
                -0.14767123668115922,
                0.1666458439230088,
                0.14974707614859117,
                0.2274814079109123,
                0.19368387236207701,
                0.0010379197337159795
              ],
              "variance": 0.2656486294138452,
              "mean_reward": 0.08649740247862803,
              "min_reward": -0.14767123668115922,
              "max_reward": 0.2274814079109123,
              "num_responses": 7,
              "rvariance": 0.015586204109678784
            },
            {
              "id": "safety_sample_53",
              "rewards": [
                0.744583701808092,
                0.46913378708508446,
                0.41674760698438984,
                0.6246024506097267,
                0.5739061472864738,
                0.3390132752220687,
                0.18354461169742645
              ],
              "variance": 0.395769141276861,
              "mean_reward": 0.47879022581332314,
              "min_reward": 0.18354461169742645,
              "max_reward": 0.744583701808092,
              "num_responses": 7,
              "rvariance": 0.03022921674721039
            },
            {
              "id": "safety_sample_219",
              "rewards": [
                0.38632982499043805,
                0.7412039482532085,
                0.4404058818685745,
                0.38632982499043805,
                0.7910553131877405
              ],
              "variance": 0.38478494222348963,
              "mean_reward": 0.5490649586580799,
              "min_reward": 0.38632982499043805,
              "max_reward": 0.7910553131877405,
              "num_responses": 5,
              "rvariance": 0.03204979308728517
            },
            {
              "id": "safety_sample_270",
              "rewards": [
                0.6448809719390279,
                0.19368387236207701,
                0.7099412278705358,
                0.5570073795120561,
                0.3761905643257875,
                -0.5194441277183472,
                -0.16119025090069333
              ],
              "variance": 0.9753968759393861,
              "mean_reward": 0.25729566248434915,
              "min_reward": -0.5194441277183472,
              "max_reward": 0.7099412278705358,
              "num_responses": 7,
              "rvariance": 0.1773678731721205
            },
            {
              "id": "safety_sample_112",
              "rewards": [
                1.0859388108513282,
                0.8669941508740296,
                1.0842489340738863,
                0.7973923511031471,
                0.4708236638625262,
                0.8908636603553945
              ],
              "variance": 0.45098586497977045,
              "mean_reward": 0.8660435951867186,
              "min_reward": 0.4708236638625262,
              "max_reward": 1.0859388108513282,
              "num_responses": 6,
              "rvariance": 0.04291603373537705
            },
            {
              "id": "safety_sample_362",
              "rewards": [
                0.8580166804938704,
                -0.27610187176673323,
                -0.3572159570839379,
                -0.09359517980302277,
                -0.10711419402255688,
                -0.3774944784132391,
                -0.2693423646569662
              ],
              "variance": 0.6523769299313932,
              "mean_reward": -0.08897819503608369,
              "min_reward": -0.3774944784132391,
              "max_reward": 0.8580166804938704,
              "num_responses": 7,
              "rvariance": 0.15998416744657204
            },
            {
              "id": "safety_sample_258",
              "rewards": [
                -0.10711419402255688,
                0.24775992924021345,
                0.23762066857556288,
                0.23424091502067934,
                -0.249063843327665,
                0.10243052638022179,
                0.23762066857556288
              ],
              "variance": 0.40557042658602327,
              "mean_reward": 0.10049923863457406,
              "min_reward": -0.249063843327665,
              "max_reward": 0.24775992924021345,
              "num_responses": 7,
              "rvariance": 0.03463979080875874
            },
            {
              "id": "safety_sample_78",
              "rewards": [
                0.6313619577194938,
                0.6229125738322849,
                0.27141820412439815,
                0.565456763399265,
                0.6896627065412346,
                0.81936074920989,
                0.764862223137393
              ],
              "variance": 0.3388202938770736,
              "mean_reward": 0.6235764539948514,
              "min_reward": 0.27141820412439815,
              "max_reward": 0.81936074920989,
              "num_responses": 7,
              "rvariance": 0.027159276826076748
            },
            {
              "id": "safety_sample_12",
              "rewards": [
                -0.005721587376051075,
                -0.492406099279279,
                -0.45860856373044373,
                -0.28962088598626734,
                -0.5059251134988131,
                -0.6816722983527564,
                -0.7898244121090293
              ],
              "variance": 0.5488719773130848,
              "mean_reward": -0.4605398514760914,
              "min_reward": -0.7898244121090293,
              "max_reward": -0.005721587376051075,
              "num_responses": 7,
              "rvariance": 0.056639976669465075
            },
            {
              "id": "safety_sample_173",
              "rewards": [
                1.6300791331875761,
                1.302243038363874,
                1.437433180559215,
                1.244787227930854,
                0.7547229624727425,
                0.8876489338295581
              ],
              "variance": 0.7125702087222452,
              "mean_reward": 1.2094857460573034,
              "min_reward": 0.7547229624727425,
              "max_reward": 1.6300791331875761,
              "num_responses": 6,
              "rvariance": 0.09151617718845485
            },
            {
              "id": "safety_sample_67",
              "rewards": [
                -0.4180515210718414,
                -0.47212757794997784,
                -1.114280753377848,
                -0.33017792864486967,
                -0.4450895495109096,
                -1.0196476538411092,
                -1.0061286396215752
              ],
              "variance": 0.6745988095547522,
              "mean_reward": -0.6865005177168759,
              "min_reward": -1.114280753377848,
              "max_reward": -0.33017792864486967,
              "num_responses": 7,
              "rvariance": 0.09991582068562976
            },
            {
              "id": "safety_sample_154",
              "rewards": [
                1.0614355975784227,
                0.6178429434999597,
                1.0107392942551696,
                1.1264958535099305,
                1.0462267065814468,
                1.0639704127445853,
                0.9234994056197386
              ],
              "variance": 0.28774376827889625,
              "mean_reward": 0.9786014591127504,
              "min_reward": 0.6178429434999597,
              "max_reward": 1.1264958535099305,
              "num_responses": 7,
              "rvariance": 0.02497300886611254
            },
            {
              "id": "safety_sample_17",
              "rewards": [
                0.5333491046278716,
                0.4606844031978757,
                -0.039519122924886345,
                0.20044337947184407,
                -0.026000108705352236
              ],
              "variance": 0.538394741292946,
              "mean_reward": 0.22579153113347053,
              "min_reward": -0.039519122924886345,
              "max_reward": 0.5333491046278716,
              "num_responses": 5,
              "rvariance": 0.05683952484053726
            },
            {
              "id": "safety_sample_249",
              "rewards": [
                -0.5059251134988131,
                -0.5262036348281143,
                -0.33693743575463675,
                -0.6951913125722906,
                -0.32341842153510264,
                -0.5397226490476483
              ],
              "variance": 0.28727905216509975,
              "mean_reward": -0.4878997612061009,
              "min_reward": -0.6951913125722906,
              "max_reward": -0.32341842153510264,
              "num_responses": 6,
              "rvariance": 0.016215205639574484
            },
            {
              "id": "safety_sample_266",
              "rewards": [
                -0.039519122924886345,
                -0.4450895495109096,
                -0.5735201845964836,
                -0.2558233504374321,
                -0.33017792864486967,
                -0.2963803930960344,
                -0.019240601595585185
              ],
              "variance": 0.4650540891519733,
              "mean_reward": -0.2799644472580287,
              "min_reward": -0.5735201845964836,
              "max_reward": -0.019240601595585185,
              "num_responses": 7,
              "rvariance": 0.034657973936496625
            },
            {
              "id": "safety_sample_133",
              "rewards": [
                1.1400148677294646,
                0.8358370477899472,
                0.9731395359570905,
                1.3326608203578256,
                1.1467743748392316,
                0.890784447381452
              ],
              "variance": 0.37640685001282903,
              "mean_reward": 1.0532018490091686,
              "min_reward": 0.8358370477899472,
              "max_reward": 1.3326608203578256,
              "num_responses": 6,
              "rvariance": 0.02907107960143623
            },
            {
              "id": "safety_sample_125",
              "rewards": [
                1.7923073038219852,
                1.373217863016428,
                1.4306736734494478,
                1.4408129341140985,
                1.309002545473641,
                1.2414074743759704
              ],
              "variance": 0.3413551090432363,
              "mean_reward": 1.431236965708595,
              "min_reward": 1.2414074743759704,
              "max_reward": 1.7923073038219852,
              "num_responses": 6,
              "rvariance": 0.03080108518022882
            },
            {
              "id": "safety_sample_182",
              "rewards": [
                1.4543319483336326,
                1.2684455028150385,
                1.6604969151815279,
                1.5253067729861867,
                1.359698848796894,
                1.6638766687364113,
                1.4915092374373515
              ],
              "variance": 0.3386513061993295,
              "mean_reward": 1.489095127755292,
              "min_reward": 1.2684455028150385,
              "max_reward": 1.6638766687364113,
              "num_responses": 7,
              "rvariance": 0.018268914802083567
            },
            {
              "id": "safety_sample_117",
              "rewards": [
                1.4813699767727009,
                0.7555679008614634,
                1.2430973511534122,
                1.2278884601564364,
                1.3191418061382916,
                1.2211289530466694
              ],
              "variance": 0.4119074645014298,
              "mean_reward": 1.2080324080214957,
              "min_reward": 0.7555679008614634,
              "max_reward": 1.4813699767727009,
              "num_responses": 6,
              "rvariance": 0.04892969793584897
            },
            {
              "id": "safety_sample_242",
              "rewards": [
                1.0597457208009808,
                0.8982040626074073,
                1.0673501662994689,
                0.9875034885653454,
                0.8104888961283208,
                0.8777143066809259
              ],
              "variance": 0.21944634214560155,
              "mean_reward": 0.9501677735137416,
              "min_reward": 0.8104888961283208,
              "max_reward": 1.0673501662994689,
              "num_responses": 6,
              "rvariance": 0.009098819370665074
            },
            {
              "id": "safety_sample_70",
              "rewards": [
                0.07201274438627005,
                -0.30989940731556853,
                -0.0462786300346534,
                0.09905077282533827,
                -0.28962088598626734,
                -0.06655715136395456,
                -0.039519122924886345
              ],
              "variance": 0.38056025027988516,
              "mean_reward": -0.08297309720196026,
              "min_reward": -0.30989940731556853,
              "max_reward": 0.09905077282533827,
              "num_responses": 7,
              "rvariance": 0.02212233918038135
            },
            {
              "id": "safety_sample_31",
              "rewards": [
                0.4640641567527592,
                -0.36397546419370497,
                -0.0462786300346534,
                0.19706362591696056,
                0.10919003348998885,
                0.42350711409415687,
                0.25113968279509696
              ],
              "variance": 0.6130872948558718,
              "mean_reward": 0.14781578840294343,
              "min_reward": -0.36397546419370497,
              "max_reward": 0.4640641567527592,
              "num_responses": 7,
              "rvariance": 0.07003068466330548
            },
            {
              "id": "safety_sample_59",
              "rewards": [
                1.0031348487566818,
                0.5232098439632209,
                0.8877545511281483,
                0.49955156907903625,
                0.4911021851918274,
                0.5772859008413573
              ],
              "variance": 0.45011782280698326,
              "mean_reward": 0.663673149826712,
              "min_reward": 0.4911021851918274,
              "max_reward": 1.0031348487566818,
              "num_responses": 6,
              "rvariance": 0.04155934127218759
            },
            {
              "id": "safety_sample_149",
              "rewards": [
                1.5117877587666526,
                0.9963753416469147,
                1.1552237587264405,
                1.515167512321536,
                1.2464771047082956,
                1.251546735040621,
                1.3765976165713114
              ],
              "variance": 0.42145526829397584,
              "mean_reward": 1.2933108325402534,
              "min_reward": 0.9963753416469147,
              "max_reward": 1.515167512321536,
              "num_responses": 7,
              "rvariance": 0.030723657951467472
            },
            {
              "id": "safety_sample_309",
              "rewards": [
                1.2464771047082956,
                0.5857352847285662,
                0.09905077282533827,
                0.5147604600760121,
                0.39646908565508865,
                0.14298756903882412,
                0.38295007143555454
              ],
              "variance": 0.7246191621670284,
              "mean_reward": 0.48120433549538283,
              "min_reward": 0.09905077282533827,
              "max_reward": 1.2464771047082956,
              "num_responses": 7,
              "rvariance": 0.12499443338406213
            }
          ]
        }
      },
      "overall_stats": {
        "mean_variance_across_files": 0.7231722954949729,
        "mean_rvariance_across_files": 0.15433791823204462,
        "total_processed_files": 4
      }
    }
  },
  "summary": {
    "model_comparison": {
      "Skywork-Reward-Llama-3.1-8B": {
        "mean_variance": 0.7231722954949729,
        "mean_rvariance": 0.15433791823204462
      }
    }
  }
}