{
  "models": {
    "RM-Mistral-7B": {
      "model_name": "RM-Mistral-7B",
      "model_path": "weqweasdas/RM-Mistral-7B",
      "files": {
        "semantic_benchmark_chat_filtered.json": {
          "file_name": "semantic_benchmark_chat_filtered.json",
          "processed_samples": 200,
          "global_mean": 7.0428759350910495,
          "global_std": 2.6578266510317454,
          "mean_variance": 0.34833306324413227,
          "mean_rvariance": 0.03422093241898524,
          "sample_results": [
            {
              "id": "chat_sample_306",
              "rewards": [
                -0.09843604171456725,
                0.16023395082731595,
                0.45417712417036504,
                0.16023395082731595,
                0.019141227622652385,
                -0.29831739958784065,
                0.6187853012424726
              ],
              "variance": 0.6984089798630848,
              "mean_reward": 0.145116873341102,
              "min_reward": -0.29831739958784065,
              "max_reward": 0.6187853012424726,
              "num_responses": 7,
              "rvariance": 0.08459413006442366
            },
            {
              "id": "chat_sample_202",
              "rewards": [
                -1.2389355542855978,
                -1.3917860044239834,
                -1.5034844102943419,
                -0.9920232886774365,
                -0.9097192001413827,
                -1.479968956426898,
                -1.0743273772134903
              ],
              "variance": 0.5302734847108606,
              "mean_reward": -1.2271778273518756,
              "min_reward": -1.5034844102943419,
              "max_reward": -0.9097192001413827,
              "num_responses": 7,
              "rvariance": 0.04956052513929758
            },
            {
              "id": "chat_sample_298",
              "rewards": [
                -0.8038996577378851,
                -0.7921419308041631,
                -1.0743273772134903,
                -1.4740900929600371,
                -0.8744460193402168,
                -0.7803842038704412,
                -0.8862037462739388
              ],
              "variance": 0.4467936234814346,
              "mean_reward": -0.9550704326000247,
              "min_reward": -1.4740900929600371,
              "max_reward": -0.7803842038704412,
              "num_responses": 7,
              "rvariance": 0.053537160222201965
            },
            {
              "id": "chat_sample_268",
              "rewards": [
                -0.12195149558201118,
                -0.509956484394836,
                -0.2160133110517869,
                -0.3453483073227285,
                -0.15722467638317708,
                -0.2865596726541187,
                -0.2160133110517869
              ],
              "variance": 0.26807617408886075,
              "mean_reward": -0.26472389406292074,
              "min_reward": -0.509956484394836,
              "max_reward": -0.12195149558201118,
              "num_responses": 7,
              "rvariance": 0.014828800280770101
            },
            {
              "id": "chat_sample_303",
              "rewards": [
                -1.2800875985536246,
                -1.3976648678908443,
                -1.3506339601559565,
                -2.1530988233824804,
                -1.3506339601559565,
                -2.812266389604268,
                -1.3506339601559565
              ],
              "variance": 1.0943504343561719,
              "mean_reward": -1.670717079985584,
              "min_reward": -2.812266389604268,
              "max_reward": -1.2800875985536246,
              "num_responses": 7,
              "rvariance": 0.29576221224953697
            },
            {
              "id": "chat_sample_65",
              "rewards": [
                1.0185480169890193,
                0.5247234857726968,
                1.0185480169890193,
                1.0185480169890193,
                0.7833934783145801,
                0.7833934783145801,
                0.9715171092541315
              ],
              "variance": 0.3386225356911925,
              "mean_reward": 0.8740959432318638,
              "min_reward": 0.5247234857726968,
              "max_reward": 1.0185480169890193,
              "num_responses": 7,
              "rvariance": 0.030086439534652284
            },
            {
              "id": "chat_sample_212",
              "rewards": [
                0.5482389396401407,
                1.0420634708564633,
                0.7833934783145801,
                0.9715171092541315,
                0.7833934783145801,
                0.7598780244471361,
                1.1596407401936828
              ],
              "variance": 0.4138719880670132,
              "mean_reward": 0.8640178915743879,
              "min_reward": 0.5482389396401407,
              "max_reward": 1.1596407401936828,
              "num_responses": 7,
              "rvariance": 0.03631588988091187
            },
            {
              "id": "chat_sample_262",
              "rewards": [
                1.2301871017960146,
                0.8539398399169118,
                0.7363625705796921,
                1.3007334633983465,
                1.3712798250006781,
                0.9244862015192435,
                1.3477643711332343
              ],
              "variance": 0.5502616204981878,
              "mean_reward": 1.1092504819063032,
              "min_reward": 0.7363625705796921,
              "max_reward": 1.3712798250006781,
              "num_responses": 7,
              "rvariance": 0.05931520112308042
            },
            {
              "id": "chat_sample_178",
              "rewards": [
                -0.5569873921297238,
                -0.42765239585878223,
                -0.7215955692018313,
                -0.42765239585878223,
                -0.6510492075994996,
                -0.42765239585878223,
                -0.5922605729308897
              ],
              "variance": 0.25161535638165,
              "mean_reward": -0.5435499899197559,
              "min_reward": -0.7215955692018313,
              "max_reward": -0.42765239585878223,
              "num_responses": 7,
              "rvariance": 0.012300907386635779
            },
            {
              "id": "chat_sample_290",
              "rewards": [
                -0.11019376864828921,
                0.019141227622652385,
                0.054414408423818277,
                0.18374940469475987,
                0.0779298622912622,
                -0.004374226244791544,
                0.0779298622912622
              ],
              "variance": 0.1669597224588519,
              "mean_reward": 0.042656681490096306,
              "min_reward": -0.11019376864828921,
              "max_reward": 0.18374940469475987,
              "num_responses": 7,
              "rvariance": 0.006951705458869394
            },
            {
              "id": "chat_sample_292",
              "rewards": [
                -0.3453483073227285,
                -0.2865596726541187,
                -0.2630442187866747,
                -0.8979614732076608,
                -0.12195149558201118,
                -0.07492058784712333,
                -0.15722467638317708
              ],
              "variance": 0.4632544411886454,
              "mean_reward": -0.30671577596907057,
              "min_reward": -0.8979614732076608,
              "max_reward": -0.07492058784712333,
              "num_responses": 7,
              "rvariance": 0.06622740825547895
            },
            {
              "id": "chat_sample_116",
              "rewards": [
                0.2778112201645356,
                0.5247234857726968,
                0.7363625705796921,
                0.45417712417036504,
                0.38363076256803325,
                0.4071462164354772,
                0.7833934783145801
              ],
              "variance": 0.4138719880670131,
              "mean_reward": 0.5096064082864828,
              "min_reward": 0.2778112201645356,
              "max_reward": 0.7833934783145801,
              "num_responses": 7,
              "rvariance": 0.029967944555239732
            },
            {
              "id": "chat_sample_106",
              "rewards": [
                -0.6510492075994996,
                -0.36886376119017245,
                -0.839172838539051,
                -0.45116784972622614,
                -0.46292557665994816,
                -0.2630442187866747
              ],
              "variance": 0.4291570330808516,
              "mean_reward": -0.5060372420835954,
              "min_reward": -0.839172838539051,
              "max_reward": -0.2630442187866747,
              "num_responses": 6,
              "rvariance": 0.03578987248553025
            },
            {
              "id": "chat_sample_251",
              "rewards": [
                -0.20425558411806494,
                -0.5805028459971677,
                0.3483575817668674,
                0.2425380393633697,
                0.23078031242964772,
                0.03089895455637435,
                0.3013266740319795
              ],
              "variance": 0.6748935259956407,
              "mean_reward": 0.05273473314757229,
              "min_reward": -0.5805028459971677,
              "max_reward": 0.3483575817668674,
              "num_responses": 7,
              "rvariance": 0.09777528586955261
            },
            {
              "id": "chat_sample_280",
              "rewards": [
                -1.1977835100175709,
                -1.3094819158879296,
                -1.0037810156111584,
                -1.162510329216405,
                -1.1096005580146562,
                -1.0860851041472122,
                -1.1977835100175709
              ],
              "variance": 0.18929940363292364,
              "mean_reward": -1.1524322775589293,
              "min_reward": -1.3094819158879296,
              "max_reward": -1.0037810156111584,
              "num_responses": 7,
              "rvariance": 0.008173332270432083
            },
            {
              "id": "chat_sample_58",
              "rewards": [
                -0.5334719382622799,
                -0.13370922251573314,
                -0.180740130250621,
                -0.6510492075994996,
                -0.49819875746111403,
                0.00738350068893042,
                -0.42765239585878223
              ],
              "variance": 0.5032307127633,
              "mean_reward": -0.3453483073227285,
              "min_reward": -0.6510492075994996,
              "max_reward": 0.00738350068893042,
              "num_responses": 7,
              "rvariance": 0.05075534951504074
            },
            {
              "id": "chat_sample_90",
              "rewards": [
                -0.7568687500029972,
                -0.5687451190634458,
                -1.2742087350867637,
                -1.0508119233460462,
                -0.5687451190634458,
                -0.5922605729308897
              ],
              "variance": 0.5937652101529591,
              "mean_reward": -0.8019400365822648,
              "min_reward": -1.2742087350867637,
              "max_reward": -0.5687451190634458,
              "num_responses": 6,
              "rvariance": 0.07328859617879235
            },
            {
              "id": "chat_sample_180",
              "rewards": [
                -0.19249785718434295,
                -0.45116784972622614,
                -0.22777103798550885,
                -0.09843604171456725,
                -0.19249785718434295
              ],
              "variance": 0.22574835712746172,
              "mean_reward": -0.23247412875899762,
              "min_reward": -0.45116784972622614,
              "max_reward": -0.09843604171456725,
              "num_responses": 5,
              "rvariance": 0.013802295201973413
            },
            {
              "id": "chat_sample_291",
              "rewards": [
                0.054414408423818277,
                0.36011530870058933,
                -0.02788968011223547,
                0.19550713162848185,
                -0.36886376119017245,
                0.25429576629709166
              ],
              "variance": 0.5055822581500444,
              "mean_reward": 0.0779298622912622,
              "min_reward": -0.36886376119017245,
              "max_reward": 0.36011530870058933,
              "num_responses": 6,
              "rvariance": 0.055988877772428225
            },
            {
              "id": "chat_sample_129",
              "rewards": [
                -0.32183285345528456,
                0.00738350068893042,
                -0.016131953178513507,
                0.04265668149009631,
                -0.08667831478084528,
                -0.5687451190634458,
                -0.3453483073227285
              ],
              "variance": 0.4561998050284122,
              "mean_reward": -0.18409948080311297,
              "min_reward": -0.5687451190634458,
              "max_reward": 0.04265668149009631,
              "num_responses": 7,
              "rvariance": 0.04553028518475417
            },
            {
              "id": "chat_sample_31",
              "rewards": [
                0.23078031242964772,
                -0.13370922251573314,
                -0.3100751265215626,
                -0.7686264769367191,
                -0.19249785718434295,
                0.06617213535754024
              ],
              "variance": 0.6878270256227348,
              "mean_reward": -0.18465937256186163,
              "min_reward": -0.7686264769367191,
              "max_reward": 0.23078031242964772,
              "num_responses": 6,
              "rvariance": 0.09915177119918356
            },
            {
              "id": "chat_sample_294",
              "rewards": [
                0.36011530870058933,
                -0.27480194572039673,
                0.16023395082731595,
                0.03089895455637435,
                0.5717543935075847,
                -0.09843604171456725,
                0.23078031242964772
              ],
              "variance": 0.6137533459402866,
              "mean_reward": 0.14007784751236402,
              "min_reward": -0.27480194572039673,
              "max_reward": 0.5717543935075847,
              "num_responses": 7,
              "rvariance": 0.06918978274079263
            },
            {
              "id": "chat_sample_128",
              "rewards": [
                -0.3453483073227285,
                -1.0037810156111584,
                -0.9214769270751048,
                -1.0390541964123243,
                -0.7686264769367191,
                -0.7803842038704412,
                -0.9920232886774365
              ],
              "variance": 0.41857507884050205,
              "mean_reward": -0.8358134879865589,
              "min_reward": -1.0390541964123243,
              "max_reward": -0.3453483073227285,
              "num_responses": 7,
              "rvariance": 0.04991459942301838
            },
            {
              "id": "chat_sample_173",
              "rewards": [
                -0.039647407045957435,
                -0.6275337537320557,
                -0.6040182998646118,
                -0.32183285345528456,
                -0.46292557665994816,
                -0.839172838539051,
                -0.15722467638317708
              ],
              "variance": 0.6019956190065645,
              "mean_reward": -0.43605077224001226,
              "min_reward": -0.839172838539051,
              "max_reward": -0.039647407045957435,
              "num_responses": 7,
              "rvariance": 0.06800483294666716
            },
            {
              "id": "chat_sample_174",
              "rewards": [
                -0.9567501078762706,
                -0.827415111605329,
                -0.9332346540088267,
                -0.839172838539051,
                -0.7333532961355533,
                -0.8509305654727729,
                -0.9097192001413827
              ],
              "variance": 0.1528504501383856,
              "mean_reward": -0.8643679676827408,
              "min_reward": -0.9567501078762706,
              "max_reward": -0.7333532961355533,
              "num_responses": 7,
              "rvariance": 0.004954218663057894
            },
            {
              "id": "chat_sample_297",
              "rewards": [
                0.28956894709825753,
                0.2778112201645356,
                -0.16898240331689904,
                -1.1977835100175709,
                0.5952698473750286,
                0.25429576629709166,
                0.23078031242964772
              ],
              "variance": 0.9923521532061338,
              "mean_reward": 0.04013716857572732,
              "min_reward": -1.1977835100175709,
              "max_reward": 0.5952698473750286,
              "num_responses": 7,
              "rvariance": 0.297894967588625
            },
            {
              "id": "chat_sample_264",
              "rewards": [
                -2.6123850317309945,
                -3.58460207756313,
                -2.3441618860554625,
                -2.5598426894959245,
                -3.608117531430574
              ],
              "variance": 1.1682771424519487,
              "mean_reward": -2.9418218432552172,
              "min_reward": -3.608117531430574,
              "max_reward": -2.3441618860554625,
              "num_responses": 5,
              "rvariance": 0.2937500969663863
            },
            {
              "id": "chat_sample_275",
              "rewards": [
                0.18374940469475987,
                0.10144531615870613,
                0.23078031242964772,
                0.19550713162848185,
                0.3483575817668674,
                0.136718496959872,
                0.25429576629709166
              ],
              "variance": 0.1693112678455963,
              "mean_reward": 0.2072648585622038,
              "min_reward": 0.10144531615870613,
              "max_reward": 0.3483575817668674,
              "num_responses": 7,
              "rvariance": 0.005648260685331382
            },
            {
              "id": "chat_sample_172",
              "rewards": [
                0.2425380393633697,
                -0.839172838539051,
                -0.5687451190634458,
                -0.27480194572039673,
                -0.46292557665994816,
                -0.5687451190634458,
                -0.6275337537320557
              ],
              "variance": 0.6443234359679637,
              "mean_reward": -0.4427694733449962,
              "min_reward": -0.839172838539051,
              "max_reward": 0.2425380393633697,
              "num_responses": 7,
              "rvariance": 0.10303984852631005
            },
            {
              "id": "chat_sample_145",
              "rewards": [
                0.5717543935075847,
                0.4071462164354772,
                1.1596407401936828,
                1.136125286326239,
                0.9715171092541315,
                1.3947952788681222,
                1.3947952788681222
              ],
              "variance": 0.8888841561893804,
              "mean_reward": 1.0051106147790512,
              "min_reward": 0.4071462164354772,
              "max_reward": 1.3947952788681222,
              "num_responses": 7,
              "rvariance": 0.12732003406974754
            },
            {
              "id": "chat_sample_270",
              "rewards": [
                0.5482389396401407,
                0.5247234857726968,
                0.6423007551099165,
                0.7833934783145801,
                0.5717543935075847,
                0.9009707476517996,
                0.9009707476517996
              ],
              "variance": 0.3621379895586365,
              "mean_reward": 0.6960503639497883,
              "min_reward": 0.5247234857726968,
              "max_reward": 0.9009707476517996,
              "num_responses": 7,
              "rvariance": 0.023021881714437604
            },
            {
              "id": "chat_sample_278",
              "rewards": [
                0.08968758922498417,
                -0.29831739958784065,
                0.21902258549592576,
                0.2660534932308136,
                0.28956894709825753,
                0.2660534932308136,
                0.2072648585622038
              ],
              "variance": 0.3409740810779369,
              "mean_reward": 0.14847622389359397,
              "min_reward": -0.29831739958784065,
              "max_reward": 0.28956894709825753,
              "num_responses": 7,
              "rvariance": 0.03700993190318535
            },
            {
              "id": "chat_sample_165",
              "rewards": [
                -0.2395287649192308,
                0.28956894709825753,
                0.3483575817668674,
                0.36011530870058933,
                0.36011530870058933,
                0.36011530870058933,
                0.4071462164354772
              ],
              "variance": 0.30099780950328225,
              "mean_reward": 0.2694128437833056,
              "min_reward": -0.2395287649192308,
              "max_reward": 0.4071462164354772,
              "num_responses": 7,
              "rvariance": 0.044187342084745306
            },
            {
              "id": "chat_sample_127",
              "rewards": [
                0.3365998548331454,
                0.9950325631215754,
                1.0890943785913512,
                0.7128471167122482,
                0.5717543935075847,
                0.7128471167122482,
                0.5482389396401407
              ],
              "variance": 0.569073983592143,
              "mean_reward": 0.7094877661597562,
              "min_reward": 0.3365998548331454,
              "max_reward": 1.0890943785913512,
              "num_responses": 7,
              "rvariance": 0.05852523459366345
            },
            {
              "id": "chat_sample_256",
              "rewards": [
                -0.3453483073227285,
                -0.07492058784712333,
                -0.13370922251573314,
                -0.19249785718434295,
                -0.1454669494494551,
                -0.13370922251573314,
                -0.09843604171456725
              ],
              "variance": 0.16460817707210745,
              "mean_reward": -0.16058402693566906,
              "min_reward": -0.3453483073227285,
              "max_reward": -0.07492058784712333,
              "num_responses": 7,
              "rvariance": 0.006861423569793168
            },
            {
              "id": "chat_sample_114",
              "rewards": [
                -0.8509305654727729,
                -0.42765239585878223,
                -0.7098378422681094,
                -0.7686264769367191,
                -0.45116784972622614,
                -0.8979614732076608,
                -0.6863223884006654
              ],
              "variance": 0.4279812603874795,
              "mean_reward": -0.6846427131244194,
              "min_reward": -0.8979614732076608,
              "max_reward": -0.42765239585878223,
              "num_responses": 7,
              "rvariance": 0.028771709524979743
            },
            {
              "id": "chat_sample_119",
              "rewards": [
                -2.3103584211210118,
                -2.0854918935135793,
                -1.797427583637391,
                -1.9150048529746106,
                -2.1472199599156196,
                -2.1060679156475928,
                -2.132522801248467
              ],
              "variance": 0.34450139915805367,
              "mean_reward": -2.070584775436896,
              "min_reward": -2.3103584211210118,
              "max_reward": -1.797427583637391,
              "num_responses": 7,
              "rvariance": 0.023928844402843024
            },
            {
              "id": "chat_sample_179",
              "rewards": [
                -0.6040182998646118,
                -0.9567501078762706,
                -0.8626882924064949,
                -0.5569873921297238,
                -0.6157760267983337,
                -0.6392914806657776,
                -0.9097192001413827
              ],
              "variance": 0.34332562646468134,
              "mean_reward": -0.7350329714117992,
              "min_reward": -0.9567501078762706,
              "max_reward": -0.5569873921297238,
              "num_responses": 7,
              "rvariance": 0.02403191034847788
            },
            {
              "id": "chat_sample_191",
              "rewards": [
                -0.39237921505761636,
                0.1719916777610379,
                0.12496077002615005,
                0.2660534932308136,
                0.25429576629709166,
                0.19550713162848185,
                0.28956894709825753
              ],
              "variance": 0.35743489878514767,
              "mean_reward": 0.12999979585488805,
              "min_reward": -0.39237921505761636,
              "max_reward": 0.28956894709825753,
              "num_responses": 7,
              "rvariance": 0.04834030898225169
            },
            {
              "id": "chat_sample_156",
              "rewards": [
                0.2778112201645356,
                0.5012080319052529,
                0.5952698473750286,
                0.806908932182024,
                0.7128471167122482,
                0.5952698473750286
              ],
              "variance": 0.3703683984122419,
              "mean_reward": 0.5815524992856863,
              "min_reward": 0.2778112201645356,
              "max_reward": 0.806908932182024,
              "num_responses": 6,
              "rvariance": 0.027852354628492584
            },
            {
              "id": "chat_sample_166",
              "rewards": [
                -0.521714211328558,
                -0.32183285345528456,
                -0.39237921505761636,
                -0.29831739958784065,
                -0.5687451190634458,
                -0.4746833035936701,
                -0.4746833035936701
              ],
              "variance": 0.2280999025142062,
              "mean_reward": -0.4360507722400122,
              "min_reward": -0.5687451190634458,
              "max_reward": -0.29831739958784065,
              "num_responses": 7,
              "rvariance": 0.00883633989333561
            },
            {
              "id": "chat_sample_245",
              "rewards": [
                -0.5452296651960019,
                -0.6745646614669435,
                -0.39237921505761636,
                -0.7686264769367191,
                -0.8038996577378851,
                -0.5569873921297238,
                -0.4041369419913383
              ],
              "variance": 0.38330189803933595,
              "mean_reward": -0.5922605729308897,
              "min_reward": -0.8038996577378851,
              "max_reward": -0.39237921505761636,
              "num_responses": 7,
              "rvariance": 0.023067022658975717
            },
            {
              "id": "chat_sample_161",
              "rewards": [
                0.9009707476517996,
                1.112609832458795,
                1.3242489172657903,
                1.1831561940611268,
                1.2772180095309025,
                1.2301871017960146,
                1.3947952788681222
              ],
              "variance": 0.3245132633707264,
              "mean_reward": 1.2033122973760786,
              "min_reward": 0.9009707476517996,
              "max_reward": 1.3947952788681222,
              "num_responses": 7,
              "rvariance": 0.022502760852249306
            },
            {
              "id": "chat_sample_296",
              "rewards": [
                -1.7092446316344763,
                -1.5799096353635347,
                -2.294191546587144,
                -2.483050035460053
              ],
              "variance": 0.8076823545533633,
              "mean_reward": -2.016598962261302,
              "min_reward": -2.483050035460053,
              "max_reward": -1.5799096353635347,
              "num_responses": 4,
              "rvariance": 0.1449496248356139
            },
            {
              "id": "chat_sample_130",
              "rewards": [
                0.18374940469475987,
                0.47769257803780896,
                0.47769257803780896,
                0.6658162089773604,
                0.5952698473750286,
                0.6187853012424726,
                0.7833934783145801
              ],
              "variance": 0.352731808011659,
              "mean_reward": 0.5431999138114029,
              "min_reward": 0.18374940469475987,
              "max_reward": 0.7833934783145801,
              "num_responses": 7,
              "rvariance": 0.03127703194684501
            },
            {
              "id": "chat_sample_18",
              "rewards": [
                0.9950325631215754,
                0.9244862015192435,
                1.0185480169890193,
                0.9950325631215754,
                0.9715171092541315,
                1.0890943785913512,
                1.0890943785913512
              ],
              "variance": 0.13638963243117486,
              "mean_reward": 1.0118293158840355,
              "min_reward": 0.9244862015192435,
              "max_reward": 1.0890943785913512,
              "num_responses": 7,
              "rvariance": 0.0031147251731297974
            },
            {
              "id": "chat_sample_44",
              "rewards": [
                -0.42765239585878223,
                -0.7098378422681094,
                -0.0514051339796794,
                -0.08667831478084528,
                -0.27480194572039673,
                0.1132030430924281,
                -0.16898240331689904
              ],
              "variance": 0.5549647112716767,
              "mean_reward": -0.22945071326175487,
              "min_reward": -0.7098378422681094,
              "max_reward": 0.1132030430924281,
              "num_responses": 7,
              "rvariance": 0.0636092334722684
            },
            {
              "id": "chat_sample_215",
              "rewards": [
                -2.4668831609261854,
                -2.3265252956548794,
                -2.173674845516494,
                -2.4000110889906416,
                -2.3147675687211575,
                -2.3500407495223232
              ],
              "variance": 0.18922591783958786,
              "mean_reward": -2.33865045155528,
              "min_reward": -2.4668831609261854,
              "max_reward": -2.173674845516494,
              "num_responses": 6,
              "rvariance": 0.008045476092132875
            },
            {
              "id": "chat_sample_300",
              "rewards": [
                -0.0514051339796794,
                -0.3100751265215626,
                -0.4041369419913383,
                -0.3100751265215626,
                -1.156631465749544,
                -0.9332346540088267
              ],
              "variance": 0.8641929296285642,
              "mean_reward": -0.527593074795419,
              "min_reward": -1.156631465749544,
              "max_reward": -0.0514051339796794,
              "num_responses": 6,
              "rvariance": 0.14947647923811852
            },
            {
              "id": "chat_sample_169",
              "rewards": [
                -1.121358284948378,
                -1.3212396428216515,
                -1.2506932812193197,
                -0.9920232886774365,
                -1.2624510081530416,
                -0.9685078348099926
              ],
              "variance": 0.31157976374363194,
              "mean_reward": -1.1527122234383034,
              "min_reward": -1.3212396428216515,
              "max_reward": -0.9685078348099926,
              "num_responses": 6,
              "rvariance": 0.01846327327365122
            },
            {
              "id": "chat_sample_82",
              "rewards": [
                -0.6040182998646118,
                -0.48644103052739207,
                -1.0860851041472122,
                -1.4211803217582881,
                -1.144873738815822,
                -0.3806214881238944,
                -1.2389355542855978
              ],
              "variance": 0.8677202477086808,
              "mean_reward": -0.9088793625032598,
              "min_reward": -1.4211803217582881,
              "max_reward": -0.3806214881238944,
              "num_responses": 7,
              "rvariance": 0.1441336252556778
            },
            {
              "id": "chat_sample_77",
              "rewards": [
                0.04265668149009631,
                -0.180740130250621,
                -0.1454669494494551,
                -0.22777103798550885,
                -0.004374226244791544,
                -0.039647407045957435
              ],
              "variance": 0.22339681174071732,
              "mean_reward": -0.09255717824770628,
              "min_reward": -0.22777103798550885,
              "max_reward": 0.04265668149009631,
              "num_responses": 6,
              "rvariance": 0.009619488259254641
            },
            {
              "id": "chat_sample_277",
              "rewards": [
                -1.5034844102943419,
                -1.5505153180292297,
                -1.6680925873664494,
                -1.8385796279054178,
                -1.1096005580146562
              ],
              "variance": 0.5032307127633,
              "mean_reward": -1.534054500322019,
              "min_reward": -1.8385796279054178,
              "max_reward": -1.1096005580146562,
              "num_responses": 5,
              "rvariance": 0.0584136800344736
            },
            {
              "id": "chat_sample_73",
              "rewards": [
                -1.9737934876432204,
                -1.832700764438557,
                -1.6386982700321444,
                -1.6916080412338934,
                -1.9091259895077497,
                -1.6445771334990056
              ],
              "variance": 0.29982203680991004,
              "mean_reward": -1.7817506143924284,
              "min_reward": -1.9737934876432204,
              "max_reward": -1.6386982700321444,
              "num_responses": 6,
              "rvariance": 0.017184514954157484
            },
            {
              "id": "chat_sample_6",
              "rewards": [
                -1.7268812220350593,
                -1.6093039526978397,
                -1.2154201004181537,
                -1.3153607793547906,
                -1.4329380486920102,
                -1.2271778273518759,
                -1.2859664620204856
              ],
              "variance": 0.4338601238543405,
              "mean_reward": -1.4018640560814593,
              "min_reward": -1.7268812220350593,
              "max_reward": -1.2154201004181537,
              "num_responses": 7,
              "rvariance": 0.03368925117060043
            },
            {
              "id": "chat_sample_80",
              "rewards": [
                -2.1060679156475928,
                -2.754212612869016,
                -2.754212612869016,
                -2.6393451321610524
              ],
              "variance": 0.4881615322673851,
              "mean_reward": -2.563459568386669,
              "min_reward": -2.754212612869016,
              "max_reward": -2.1060679156475928,
              "num_responses": 4,
              "rvariance": 0.07193479768582703
            },
            {
              "id": "chat_sample_224",
              "rewards": [
                -1.4035437313577053,
                -1.9326414433751935,
                -1.8385796279054178,
                -1.5681519084298128,
                -1.6504559969658665,
                -1.9003076943074582,
                -1.7033657681676153
              ],
              "variance": 0.4109325563335826,
              "mean_reward": -1.7138637386441524,
              "min_reward": -1.9326414433751935,
              "max_reward": -1.4035437313577053,
              "num_responses": 7,
              "rvariance": 0.03140575417150445
            },
            {
              "id": "chat_sample_267",
              "rewards": [
                0.47769257803780896,
                -0.004374226244791544,
                0.16023395082731595,
                0.43066167030292113,
                0.23078031242964772,
                0.04265668149009631,
                0.1719916777610379
              ],
              "variance": 0.42562971500073515,
              "mean_reward": 0.21566323494343378,
              "min_reward": -0.004374226244791544,
              "max_reward": 0.47769257803780896,
              "num_responses": 7,
              "rvariance": 0.02834851316993493
            },
            {
              "id": "chat_sample_308",
              "rewards": [
                0.19550713162848185,
                -0.27480194572039673,
                0.136718496959872,
                0.2425380393633697,
                0.3483575817668674,
                0.21902258549592576,
                0.1132030430924281
              ],
              "variance": 0.3268648087574706,
              "mean_reward": 0.14007784751236402,
              "min_reward": -0.27480194572039673,
              "max_reward": 0.3483575817668674,
              "num_responses": 7,
              "rvariance": 0.03372028556997037
            },
            {
              "id": "chat_sample_252",
              "rewards": [
                0.3483575817668674,
                0.5012080319052529,
                0.28956894709825753,
                0.7363625705796921,
                0.5952698473750286,
                0.6658162089773604,
                0.6187853012424726
              ],
              "variance": 0.3691926257188697,
              "mean_reward": 0.5364812127064188,
              "min_reward": 0.28956894709825753,
              "max_reward": 0.7363625705796921,
              "num_responses": 7,
              "rvariance": 0.023501504250155052
            },
            {
              "id": "chat_sample_159",
              "rewards": [
                0.38363076256803325,
                0.5482389396401407,
                0.8774552937843557,
                0.7598780244471361,
                0.6658162089773604,
                0.8304243860494679,
                0.8774552937843557
              ],
              "variance": 0.39505962497305797,
              "mean_reward": 0.7061284156072641,
              "min_reward": 0.38363076256803325,
              "max_reward": 0.8774552937843557,
              "num_responses": 7,
              "rvariance": 0.029657600561540202
            },
            {
              "id": "chat_sample_188",
              "rewards": [
                1.44182618660301,
                1.7004961791448931,
                1.771042540747225,
                1.4888570943378978,
                1.7004961791448931,
                1.7240116330123372,
                1.771042540747225
              ],
              "variance": 0.30099780950328237,
              "mean_reward": 1.6568246219624974,
              "min_reward": 1.44182618660301,
              "max_reward": 1.771042540747225,
              "num_responses": 7,
              "rvariance": 0.015551055393379911
            },
            {
              "id": "chat_sample_88",
              "rewards": [
                1.4183107327355662,
                0.7128471167122482,
                1.5123725482053418,
                1.5829189098076735,
                1.5123725482053418,
                1.4888570943378978,
                1.465341640470454
              ],
              "variance": 0.4044658065200355,
              "mean_reward": 1.3847172272106463,
              "min_reward": 0.7128471167122482,
              "max_reward": 1.5829189098076735,
              "num_responses": 7,
              "rvariance": 0.07739414941059464
            },
            {
              "id": "chat_sample_27",
              "rewards": [
                -0.7686264769367191,
                -0.6510492075994996,
                -0.6510492075994996,
                -0.6863223884006654,
                -0.7215955692018313,
                -1.121358284948378,
                -0.6275337537320557
              ],
              "variance": 0.26807617408886075,
              "mean_reward": -0.7467906983455214,
              "min_reward": -1.121358284948378,
              "max_reward": -0.6275337537320557,
              "num_responses": 7,
              "rvariance": 0.02537485344848673
            },
            {
              "id": "chat_sample_167",
              "rewards": [
                0.5717543935075847,
                0.5012080319052529,
                0.7363625705796921,
                0.7598780244471361,
                0.6423007551099165,
                0.7363625705796921,
                0.8774552937843557
              ],
              "variance": 0.263373083315372,
              "mean_reward": 0.6893316628448043,
              "min_reward": 0.5012080319052529,
              "max_reward": 0.8774552937843557,
              "num_responses": 7,
              "rvariance": 0.01374541761185539
            },
            {
              "id": "chat_sample_76",
              "rewards": [
                0.03089895455637435,
                -0.4158946689250603,
                -0.6863223884006654,
                -0.29831739958784065,
                -0.2395287649192308,
                -0.13370922251573314
              ],
              "variance": 0.4997033946831835,
              "mean_reward": -0.2904789149653593,
              "min_reward": -0.6863223884006654,
              "max_reward": 0.03089895455637435,
              "num_responses": 6,
              "rvariance": 0.05048983298709781
            },
            {
              "id": "chat_sample_209",
              "rewards": [
                0.3365998548331454,
                0.7128471167122482,
                0.8539398399169118,
                0.6423007551099165,
                0.47769257803780896,
                0.7598780244471361,
                0.7833934783145801
              ],
              "variance": 0.3903565341995693,
              "mean_reward": 0.6523788067673925,
              "min_reward": 0.3365998548331454,
              "max_reward": 0.8539398399169118,
              "num_responses": 7,
              "rvariance": 0.029048197810275678
            },
            {
              "id": "chat_sample_61",
              "rewards": [
                1.6299498175425615,
                1.465341640470454,
                1.5829189098076735,
                1.7945579946146688,
                1.7240116330123372,
                1.6299498175425615,
                1.5829189098076735
              ],
              "variance": 0.2163421755804842,
              "mean_reward": 1.6299498175425615,
              "min_reward": 1.465341640470454,
              "max_reward": 1.7945579946146688,
              "num_responses": 7,
              "rvariance": 0.009637591658887109
            },
            {
              "id": "chat_sample_118",
              "rewards": [
                0.5247234857726968,
                0.8539398399169118,
                1.112609832458795,
                1.0890943785913512,
                1.0655789247239071,
                0.9715171092541315,
                1.0655789247239071
              ],
              "variance": 0.37624726187910285,
              "mean_reward": 0.9547203564916715,
              "min_reward": 0.5247234857726968,
              "max_reward": 1.112609832458795,
              "num_responses": 7,
              "rvariance": 0.03755726585570997
            },
            {
              "id": "chat_sample_150",
              "rewards": [
                -0.08667831478084528,
                0.19550713162848185,
                0.136718496959872,
                0.2660534932308136,
                0.054414408423818277,
                0.28956894709825753,
                0.148476223893594
              ],
              "variance": 0.27748235563583834,
              "mean_reward": 0.14343719806485603,
              "min_reward": -0.08667831478084528,
              "max_reward": 0.28956894709825753,
              "num_responses": 7,
              "rvariance": 0.014292751564380009
            },
            {
              "id": "chat_sample_120",
              "rewards": [
                0.18374940469475987,
                0.47769257803780896,
                0.7833934783145801,
                1.0890943785913512,
                0.9950325631215754,
                0.8539398399169118,
                0.8774552937843557
              ],
              "variance": 0.6725419806088964,
              "mean_reward": 0.751479648065906,
              "min_reward": 0.18374940469475987,
              "max_reward": 1.0890943785913512,
              "num_responses": 7,
              "rvariance": 0.08542359492031149
            },
            {
              "id": "chat_sample_244",
              "rewards": [
                -0.5452296651960019,
                -0.5334719382622799,
                -0.5452296651960019,
                -0.5569873921297238,
                -0.49819875746111403,
                -0.6863223884006654
              ],
              "variance": 0.10581954240349767,
              "mean_reward": -0.5609066344409644,
              "min_reward": -0.6863223884006654,
              "max_reward": -0.49819875746111403,
              "num_responses": 6,
              "rvariance": 0.003486824486787708
            },
            {
              "id": "chat_sample_8",
              "rewards": [
                0.8539398399169118,
                0.9950325631215754,
                0.9480016553866876,
                0.43066167030292113,
                0.8539398399169118,
                0.8539398399169118,
                0.9715171092541315
              ],
              "variance": 0.2962947187297935,
              "mean_reward": 0.8438617882594358,
              "min_reward": 0.43066167030292113,
              "max_reward": 0.9950325631215754,
              "num_responses": 7,
              "rvariance": 0.03157609070441001
            },
            {
              "id": "chat_sample_40",
              "rewards": [
                0.136718496959872,
                0.0779298622912622,
                0.136718496959872,
                0.10144531615870613,
                0.38363076256803325,
                0.10144531615870613,
                0.136718496959872
              ],
              "variance": 0.14344426859140805,
              "mean_reward": 0.15351524972233196,
              "min_reward": 0.0779298622912622,
              "max_reward": 0.38363076256803325,
              "num_responses": 7,
              "rvariance": 0.00927646410258221
            },
            {
              "id": "chat_sample_286",
              "rewards": [
                -0.7333532961355533,
                -0.016131953178513507,
                -0.20425558411806494,
                -0.1454669494494551,
                0.054414408423818277,
                -0.06316286091340137,
                -0.004374226244791544
              ],
              "variance": 0.4350358965477127,
              "mean_reward": -0.15890435165942307,
              "min_reward": -0.7333532961355533,
              "max_reward": 0.054414408423818277,
              "num_responses": 7,
              "rvariance": 0.061594818822255114
            },
            {
              "id": "chat_sample_307",
              "rewards": [
                -0.13370922251573314,
                0.2778112201645356,
                0.25429576629709166,
                -0.3335905803890065,
                0.16023395082731595,
                -0.07492058784712333,
                0.25429576629709166
              ],
              "variance": 0.4773637135091117,
              "mean_reward": 0.05777375897631027,
              "min_reward": -0.3335905803890065,
              "max_reward": 0.2778112201645356,
              "num_responses": 7,
              "rvariance": 0.04908513456713055
            },
            {
              "id": "chat_sample_206",
              "rewards": [
                0.806908932182024,
                1.0185480169890193,
                0.8304243860494679,
                0.6423007551099165,
                1.0655789247239071,
                1.0185480169890193,
                1.0890943785913512
              ],
              "variance": 0.33391944491770387,
              "mean_reward": 0.9244862015192437,
              "min_reward": 0.6423007551099165,
              "max_reward": 1.0890943785913512,
              "num_responses": 7,
              "rvariance": 0.023856989188392692
            },
            {
              "id": "chat_sample_261",
              "rewards": [
                -2.644833602350817,
                -2.7593566184025193,
                -2.728492585201499,
                -2.927639085141415,
                -2.8034480944039766,
                -2.7975692309371154,
                -3.096656409813668
              ],
              "variance": 0.30021702294909014,
              "mean_reward": -2.822570803750144,
              "min_reward": -3.096656409813668,
              "max_reward": -2.644833602350817,
              "num_responses": 7,
              "rvariance": 0.018798611008186174
            },
            {
              "id": "chat_sample_79",
              "rewards": [
                0.806908932182024,
                0.5012080319052529,
                0.9715171092541315,
                0.7833934783145801,
                0.806908932182024,
                1.0890943785913512,
                0.8774552937843557
              ],
              "variance": 0.3480287172381701,
              "mean_reward": 0.8337837366019599,
              "min_reward": 0.5012080319052529,
              "max_reward": 1.0890943785913512,
              "num_responses": 7,
              "rvariance": 0.028664499781701724
            },
            {
              "id": "chat_sample_69",
              "rewards": [
                -0.509956484394836,
                -0.36886376119017245,
                -0.22777103798550885,
                -0.6628069345332215,
                -0.2865596726541187,
                -0.29831739958784065
              ],
              "variance": 0.3292163541442149,
              "mean_reward": -0.39237921505761636,
              "min_reward": -0.6628069345332215,
              "max_reward": -0.22777103798550885,
              "num_responses": 6,
              "rvariance": 0.022441632489853935
            },
            {
              "id": "chat_sample_203",
              "rewards": [
                -0.25128649185295276,
                -0.039647407045957435,
                -0.06316286091340137,
                -0.039647407045957435,
                -0.12195149558201118,
                -0.0514051339796794
              ],
              "variance": 0.14697158667152455,
              "mean_reward": -0.09451679940332659,
              "min_reward": -0.25128649185295276,
              "max_reward": -0.039647407045957435,
              "num_responses": 6,
              "rvariance": 0.005698730769155243
            },
            {
              "id": "chat_sample_168",
              "rewards": [
                -0.27480194572039673,
                -0.11019376864828921,
                -0.02788968011223547,
                -0.004374226244791544,
                -0.12195149558201118,
                -0.016131953178513507,
                0.12496077002615005
              ],
              "variance": 0.23045144790095054,
              "mean_reward": -0.06148318563715538,
              "min_reward": -0.27480194572039673,
              "max_reward": 0.12496077002615005,
              "num_responses": 7,
              "rvariance": 0.01324886722193615
            },
            {
              "id": "chat_sample_265",
              "rewards": [
                -0.27480194572039673,
                -0.2865596726541187,
                -0.48644103052739207,
                -0.3100751265215626,
                -0.27480194572039673,
                -0.35710603425645043
              ],
              "variance": 0.14697158667152455,
              "mean_reward": -0.3316309592333862,
              "min_reward": -0.48644103052739207,
              "max_reward": -0.27480194572039673,
              "num_responses": 6,
              "rvariance": 0.005595047662169266
            },
            {
              "id": "chat_sample_301",
              "rewards": [
                -0.7921419308041631,
                -0.8156573846716071,
                -0.6863223884006654,
                -0.6392914806657776,
                -0.5805028459971677,
                -0.7333532961355533,
                -0.5452296651960019
              ],
              "variance": 0.23515453867443925,
              "mean_reward": -0.6846427131244195,
              "min_reward": -0.8156573846716071,
              "max_reward": -0.5452296651960019,
              "num_responses": 7,
              "rvariance": 0.009062044616026175
            },
            {
              "id": "chat_sample_196",
              "rewards": [
                -1.180146919616988,
                -1.162510329216405,
                -1.162510329216405,
                -1.1331160118821,
                -1.0860851041472122,
                -1.0155387425448805,
                -1.2095412369512928
              ],
              "variance": 0.13403808704443043,
              "mean_reward": -1.1356355247964691,
              "min_reward": -1.2095412369512928,
              "max_reward": -1.0155387425448805,
              "num_responses": 7,
              "rvariance": 0.003681808288889835
            },
            {
              "id": "chat_sample_225",
              "rewards": [
                -0.08667831478084528,
                0.3130844009657015,
                0.45417712417036504,
                0.47769257803780896,
                0.6187853012424726,
                0.3365998548331454,
                0.32484212789942346
              ],
              "variance": 0.38095035265259164,
              "mean_reward": 0.3483575817668673,
              "min_reward": -0.08667831478084528,
              "max_reward": 0.6187853012424726,
              "num_responses": 7,
              "rvariance": 0.041749731079687206
            },
            {
              "id": "chat_sample_126",
              "rewards": [
                0.6423007551099165,
                1.3242489172657903,
                1.3712798250006781,
                1.3947952788681222,
                1.465341640470454,
                1.2537025556634587,
                1.1831561940611268
              ],
              "variance": 0.4561998050284123,
              "mean_reward": 1.2335464523485065,
              "min_reward": 0.6423007551099165,
              "max_reward": 1.465341640470454,
              "num_responses": 7,
              "rvariance": 0.06563493335841622
            },
            {
              "id": "chat_sample_162",
              "rewards": [
                0.7128471167122482,
                0.47769257803780896,
                0.6893316628448043,
                0.5247234857726968,
                0.7363625705796921,
                0.7598780244471361,
                0.6893316628448043
              ],
              "variance": 0.2398576294479281,
              "mean_reward": 0.6557381573198844,
              "min_reward": 0.47769257803780896,
              "max_reward": 0.7598780244471361,
              "num_responses": 7,
              "rvariance": 0.01024699441015164
            },
            {
              "id": "chat_sample_49",
              "rewards": [
                0.32484212789942346,
                0.45417712417036504,
                0.47769257803780896,
                0.6187853012424726,
                0.6893316628448043,
                0.7128471167122482,
                0.5717543935075847
              ],
              "variance": 0.29629471872979346,
              "mean_reward": 0.5499186149163868,
              "min_reward": 0.32484212789942346,
              "max_reward": 0.7128471167122482,
              "num_responses": 7,
              "rvariance": 0.016606224971958298
            },
            {
              "id": "chat_sample_177",
              "rewards": [
                -1.2565721446861806,
                -1.0272964694786024,
                -1.2389355542855978,
                -1.2448144177524587,
                -0.8038996577378851
              ],
              "variance": 0.35861067147851977,
              "mean_reward": -1.114303648788145,
              "min_reward": -1.2565721446861806,
              "max_reward": -0.8038996577378851,
              "num_responses": 5,
              "rvariance": 0.03134547690400091
            },
            {
              "id": "chat_sample_273",
              "rewards": [
                -0.6745646614669435,
                -0.8156573846716071,
                -0.46292557665994816,
                -0.6745646614669435,
                -0.7098378422681094,
                -0.49819875746111403,
                -0.6040182998646118
              ],
              "variance": 0.26807617408886086,
              "mean_reward": -0.6342524548370397,
              "min_reward": -0.8156573846716071,
              "max_reward": -0.46292557665994816,
              "num_responses": 7,
              "rvariance": 0.012949808464371151
            },
            {
              "id": "chat_sample_285",
              "rewards": [
                -0.7568687500029972,
                -0.3806214881238944,
                -0.12195149558201118,
                -0.22777103798550885,
                -0.3100751265215626,
                -0.16898240331689904,
                -0.2395287649192308
              ],
              "variance": 0.3809503526525916,
              "mean_reward": -0.3151141523503006,
              "min_reward": -0.7568687500029972,
              "max_reward": -0.12195149558201118,
              "num_responses": 7,
              "rvariance": 0.03878171397630629
            },
            {
              "id": "chat_sample_293",
              "rewards": [
                -0.8038996577378851,
                -0.6628069345332215,
                -0.7568687500029972,
                -0.6275337537320557,
                -0.7921419308041631,
                -0.6157760267983337,
                -0.7921419308041631
              ],
              "variance": 0.1740143586190851,
              "mean_reward": -0.7215955692018314,
              "min_reward": -0.8038996577378851,
              "max_reward": -0.6157760267983337,
              "num_responses": 7,
              "rvariance": 0.005924748970627322
            },
            {
              "id": "chat_sample_233",
              "rewards": [
                -1.180146919616988,
                -1.2624510081530416,
                -0.9097192001413827,
                -0.9920232886774365,
                -1.0155387425448805,
                -0.839172838539051,
                -1.0155387425448805
              ],
              "variance": 0.33156789953095955,
              "mean_reward": -1.0306558200310945,
              "min_reward": -1.2624510081530416,
              "max_reward": -0.839172838539051,
              "num_responses": 7,
              "rvariance": 0.018473931552222714
            },
            {
              "id": "chat_sample_235",
              "rewards": [
                -1.3741494140234003,
                -1.4153014582914272,
                -1.2448144177524587,
                -1.150752602282683,
                -1.3447550966890953,
                -1.427059185225149,
                -0.9685078348099926
              ],
              "variance": 0.34214985377130924,
              "mean_reward": -1.2750485727248866,
              "min_reward": -1.427059185225149,
              "max_reward": -0.9685078348099926,
              "num_responses": 7,
              "rvariance": 0.023969841549737962
            },
            {
              "id": "chat_sample_158",
              "rewards": [
                0.8774552937843557,
                0.9950325631215754,
                1.2066716479285706,
                1.1831561940611268,
                1.0420634708564633,
                1.2066716479285706,
                0.8774552937843557
              ],
              "variance": 0.3292163541442149,
              "mean_reward": 1.0555008730664313,
              "min_reward": 0.8774552937843557,
              "max_reward": 1.2066716479285706,
              "num_responses": 7,
              "rvariance": 0.018462646316088186
            },
            {
              "id": "chat_sample_216",
              "rewards": [
                0.1719916777610379,
                0.45417712417036504,
                0.8304243860494679,
                0.5717543935075847,
                0.9009707476517996,
                0.7128471167122482,
                0.5952698473750286
              ],
              "variance": 0.5173399850837664,
              "mean_reward": 0.6053478990325045,
              "min_reward": 0.1719916777610379,
              "max_reward": 0.9009707476517996,
              "num_responses": 7,
              "rvariance": 0.05164124055160121
            },
            {
              "id": "chat_sample_242",
              "rewards": [
                0.2072648585622038,
                0.38363076256803325,
                0.6658162089773604,
                0.5717543935075847,
                0.28956894709825753,
                -0.06316286091340137,
                0.38363076256803325
              ],
              "variance": 0.5102853489235332,
              "mean_reward": 0.34835758176686743,
              "min_reward": -0.06316286091340137,
              "max_reward": 0.6658162089773604,
              "num_responses": 7,
              "rvariance": 0.049412406415031876
            },
            {
              "id": "chat_sample_92",
              "rewards": [
                2.358928887433323,
                2.076743441023996,
                2.382444341300767,
                2.10025889489144,
                2.2883825258309916,
                2.3118979796984354,
                2.147289802626328
              ],
              "variance": 0.27748235563583856,
              "mean_reward": 2.2379922675436115,
              "min_reward": 2.076743441023996,
              "max_reward": 2.382444341300767,
              "num_responses": 7,
              "rvariance": 0.01381312902866257
            },
            {
              "id": "chat_sample_250",
              "rewards": [
                -0.7098378422681094,
                -1.150752602282683,
                -1.0743273772134903,
                -0.8744460193402168,
                -0.839172838539051,
                -0.8744460193402168
              ],
              "variance": 0.33803464934450633,
              "mean_reward": -0.9204971164972946,
              "min_reward": -1.150752602282683,
              "max_reward": -0.7098378422681094,
              "num_responses": 6,
              "rvariance": 0.021985618824869314
            },
            {
              "id": "chat_sample_283",
              "rewards": [
                -0.6392914806657776,
                -0.5452296651960019,
                -0.6392914806657776,
                -0.5922605729308897,
                -0.7215955692018313,
                -0.5922605729308897,
                -0.6275337537320557
              ],
              "variance": 0.0987649062432645,
              "mean_reward": -0.6224947279033177,
              "min_reward": -0.7215955692018313,
              "max_reward": -0.5452296651960019,
              "num_responses": 7,
              "rvariance": 0.002601246929008757
            },
            {
              "id": "chat_sample_140",
              "rewards": [
                -0.7451110230692752,
                -0.25128649185295276,
                -0.19249785718434295,
                -0.2865596726541187,
                -0.7215955692018313,
                -0.49819875746111403,
                -0.42765239585878223
              ],
              "variance": 0.5032307127633001,
              "mean_reward": -0.4461288238974882,
              "min_reward": -0.7451110230692752,
              "max_reward": -0.19249785718434295,
              "num_responses": 7,
              "rvariance": 0.042297065032211825
            },
            {
              "id": "chat_sample_232",
              "rewards": [
                -1.2506932812193197,
                -0.9802655617437145,
                -0.839172838539051,
                -0.8509305654727729,
                -0.7333532961355533,
                -0.7568687500029972,
                -0.7451110230692752
              ],
              "variance": 0.3480287172381701,
              "mean_reward": -0.8794850451689549,
              "min_reward": -1.2506932812193197,
              "max_reward": -0.7333532961355533,
              "num_responses": 7,
              "rvariance": 0.029262617296831706
            },
            {
              "id": "chat_sample_0",
              "rewards": [
                1.4888570943378978,
                1.6064343636751175,
                1.7945579946146688,
                1.7240116330123372,
                1.5594034559402297,
                1.7004961791448931,
                1.7004961791448931
              ],
              "variance": 0.2210452663539728,
              "mean_reward": 1.6534652714100055,
              "min_reward": 1.4888570943378978,
              "max_reward": 1.7945579946146688,
              "num_responses": 7,
              "rvariance": 0.009637591658887109
            },
            {
              "id": "chat_sample_34",
              "rewards": [
                0.9009707476517996,
                0.806908932182024,
                0.9244862015192435,
                0.7363625705796921,
                0.8304243860494679,
                1.0655789247239071,
                1.0185480169890193
              ],
              "variance": 0.2586699925418833,
              "mean_reward": 0.8976113970993076,
              "min_reward": 0.7363625705796921,
              "max_reward": 1.0655789247239071,
              "num_responses": 7,
              "rvariance": 0.01175921605217842
            },
            {
              "id": "chat_sample_68",
              "rewards": [
                0.5247234857726968,
                0.47769257803780896,
                0.6658162089773604,
                0.6658162089773604,
                0.4071462164354772,
                0.806908932182024,
                0.6423007551099165
              ],
              "variance": 0.27277926486234966,
              "mean_reward": 0.5986291979275206,
              "min_reward": 0.4071462164354772,
              "max_reward": 0.806908932182024,
              "num_responses": 7,
              "rvariance": 0.0158670420051467
            },
            {
              "id": "chat_sample_149",
              "rewards": [
                -0.5334719382622799,
                -0.3453483073227285,
                -0.25128649185295276,
                -0.5687451190634458,
                -0.6040182998646118,
                -0.2865596726541187,
                -0.36886376119017245
              ],
              "variance": 0.31040399105025984,
              "mean_reward": -0.42261337003004423,
              "min_reward": -0.6040182998646118,
              "max_reward": -0.25128649185295276,
              "num_responses": 7,
              "rvariance": 0.017610610987931315
            },
            {
              "id": "chat_sample_309",
              "rewards": [
                -0.8156573846716071,
                -1.0037810156111584,
                -0.49819875746111403,
                -0.48644103052739207,
                -0.4394101227925042,
                -0.509956484394836,
                -0.4746833035936701
              ],
              "variance": 0.43033280577422384,
              "mean_reward": -0.6040182998646119,
              "min_reward": -1.0037810156111584,
              "max_reward": -0.4394101227925042,
              "num_responses": 7,
              "rvariance": 0.040327791326736646
            },
            {
              "id": "chat_sample_243",
              "rewards": [
                -0.7921419308041631,
                -0.8979614732076608,
                -0.8744460193402168,
                -0.7215955692018313,
                -0.6628069345332215,
                -1.2742087350867637,
                -0.3453483073227285
              ],
              "variance": 0.5126368943102779,
              "mean_reward": -0.7955012813566551,
              "min_reward": -1.2742087350867637,
              "max_reward": -0.3453483073227285,
              "num_responses": 7,
              "rvariance": 0.06737285972313357
            },
            {
              "id": "chat_sample_281",
              "rewards": [
                -1.4388169121588712,
                -1.485847819893759,
                -1.485847819893759,
                -1.3388762332222344,
                -1.462332366026315,
                -1.3565128236228174,
                -1.4329380486920102
              ],
              "variance": 0.13638963243117486,
              "mean_reward": -1.428738860501395,
              "min_reward": -1.485847819893759,
              "max_reward": -1.3388762332222344,
              "num_responses": 7,
              "rvariance": 0.003008926084368593
            },
            {
              "id": "chat_sample_99",
              "rewards": [
                2.123774348758884,
                2.123774348758884,
                2.452990702903099,
                2.382444341300767,
                2.2178361642286597,
                2.2883825258309916,
                2.452990702903099
              ],
              "variance": 0.329216354144215,
              "mean_reward": 2.291741876383483,
              "min_reward": 2.123774348758884,
              "max_reward": 2.452990702903099,
              "num_responses": 7,
              "rvariance": 0.017446975063980654
            },
            {
              "id": "chat_sample_43",
              "rewards": [
                -0.004374226244791544,
                0.1719916777610379,
                0.28956894709825753,
                0.148476223893594,
                0.2425380393633697,
                0.28956894709825753,
                0.2425380393633697
              ],
              "variance": 0.20223290326001775,
              "mean_reward": 0.19718680690472784,
              "min_reward": -0.004374226244791544,
              "max_reward": 0.28956894709825753,
              "num_responses": 7,
              "rvariance": 0.009259536248380416
            },
            {
              "id": "chat_sample_148",
              "rewards": [
                -0.3806214881238944,
                -0.22777103798550885,
                -0.20425558411806494,
                -0.36886376119017245
              ],
              "variance": 0.16578394976547972,
              "mean_reward": -0.2953779678544101,
              "min_reward": -0.3806214881238944,
              "max_reward": -0.20425558411806494,
              "num_responses": 4,
              "rvariance": 0.006385151338553157
            },
            {
              "id": "chat_sample_249",
              "rewards": [
                -0.32183285345528456,
                -0.27480194572039673,
                0.04265668149009631,
                -0.19249785718434295,
                -0.02788968011223547,
                -0.06316286091340137,
                0.19550713162848185
              ],
              "variance": 0.39741117035980245,
              "mean_reward": -0.09171734060958328,
              "min_reward": -0.32183285345528456,
              "max_reward": 0.19550713162848185,
              "num_responses": 7,
              "rvariance": 0.028867634032123227
            },
            {
              "id": "chat_sample_100",
              "rewards": [
                0.5012080319052529,
                1.2301871017960146,
                1.0890943785913512,
                0.9950325631215754,
                1.2537025556634587,
                1.1831561940611268
              ],
              "variance": 0.4938245312163224,
              "mean_reward": 1.0420634708564631,
              "min_reward": 0.5012080319052529,
              "max_reward": 1.2537025556634587,
              "num_responses": 6,
              "rvariance": 0.0661728629474954
            },
            {
              "id": "chat_sample_141",
              "rewards": [
                -1.7386389489687812,
                -1.4446957756257321,
                -1.2389355542855978,
                -1.427059185225149,
                -1.4329380486920102,
                -1.3859071409571222,
                -1.7210023585681982
              ],
              "variance": 0.40093848843991897,
              "mean_reward": -1.484168144617513,
              "min_reward": -1.7386389489687812,
              "max_reward": -1.2389355542855978,
              "num_responses": 7,
              "rvariance": 0.028297729607329552
            },
            {
              "id": "chat_sample_97",
              "rewards": [
                0.7833934783145801,
                0.7128471167122482,
                1.0655789247239071,
                0.8774552937843557,
                0.9715171092541315,
                0.9480016553866876,
                0.9950325631215754
              ],
              "variance": 0.26807617408886086,
              "mean_reward": 0.9076894487567836,
              "min_reward": 0.7128471167122482,
              "max_reward": 1.0655789247239071,
              "num_responses": 7,
              "rvariance": 0.013226296749667093
            },
            {
              "id": "chat_sample_137",
              "rewards": [
                -0.9214769270751048,
                -0.6628069345332215,
                -0.6628069345332215,
                -0.5452296651960019,
                -0.6980801153343874,
                -0.4394101227925042,
                -0.6157760267983337
              ],
              "variance": 0.2845369917960715,
              "mean_reward": -0.6493695323232535,
              "min_reward": -0.9214769270751048,
              "max_reward": -0.4394101227925042,
              "num_responses": 7,
              "rvariance": 0.01897612456020923
            },
            {
              "id": "chat_sample_207",
              "rewards": [
                0.2425380393633697,
                0.5247234857726968,
                0.2425380393633697,
                0.2778112201645356,
                0.2778112201645356,
                0.32484212789942346,
                0.2425380393633697
              ],
              "variance": 0.16225663168536314,
              "mean_reward": 0.30468602458447147,
              "min_reward": 0.2425380393633697,
              "max_reward": 0.5247234857726968,
              "num_responses": 7,
              "rvariance": 0.008836339893335607
            },
            {
              "id": "chat_sample_190",
              "rewards": [
                -0.2865596726541187,
                -0.016131953178513507,
                -0.016131953178513507,
                0.25429576629709166,
                0.36011530870058933,
                0.21902258549592576,
                0.2660534932308136
              ],
              "variance": 0.42798126038747947,
              "mean_reward": 0.11152336781618209,
              "min_reward": -0.2865596726541187,
              "max_reward": 0.36011530870058933,
              "num_responses": 7,
              "rvariance": 0.04409706019566908
            },
            {
              "id": "chat_sample_254",
              "rewards": [
                -0.2395287649192308,
                -0.13370922251573314,
                -0.3335905803890065,
                -0.1454669494494551,
                -0.27480194572039673,
                -0.0514051339796794,
                -0.20425558411806494
              ],
              "variance": 0.19752981248652904,
              "mean_reward": -0.19753688301308098,
              "min_reward": -0.3335905803890065,
              "max_reward": -0.0514051339796794,
              "num_responses": 7,
              "rvariance": 0.007775527696689956
            },
            {
              "id": "chat_sample_171",
              "rewards": [
                -0.6863223884006654,
                -0.6628069345332215,
                -0.7451110230692752,
                -0.7215955692018313,
                -0.4394101227925042,
                -0.45116784972622614,
                -0.5334719382622799
              ],
              "variance": 0.28453699179607156,
              "mean_reward": -0.6056979751408578,
              "min_reward": -0.7451110230692752,
              "max_reward": -0.4394101227925042,
              "num_responses": 7,
              "rvariance": 0.014196827057236521
            },
            {
              "id": "chat_sample_131",
              "rewards": [
                0.7128471167122482,
                0.9009707476517996,
                0.7833934783145801,
                0.5717543935075847,
                0.7128471167122482,
                0.7363625705796921,
                0.806908932182024
              ],
              "variance": 0.18812363093955153,
              "mean_reward": 0.7464406222371682,
              "min_reward": 0.5717543935075847,
              "max_reward": 0.9009707476517996,
              "num_responses": 7,
              "rvariance": 0.008825054657201079
            },
            {
              "id": "chat_sample_272",
              "rewards": [
                -0.8744460193402168,
                -0.8156573846716071,
                -0.8038996577378851,
                -0.7098378422681094,
                -1.0743273772134903,
                -0.7098378422681094,
                -0.6863223884006654
              ],
              "variance": 0.2539669017683943,
              "mean_reward": -0.810618358842869,
              "min_reward": -1.0743273772134903,
              "max_reward": -0.6863223884006654,
              "num_responses": 7,
              "rvariance": 0.015635694664388872
            },
            {
              "id": "chat_sample_317",
              "rewards": [
                -1.121358284948378,
                -0.5569873921297238,
                -0.6040182998646118,
                -0.6157760267983337,
                -0.5452296651960019,
                -0.5687451190634458,
                -0.7215955692018313
              ],
              "variance": 0.3292163541442149,
              "mean_reward": -0.6762443367431894,
              "min_reward": -1.121358284948378,
              "max_reward": -0.5452296651960019,
              "num_responses": 7,
              "rvariance": 0.035999903269145074
            },
            {
              "id": "chat_sample_221",
              "rewards": [
                -1.6680925873664494,
                -1.5975462257641175,
                -1.3682705505565393,
                -1.7092446316344763,
                -1.526999864161786,
                -1.2683298716199027,
                -1.526999864161786
              ],
              "variance": 0.35625912609177557,
              "mean_reward": -1.5236405136092939,
              "min_reward": -1.7092446316344763,
              "max_reward": -1.2683298716199027,
              "num_responses": 7,
              "rvariance": 0.02144618061915408
            },
            {
              "id": "chat_sample_263",
              "rewards": [
                -0.4394101227925042,
                -0.16898240331689904,
                0.0779298622912622,
                0.32484212789942346,
                0.3130844009657015,
                0.0779298622912622,
                0.00738350068893042
              ],
              "variance": 0.5949409828463315,
              "mean_reward": 0.02753960400388237,
              "min_reward": -0.4394101227925042,
              "max_reward": 0.32484212789942346,
              "num_responses": 7,
              "rvariance": 0.06172459903780218
            },
            {
              "id": "chat_sample_112",
              "rewards": [
                0.8539398399169118,
                0.8774552937843557,
                1.0655789247239071,
                0.9950325631215754,
                0.7833934783145801,
                0.9480016553866876,
                0.9009707476517996
              ],
              "variance": 0.197529812486529,
              "mean_reward": 0.9177675004142597,
              "min_reward": 0.7833934783145801,
              "max_reward": 1.0655789247239071,
              "num_responses": 7,
              "rvariance": 0.00753853773786486
            },
            {
              "id": "chat_sample_138",
              "rewards": [
                -0.9332346540088267,
                -0.27480194572039673,
                -0.2395287649192308,
                -0.3453483073227285,
                -0.27480194572039673,
                -0.22777103798550885,
                -0.3100751265215626
              ],
              "variance": 0.3456771718514257,
              "mean_reward": -0.37222311174266437,
              "min_reward": -0.9332346540088267,
              "max_reward": -0.22777103798550885,
              "num_responses": 7,
              "rvariance": 0.05382493374363244
            },
            {
              "id": "chat_sample_1",
              "rewards": [
                -1.2624510081530416,
                -1.180146919616988,
                -1.2506932812193197,
                -1.162510329216405,
                -1.156631465749544,
                -1.2389355542855978
              ],
              "variance": 0.09700124720320602,
              "mean_reward": -1.2085614263734827,
              "min_reward": -1.2624510081530416,
              "max_reward": -1.156631465749544,
              "num_responses": 6,
              "rvariance": 0.001871096069589547
            },
            {
              "id": "chat_sample_42",
              "rewards": [
                -1.3623916870896784,
                -1.150752602282683,
                -1.2330566908187368,
                -1.0978428310809343,
                -1.2742087350867637,
                -1.0508119233460462,
                -1.1742680561501269
              ],
              "variance": 0.2304514479009505,
              "mean_reward": -1.1919046465507097,
              "min_reward": -1.3623916870896784,
              "max_reward": -1.0508119233460462,
              "num_responses": 7,
              "rvariance": 0.009756086638299664
            },
            {
              "id": "chat_sample_101",
              "rewards": [
                -1.5799096353635347,
                -1.1331160118821,
                -0.9802655617437145,
                -0.8862037462739388,
                -0.9802655617437145,
                -0.8862037462739388,
                -0.7215955692018313
              ],
              "variance": 0.4914729858295781,
              "mean_reward": -1.0239371189261104,
              "min_reward": -1.5799096353635347,
              "max_reward": -0.7215955692018313,
              "num_responses": 7,
              "rvariance": 0.0648844651554701
            },
            {
              "id": "chat_sample_21",
              "rewards": [
                -1.2154201004181537,
                -0.8509305654727729,
                -0.9214769270751048,
                -0.7803842038704412,
                -0.8156573846716071,
                -0.8862037462739388,
                -0.8744460193402168
              ],
              "variance": 0.23750608406118368,
              "mean_reward": -0.9063598495888908,
              "min_reward": -1.2154201004181537,
              "max_reward": -0.7803842038704412,
              "num_responses": 7,
              "rvariance": 0.017762961675747438
            },
            {
              "id": "chat_sample_66",
              "rewards": [
                -1.0625696502797684,
                -1.144873738815822,
                -1.121358284948378,
                -1.0155387425448805,
                -1.0390541964123243,
                -1.0625696502797684,
                -0.8509305654727729
              ],
              "variance": 0.18106899477931837,
              "mean_reward": -1.0424135469648166,
              "min_reward": -1.144873738815822,
              "max_reward": -0.8509305654727729,
              "num_responses": 7,
              "rvariance": 0.007848881731564393
            },
            {
              "id": "chat_sample_151",
              "rewards": [
                -0.6510492075994996,
                -0.7098378422681094,
                -0.8509305654727729,
                -0.8979614732076608,
                -0.7803842038704412,
                -0.827415111605329,
                -0.827415111605329
              ],
              "variance": 0.18342054016606257,
              "mean_reward": -0.7921419308041632,
              "min_reward": -0.8979614732076608,
              "max_reward": -0.6510492075994996,
              "num_responses": 7,
              "rvariance": 0.006280233908864961
            },
            {
              "id": "chat_sample_33",
              "rewards": [
                0.5012080319052529,
                0.806908932182024,
                0.6423007551099165,
                0.7363625705796921,
                0.6893316628448043,
                0.7598780244471361,
                0.8539398399169118
              ],
              "variance": 0.2398576294479281,
              "mean_reward": 0.7128471167122482,
              "min_reward": 0.5012080319052529,
              "max_reward": 0.8539398399169118,
              "num_responses": 7,
              "rvariance": 0.011691504635371256
            },
            {
              "id": "chat_sample_219",
              "rewards": [
                -0.9685078348099926,
                -0.8509305654727729,
                -0.8979614732076608,
                -0.9214769270751048
              ],
              "variance": 0.08935872469628703,
              "mean_reward": -0.9097192001413827,
              "min_reward": -0.9685078348099926,
              "max_reward": -0.8509305654727729,
              "num_responses": 4,
              "rvariance": 0.001797173854423623
            },
            {
              "id": "chat_sample_5",
              "rewards": [
                1.1596407401936828,
                0.8774552937843557,
                1.0655789247239071,
                1.2066716479285706,
                1.0420634708564633,
                1.0420634708564633,
                1.3007334633983465
              ],
              "variance": 0.26807617408886064,
              "mean_reward": 1.0991724302488273,
              "min_reward": 0.8774552937843557,
              "max_reward": 1.3007334633983465,
              "num_responses": 7,
              "rvariance": 0.01609274672783726
            },
            {
              "id": "chat_sample_86",
              "rewards": [
                1.3712798250006781,
                1.4888570943378978,
                1.5123725482053418,
                1.6064343636751175,
                1.6064343636751175,
                1.6064343636751175,
                1.6534652714100053
              ],
              "variance": 0.18342054016606268,
              "mean_reward": 1.5493254042827533,
              "min_reward": 1.3712798250006781,
              "max_reward": 1.6534652714100053,
              "num_responses": 7,
              "rvariance": 0.008193081433667503
            },
            {
              "id": "chat_sample_108",
              "rewards": [
                0.16023395082731595,
                0.5482389396401407,
                0.6658162089773604,
                0.5952698473750286,
                0.6423007551099165,
                0.5482389396401407,
                0.6423007551099165
              ],
              "variance": 0.2586699925418832,
              "mean_reward": 0.5431999138114028,
              "min_reward": 0.16023395082731595,
              "max_reward": 0.6658162089773604,
              "num_responses": 7,
              "rvariance": 0.026300242811518052
            },
            {
              "id": "chat_sample_28",
              "rewards": [
                -0.9567501078762706,
                -0.7333532961355533,
                -0.9097192001413827,
                -0.827415111605329,
                -0.8979614732076608,
                -0.839172838539051,
                -0.7686264769367191
              ],
              "variance": 0.1740143586190851,
              "mean_reward": -0.847571214920281,
              "min_reward": -0.9567501078762706,
              "max_reward": -0.7333532961355533,
              "num_responses": 7,
              "rvariance": 0.005439483816842609
            },
            {
              "id": "chat_sample_255",
              "rewards": [
                0.136718496959872,
                0.4071462164354772,
                0.5482389396401407,
                0.45417712417036504,
                0.7363625705796921,
                0.47769257803780896,
                0.5717543935075847
              ],
              "variance": 0.33862253569119255,
              "mean_reward": 0.476012902761563,
              "min_reward": 0.136718496959872,
              "max_reward": 0.7363625705796921,
              "num_responses": 7,
              "rvariance": 0.02892970283086313
            },
            {
              "id": "chat_sample_29",
              "rewards": [
                1.8651043562170007,
                2.0297125332891084,
                2.053227987156552,
                2.1708052564937717,
                2.10025889489144,
                1.9356507178193325,
                2.076743441023996
              ],
              "variance": 0.2210452663539726,
              "mean_reward": 2.0330718838416,
              "min_reward": 1.8651043562170007,
              "max_reward": 2.1708052564937717,
              "num_responses": 7,
              "rvariance": 0.009073329852160694
            },
            {
              "id": "chat_sample_60",
              "rewards": [
                1.771042540747225,
                1.7004961791448931,
                1.6064343636751175,
                1.7945579946146688,
                1.9121352639518885,
                1.8180734484821128,
                1.8415889023495569
              ],
              "variance": 0.2069359940335067,
              "mean_reward": 1.777761241852209,
              "min_reward": 1.6064343636751175,
              "max_reward": 1.9121352639518885,
              "num_responses": 7,
              "rvariance": 0.008486497573165231
            },
            {
              "id": "chat_sample_125",
              "rewards": [
                -1.1977835100175709,
                -1.1331160118821,
                -1.2095412369512928,
                -1.5446364545623688,
                -0.9802655617437145,
                -1.1331160118821,
                -1.0390541964123243
              ],
              "variance": 0.3280405814508429,
              "mean_reward": -1.176787569064496,
              "min_reward": -1.5446364545623688,
              "max_reward": -0.9802655617437145,
              "num_responses": 7,
              "rvariance": 0.028318889425081793
            },
            {
              "id": "chat_sample_314",
              "rewards": [
                -0.08667831478084528,
                0.47769257803780896,
                0.12496077002615005,
                0.3013266740319795,
                0.36011530870058933,
                0.1719916777610379,
                0.18374940469475987
              ],
              "variance": 0.36684108033212526,
              "mean_reward": 0.21902258549592576,
              "min_reward": -0.08667831478084528,
              "max_reward": 0.47769257803780896,
              "num_responses": 7,
              "rvariance": 0.028478293385482002
            },
            {
              "id": "chat_sample_310",
              "rewards": [
                1.5123725482053418,
                1.6534652714100053,
                1.8415889023495569,
                1.747527086879781,
                1.8415889023495569,
                1.8651043562170007,
                1.8886198100844447
              ],
              "variance": 0.27748235563583834,
              "mean_reward": 1.764323839642241,
              "min_reward": 1.5123725482053418,
              "max_reward": 1.8886198100844447,
              "num_responses": 7,
              "rvariance": 0.016228169561451605
            },
            {
              "id": "chat_sample_222",
              "rewards": [
                0.36011530870058933,
                1.0420634708564633,
                1.0420634708564633,
                0.9480016553866876,
                0.7833934783145801,
                1.0655789247239071,
                0.7363625705796921
              ],
              "variance": 0.46560598657538976,
              "mean_reward": 0.8539398399169118,
              "min_reward": 0.36011530870058933,
              "max_reward": 1.0655789247239071,
              "num_responses": 7,
              "rvariance": 0.05529765705918837
            },
            {
              "id": "chat_sample_143",
              "rewards": [
                -0.5805028459971677,
                0.16023395082731595,
                0.00738350068893042,
                -0.09843604171456725,
                -0.06316286091340137,
                0.019141227622652385,
                0.054414408423818277
              ],
              "variance": 0.38800498881282475,
              "mean_reward": -0.07156123729463135,
              "min_reward": -0.5805028459971677,
              "max_reward": 0.16023395082731595,
              "num_responses": 7,
              "rvariance": 0.0491246328936014
            },
            {
              "id": "chat_sample_12",
              "rewards": [
                0.7833934783145801,
                0.7128471167122482,
                1.136125286326239,
                1.1596407401936828,
                1.1596407401936828,
                1.0890943785913512,
                1.136125286326239
              ],
              "variance": 0.4044658065200355,
              "mean_reward": 1.0252667180940034,
              "min_reward": 0.7128471167122482,
              "max_reward": 1.1596407401936828,
              "num_responses": 7,
              "rvariance": 0.031553520232140954
            },
            {
              "id": "chat_sample_248",
              "rewards": [
                -2.288312683120283,
                -2.050218712712413,
                -2.120765074314745,
                -2.0854918935135793,
                -1.964975192442929
              ],
              "variance": 0.22222103904734491,
              "mean_reward": -2.1019527112207896,
              "min_reward": -2.288312683120283,
              "max_reward": -1.964975192442929,
              "num_responses": 5,
              "rvariance": 0.01135882998067052
            },
            {
              "id": "chat_sample_64",
              "rewards": [
                1.0890943785913512,
                0.9244862015192435,
                0.9715171092541315,
                1.0185480169890193,
                0.9950325631215754,
                0.9950325631215754,
                0.9715171092541315
              ],
              "variance": 0.09406181546977588,
              "mean_reward": 0.9950325631215754,
              "min_reward": 0.9244862015192435,
              "max_reward": 1.0890943785913512,
              "num_responses": 7,
              "rvariance": 0.002211906282367537
            },
            {
              "id": "chat_sample_4",
              "rewards": [
                0.19550713162848185,
                0.2778112201645356,
                0.43066167030292113,
                0.5482389396401407,
                0.47769257803780896,
                0.43066167030292113,
                0.45417712417036504
              ],
              "variance": 0.2610215379286276,
              "mean_reward": 0.4021071906067392,
              "min_reward": 0.19550713162848185,
              "max_reward": 0.5482389396401407,
              "num_responses": 7,
              "rvariance": 0.012791815158487752
            },
            {
              "id": "chat_sample_311",
              "rewards": [
                -0.7098378422681094,
                -0.35710603425645043,
                -0.3453483073227285,
                -0.36886376119017245,
                -0.27480194572039673,
                -0.16898240331689904,
                -0.16898240331689904
              ],
              "variance": 0.3362709903044482,
              "mean_reward": -0.34198895677023655,
              "min_reward": -0.7098378422681094,
              "max_reward": -0.16898240331689904,
              "num_responses": 7,
              "rvariance": 0.028664499781701724
            },
            {
              "id": "chat_sample_117",
              "rewards": [
                -1.515242137228064,
                -0.9449923809425487,
                -1.144873738815822,
                -1.0272964694786024,
                -0.839172838539051,
                -1.180146919616988,
                -1.19190464655071
              ],
              "variance": 0.41857507884050194,
              "mean_reward": -1.1205184473102554,
              "min_reward": -1.515242137228064,
              "max_reward": -0.839172838539051,
              "num_responses": 7,
              "rvariance": 0.04052951492264134
            },
            {
              "id": "chat_sample_39",
              "rewards": [
                0.03089895455637435,
                0.054414408423818277,
                0.03089895455637435,
                0.28956894709825753,
                0.2425380393633697,
                0.136718496959872,
                -0.20425558411806494
              ],
              "variance": 0.3245132633707262,
              "mean_reward": 0.08296888812000021,
              "min_reward": -0.20425558411806494,
              "max_reward": 0.28956894709825753,
              "num_responses": 7,
              "rvariance": 0.022824390082083357
            },
            {
              "id": "chat_sample_287",
              "rewards": [
                0.806908932182024,
                0.8304243860494679,
                1.0890943785913512,
                0.8304243860494679,
                0.9244862015192435,
                0.9950325631215754
              ],
              "variance": 0.22339681174071746,
              "mean_reward": 0.9127284745855216,
              "min_reward": 0.806908932182024,
              "max_reward": 1.0890943785913512,
              "num_responses": 6,
              "rvariance": 0.010460473460363134
            },
            {
              "id": "chat_sample_313",
              "rewards": [
                -0.6628069345332215,
                -0.5334719382622799,
                -0.3335905803890065,
                -0.3100751265215626,
                -0.25128649185295276,
                -0.22777103798550885,
                -0.2395287649192308
              ],
              "variance": 0.35038026262491456,
              "mean_reward": -0.3655044106376804,
              "min_reward": -0.6628069345332215,
              "max_reward": -0.22777103798550885,
              "num_responses": 7,
              "rvariance": 0.024082693911083253
            },
            {
              "id": "chat_sample_3",
              "rewards": [
                1.3242489172657903,
                1.4183107327355662,
                1.465341640470454,
                1.4183107327355662,
                1.44182618660301,
                1.5594034559402297,
                1.5829189098076735
              ],
              "variance": 0.1881236309395513,
              "mean_reward": 1.4586229393654702,
              "min_reward": 1.3242489172657903,
              "max_reward": 1.5829189098076735,
              "num_responses": 7,
              "rvariance": 0.006748571208447883
            },
            {
              "id": "chat_sample_170",
              "rewards": [
                -1.5740307718966737,
                -1.7327600855019203,
                -1.4329380486920102,
                -1.4094225948245662,
                -1.6034250892309787,
                -1.468211229493176
              ],
              "variance": 0.24691226560816126,
              "mean_reward": -1.5367979699398875,
              "min_reward": -1.7327600855019203,
              "max_reward": -1.4094225948245662,
              "num_responses": 6,
              "rvariance": 0.01265701928243645
            },
            {
              "id": "chat_sample_83",
              "rewards": [
                0.16023395082731595,
                0.0779298622912622,
                0.28956894709825753,
                0.10144531615870613,
                0.148476223893594,
                -0.004374226244791544,
                0.25429576629709166
              ],
              "variance": 0.22339681174071735,
              "mean_reward": 0.14679654861734798,
              "min_reward": -0.004374226244791544,
              "max_reward": 0.28956894709825753,
              "num_responses": 7,
              "rvariance": 0.00882505465720108
            },
            {
              "id": "chat_sample_279",
              "rewards": [
                0.9950325631215754,
                0.4071462164354772,
                1.3477643711332343,
                1.0185480169890193,
                1.1596407401936828,
                1.2066716479285706,
                1.2301871017960146
              ],
              "variance": 0.5173399850837663,
              "mean_reward": 1.052141522513939,
              "min_reward": 0.4071462164354772,
              "max_reward": 1.3477643711332343,
              "num_responses": 7,
              "rvariance": 0.08213394858709651
            },
            {
              "id": "chat_sample_55",
              "rewards": [
                -1.3682705505565393,
                -1.3506339601559565,
                -1.2742087350867637,
                -1.3623916870896784,
                -1.4153014582914272,
                -1.3506339601559565
              ],
              "variance": 0.07936465680262295,
              "mean_reward": -1.3535733918893869,
              "min_reward": -1.4153014582914272,
              "max_reward": -1.2742087350867637,
              "num_responses": 6,
              "rvariance": 0.0017366920420151322
            },
            {
              "id": "chat_sample_103",
              "rewards": [
                -0.16898240331689904,
                0.1132030430924281,
                0.3365998548331454,
                0.0779298622912622,
                0.148476223893594,
                0.23078031242964772,
                0.21902258549592576
              ],
              "variance": 0.2939431733430491,
              "mean_reward": 0.136718496959872,
              "min_reward": -0.16898240331689904,
              "max_reward": 0.3365998548331454,
              "num_responses": 7,
              "rvariance": 0.02188207286485025
            },
            {
              "id": "chat_sample_113",
              "rewards": [
                0.23078031242964772,
                0.6658162089773604,
                0.5717543935075847,
                0.5952698473750286,
                0.5952698473750286,
                0.7363625705796921,
                0.47769257803780896
              ],
              "variance": 0.3151070818237487,
              "mean_reward": 0.5532779654688788,
              "min_reward": 0.23078031242964772,
              "max_reward": 0.7363625705796921,
              "num_responses": 7,
              "rvariance": 0.02282439008208336
            },
            {
              "id": "chat_sample_104",
              "rewards": [
                -0.6863223884006654,
                -0.3453483073227285,
                -0.180740130250621,
                -0.1454669494494551,
                -0.1454669494494551,
                -0.180740130250621,
                -0.180740130250621
              ],
              "variance": 0.3362709903044481,
              "mean_reward": -0.26640356933916676,
              "min_reward": -0.6863223884006654,
              "max_reward": -0.1454669494494551,
              "num_responses": 7,
              "rvariance": 0.03340429895820358
            },
            {
              "id": "chat_sample_282",
              "rewards": [
                0.7128471167122482,
                1.0655789247239071,
                0.9480016553866876,
                1.0655789247239071,
                1.0420634708564633,
                0.9950325631215754,
                1.0420634708564633
              ],
              "variance": 0.21163908480699534,
              "mean_reward": 0.9815951609116075,
              "min_reward": 0.7128471167122482,
              "max_reward": 1.0655789247239071,
              "num_responses": 7,
              "rvariance": 0.013564853833702943
            },
            {
              "id": "chat_sample_62",
              "rewards": [
                1.44182618660301,
                1.5123725482053418,
                1.4183107327355662,
                1.465341640470454,
                1.5594034559402297,
                1.3947952788681222,
                1.4183107327355662
              ],
              "variance": 0.12228036011070853,
              "mean_reward": 1.4586229393654702,
              "min_reward": 1.3947952788681222,
              "max_reward": 1.5594034559402297,
              "num_responses": 7,
              "rvariance": 0.002956731867246397
            },
            {
              "id": "chat_sample_91",
              "rewards": [
                0.43066167030292113,
                0.2660534932308136,
                0.6187853012424726,
                0.6187853012424726,
                0.4071462164354772,
                0.6187853012424726,
                0.43066167030292113
              ],
              "variance": 0.26807617408886075,
              "mean_reward": 0.484411279142793,
              "min_reward": 0.2660534932308136,
              "max_reward": 0.6187853012424726,
              "num_responses": 7,
              "rvariance": 0.016228169561451605
            },
            {
              "id": "chat_sample_284",
              "rewards": [
                -1.0743273772134903,
                -0.7803842038704412,
                -0.6040182998646118,
                -0.5687451190634458,
                -0.8744460193402168,
                -0.7451110230692752,
                -0.49819875746111403
              ],
              "variance": 0.4138719880670131,
              "mean_reward": -0.7350329714117994,
              "min_reward": -1.0743273772134903,
              "max_reward": -0.49819875746111403,
              "num_responses": 7,
              "rvariance": 0.03394599029266093
            },
            {
              "id": "chat_sample_84",
              "rewards": [
                -0.180740130250621,
                -0.016131953178513507,
                -0.180740130250621,
                -0.06316286091340137,
                -0.08667831478084528,
                -0.180740130250621,
                -0.15722467638317708
              ],
              "variance": 0.1363896324311748,
              "mean_reward": -0.12363117085825717,
              "min_reward": -0.180740130250621,
              "max_reward": -0.016131953178513507,
              "num_responses": 7,
              "rvariance": 0.003927262174815827
            },
            {
              "id": "chat_sample_175",
              "rewards": [
                0.4071462164354772,
                0.6658162089773604,
                0.9244862015192435,
                0.9009707476517996,
                0.8304243860494679,
                0.9480016553866876,
                0.8774552937843557
              ],
              "variance": 0.371544171105614,
              "mean_reward": 0.793471529972056,
              "min_reward": 0.4071462164354772,
              "max_reward": 0.9480016553866876,
              "num_responses": 7,
              "rvariance": 0.032366057233826975
            },
            {
              "id": "chat_sample_185",
              "rewards": [
                1.3242489172657903,
                1.1831561940611268,
                1.6299498175425615,
                1.8415889023495569,
                1.771042540747225,
                1.8651043562170007,
                1.8651043562170007
              ],
              "variance": 0.5972925282330757,
              "mean_reward": 1.6400278692000376,
              "min_reward": 1.1831561940611268,
              "max_reward": 1.8651043562170007,
              "num_responses": 7,
              "rvariance": 0.06680859791640716
            },
            {
              "id": "chat_sample_154",
              "rewards": [
                -0.9214769270751048,
                -0.49819875746111403,
                -0.3453483073227285,
                -0.4746833035936701,
                -0.42765239585878223,
                -0.3806214881238944,
                -0.42765239585878223
              ],
              "variance": 0.3009978095032823,
              "mean_reward": -0.496519082184868,
              "min_reward": -0.9214769270751048,
              "max_reward": -0.3453483073227285,
              "num_responses": 7,
              "rvariance": 0.03240555556029784
            },
            {
              "id": "chat_sample_189",
              "rewards": [
                -1.5622730449629518,
                -0.8862037462739388,
                -0.7921419308041631,
                -0.8038996577378851,
                -0.839172838539051,
                -0.6863223884006654,
                -0.6628069345332215
              ],
              "variance": 0.4797152588958562,
              "mean_reward": -0.8904029344645538,
              "min_reward": -1.5622730449629518,
              "max_reward": -0.6628069345332215,
              "num_responses": 7,
              "rvariance": 0.08066263592605741
            },
            {
              "id": "chat_sample_218",
              "rewards": [
                -0.46292557665994816,
                -0.7451110230692752,
                -0.4158946689250603,
                -0.39237921505761636,
                -0.521714211328558,
                -0.4394101227925042
              ],
              "variance": 0.2292756752075783,
              "mean_reward": -0.4962391363054937,
              "min_reward": -0.7451110230692752,
              "max_reward": -0.39237921505761636,
              "num_responses": 6,
              "rvariance": 0.014027940363695486
            },
            {
              "id": "chat_sample_257",
              "rewards": [
                0.5247234857726968,
                0.8539398399169118,
                0.8304243860494679,
                0.8774552937843557,
                0.9480016553866876,
                1.0185480169890193,
                0.8774552937843557
              ],
              "variance": 0.26807617408886086,
              "mean_reward": 0.8472211388119277,
              "min_reward": 0.5247234857726968,
              "max_reward": 1.0185480169890193,
              "num_responses": 7,
              "rvariance": 0.020809975432070076
            },
            {
              "id": "chat_sample_13",
              "rewards": [
                0.136718496959872,
                0.2660534932308136,
                0.23078031242964772,
                0.25429576629709166,
                0.2425380393633697
              ],
              "variance": 0.08700717930954252,
              "mean_reward": 0.22607722165615893,
              "min_reward": 0.136718496959872,
              "max_reward": 0.2660534932308136,
              "num_responses": 5,
              "rvariance": 0.002134489562484671
            },
            {
              "id": "chat_sample_237",
              "rewards": [
                -1.4740900929600371,
                -1.150752602282683,
                -1.2389355542855978,
                -1.1331160118821,
                -1.2800875985536246,
                -1.0743273772134903,
                -1.0625696502797684
              ],
              "variance": 0.28806430987618814,
              "mean_reward": -1.2019826982081858,
              "min_reward": -1.4740900929600371,
              "max_reward": -1.0625696502797684,
              "num_responses": 7,
              "rvariance": 0.017801049347701485
            },
            {
              "id": "chat_sample_89",
              "rewards": [
                1.7004961791448931,
                1.8886198100844447,
                1.5358880020727856,
                1.7240116330123372,
                1.771042540747225,
                2.006197079421664,
                1.8651043562170007
              ],
              "variance": 0.30099780950328237,
              "mean_reward": 1.784479942957193,
              "min_reward": 1.5358880020727856,
              "max_reward": 2.006197079421664,
              "num_responses": 7,
              "rvariance": 0.01988458606903875
            },
            {
              "id": "chat_sample_23",
              "rewards": [
                0.9715171092541315,
                0.7128471167122482,
                1.0890943785913512,
                0.9480016553866876,
                1.112609832458795,
                0.9950325631215754,
                1.0420634708564633
              ],
              "variance": 0.24456072022141684,
              "mean_reward": 0.9815951609116075,
              "min_reward": 0.7128471167122482,
              "max_reward": 1.112609832458795,
              "num_responses": 7,
              "rvariance": 0.015144786892536899
            },
            {
              "id": "chat_sample_236",
              "rewards": [
                -0.8156573846716071,
                -0.4746833035936701,
                -0.521714211328558,
                -0.46292557665994816,
                -0.5334719382622799,
                -0.7215955692018313,
                -0.45116784972622614
              ],
              "variance": 0.3009978095032822,
              "mean_reward": -0.5687451190634458,
              "min_reward": -0.8156573846716071,
              "max_reward": -0.45116784972622614,
              "num_responses": 7,
              "rvariance": 0.017379263647173484
            },
            {
              "id": "chat_sample_234",
              "rewards": [
                -2.0443398492455525,
                -2.061976439646135,
                -1.803306447104252,
                -1.797427583637391,
                -1.9385203068420547,
                -1.856216218306001,
                -1.8738528087065838
              ],
              "variance": 0.250439583688278,
              "mean_reward": -1.9108056647839955,
              "min_reward": -2.061976439646135,
              "max_reward": -1.797427583637391,
              "num_responses": 7,
              "rvariance": 0.010029753614561977
            },
            {
              "id": "chat_sample_194",
              "rewards": [
                0.9244862015192435,
                1.136125286326239,
                1.2301871017960146,
                0.9244862015192435,
                1.2301871017960146,
                1.2537025556634587,
                1.3477643711332343
              ],
              "variance": 0.3668410803321255,
              "mean_reward": 1.149562688536207,
              "min_reward": 0.9244862015192435,
              "max_reward": 1.3477643711332343,
              "num_responses": 7,
              "rvariance": 0.023518432104356855
            },
            {
              "id": "chat_sample_70",
              "rewards": [
                1.2066716479285706,
                1.3007334633983465,
                1.44182618660301,
                1.3242489172657903,
                1.3242489172657903,
                1.3477643711332343,
                1.4183107327355662
              ],
              "variance": 0.1646081770721075,
              "mean_reward": 1.3376863194757582,
              "min_reward": 1.2066716479285706,
              "max_reward": 1.44182618660301,
              "num_responses": 7,
              "rvariance": 0.005191208621882994
            },
            {
              "id": "chat_sample_74",
              "rewards": [
                0.03089895455637435,
                0.136718496959872,
                0.148476223893594,
                0.148476223893594,
                -0.02788968011223547,
                -0.2160133110517869,
                -0.2160133110517869
              ],
              "variance": 0.3644895349453809,
              "mean_reward": 0.0006647995839464405,
              "min_reward": -0.2160133110517869,
              "max_reward": 0.148476223893594,
              "num_responses": 7,
              "rvariance": 0.022547901796787416
            },
            {
              "id": "chat_sample_200",
              "rewards": [
                -0.42765239585878223,
                -0.46292557665994816,
                -0.07492058784712333,
                -0.09843604171456725,
                -0.45116784972622614,
                0.00738350068893042,
                -0.12195149558201118
              ],
              "variance": 0.41387198806701314,
              "mean_reward": -0.23281006381424682,
              "min_reward": -0.46292557665994816,
              "max_reward": 0.00738350068893042,
              "num_responses": 7,
              "rvariance": 0.03593783447040516
            },
            {
              "id": "chat_sample_260",
              "rewards": [
                -0.3335905803890065,
                -0.039647407045957435,
                -0.0514051339796794,
                -0.12195149558201118,
                -0.12195149558201118,
                0.00738350068893042,
                -0.22777103798550885
              ],
              "variance": 0.2492638109949056,
              "mean_reward": -0.12699052141074915,
              "min_reward": -0.3335905803890065,
              "max_reward": 0.00738350068893042,
              "num_responses": 7,
              "rvariance": 0.012041346955541626
            },
            {
              "id": "chat_sample_315",
              "rewards": [
                0.36011530870058933,
                0.9715171092541315,
                0.806908932182024,
                0.806908932182024,
                1.136125286326239,
                1.136125286326239,
                1.0890943785913512
              ],
              "variance": 0.5079338035367889,
              "mean_reward": 0.9009707476517997,
              "min_reward": 0.36011530870058933,
              "max_reward": 1.136125286326239,
              "num_responses": 7,
              "rvariance": 0.06588320855337584
            },
            {
              "id": "chat_sample_240",
              "rewards": [
                0.5012080319052529,
                0.5482389396401407,
                0.5482389396401407,
                0.45417712417036504,
                0.5952698473750286,
                0.5717543935075847,
                0.5482389396401407
              ],
              "variance": 0.09876490624326456,
              "mean_reward": 0.5381608879826648,
              "min_reward": 0.45417712417036504,
              "max_reward": 0.5952698473750286,
              "num_responses": 7,
              "rvariance": 0.001873349198331688
            },
            {
              "id": "chat_sample_20",
              "rewards": [
                2.2178361642286597,
                2.076743441023996,
                1.9826816255542203,
                2.053227987156552,
                2.0297125332891084,
                2.2883825258309916,
                2.10025889489144
              ],
              "variance": 0.23515453867443936,
              "mean_reward": 2.106977595996424,
              "min_reward": 1.9826816255542203,
              "max_reward": 2.2883825258309916,
              "num_responses": 7,
              "rvariance": 0.010066430631999194
            },
            {
              "id": "chat_sample_210",
              "rewards": [
                0.3013266740319795,
                0.7598780244471361,
                0.5482389396401407,
                0.36011530870058933,
                0.6423007551099165,
                0.5717543935075847,
                0.8539398399169118
              ],
              "variance": 0.4609028958019011,
              "mean_reward": 0.5767934193363227,
              "min_reward": 0.3013266740319795,
              "max_reward": 0.8539398399169118,
              "num_responses": 7,
              "rvariance": 0.03404191479980443
            },
            {
              "id": "chat_sample_93",
              "rewards": [
                -0.08667831478084528,
                -0.11019376864828921,
                -0.09843604171456725,
                -0.4394101227925042,
                -0.29831739958784065,
                0.12496077002615005,
                -0.2395287649192308
              ],
              "variance": 0.352731808011659,
              "mean_reward": -0.1639433774881611,
              "min_reward": -0.4394101227925042,
              "max_reward": 0.12496077002615005,
              "num_responses": 7,
              "rvariance": 0.0280381691762354
            },
            {
              "id": "chat_sample_226",
              "rewards": [
                0.43066167030292113,
                0.7363625705796921,
                0.8304243860494679,
                0.9244862015192435,
                0.8774552937843557,
                0.8539398399169118,
                0.9244862015192435
              ],
              "variance": 0.31040399105025973,
              "mean_reward": 0.7968308805245481,
              "min_reward": 0.43066167030292113,
              "max_reward": 0.9244862015192435,
              "num_responses": 7,
              "rvariance": 0.025888331692607767
            },
            {
              "id": "chat_sample_30",
              "rewards": [
                1.0420634708564633,
                1.136125286326239,
                1.3477643711332343,
                1.136125286326239,
                1.1596407401936828,
                1.136125286326239,
                1.2301871017960146
              ],
              "variance": 0.17871744939257383,
              "mean_reward": 1.169718791851159,
              "min_reward": 1.0420634708564633,
              "max_reward": 1.3477643711332343,
              "num_responses": 7,
              "rvariance": 0.007877094821900705
            },
            {
              "id": "chat_sample_142",
              "rewards": [
                -0.25128649185295276,
                -0.2630442187866747,
                0.21902258549592576,
                0.21902258549592576,
                0.3365998548331454,
                0.2425380393633697,
                0.136718496959872
              ],
              "variance": 0.5361523481777215,
              "mean_reward": 0.09136726450123016,
              "min_reward": -0.2630442187866747,
              "max_reward": 0.3365998548331454,
              "num_responses": 7,
              "rvariance": 0.051522745572188666
            },
            {
              "id": "chat_sample_136",
              "rewards": [
                -0.7803842038704412,
                -0.6040182998646118,
                -0.4158946689250603,
                -0.35710603425645043,
                -0.509956484394836,
                -0.6745646614669435,
                -0.4041369419913383
              ],
              "variance": 0.33156789953095944,
              "mean_reward": -0.5351516135385259,
              "min_reward": -0.7803842038704412,
              "max_reward": -0.35710603425645043,
              "num_responses": 7,
              "rvariance": 0.021148532516105923
            },
            {
              "id": "chat_sample_16",
              "rewards": [
                1.1596407401936828,
                1.3242489172657903,
                1.2772180095309025,
                1.2301871017960146,
                1.0655789247239071,
                1.112609832458795,
                1.2772180095309025
              ],
              "variance": 0.20223290326001786,
              "mean_reward": 1.2066716479285708,
              "min_reward": 1.0655789247239071,
              "max_reward": 1.3242489172657903,
              "num_responses": 7,
              "rvariance": 0.007899665294169765
            },
            {
              "id": "chat_sample_22",
              "rewards": [
                1.1831561940611268,
                1.3007334633983465,
                1.3242489172657903,
                1.2537025556634587,
                1.3007334633983465,
                1.2066716479285706,
                1.2301871017960146
              ],
              "variance": 0.11287417856373083,
              "mean_reward": 1.2570619062159505,
              "min_reward": 1.1831561940611268,
              "max_reward": 1.3242489172657903,
              "num_responses": 7,
              "rvariance": 0.0024376110050581
            },
            {
              "id": "chat_sample_217",
              "rewards": [
                -0.19249785718434295,
                -0.11019376864828921,
                -0.08667831478084528,
                -0.39237921505761636,
                0.10144531615870613,
                -0.0514051339796794,
                -0.004374226244791544
              ],
              "variance": 0.31040399105025984,
              "mean_reward": -0.10515474281955124,
              "min_reward": -0.39237921505761636,
              "max_reward": 0.10144531615870613,
              "num_responses": 7,
              "rvariance": 0.02088897208501177
            }
          ]
        },
        "semantic_benchmark_chat_hard_filtered.json": {
          "file_name": "semantic_benchmark_chat_hard_filtered.json",
          "processed_samples": 200,
          "global_mean": 2.357257827939723,
          "global_std": 2.259938334279243,
          "mean_variance": 0.4197105217755629,
          "mean_rvariance": 0.05893580239078901,
          "sample_results": [
            {
              "id": "chat_hard_sample_121",
              "rewards": [
                0.6231883192111276,
                -0.1027717546168341,
                0.6231883192111276,
                -0.1027717546168341,
                0.6231883192111276,
                -0.1027717546168341
              ],
              "variance": 0.7259600738279617,
              "mean_reward": 0.26020828229714676,
              "min_reward": -0.1027717546168341,
              "max_reward": 0.6231883192111276,
              "num_responses": 6,
              "rvariance": 0.13175450719807488
            },
            {
              "id": "chat_hard_sample_77",
              "rewards": [
                1.3629762039691458,
                0.401943344330225,
                0.8236915776969456,
                0.3881155334001686,
                0.38120162793514034,
                0.8236915776969456,
                1.4874265023396533
              ],
              "variance": 1.0274063521031915,
              "mean_reward": 0.8098637667668892,
              "min_reward": 0.38120162793514034,
              "max_reward": 1.4874265023396533,
              "num_responses": 7,
              "rvariance": 0.18477555974165266
            },
            {
              "id": "chat_hard_sample_265",
              "rewards": [
                0.27749304595971724,
                0.27749304595971724,
                -0.8451523539242378,
                -0.1027717546168341,
                0.27749304595971724,
                0.20144008584440698,
                -0.49686436612344187
              ],
              "variance": 0.9136726072034774,
              "mean_reward": -0.058695607277279294,
              "min_reward": -0.8451523539242378,
              "max_reward": 0.27749304595971724,
              "num_responses": 7,
              "rvariance": 0.1741696846959171
            },
            {
              "id": "chat_hard_sample_334",
              "rewards": [
                2.4968567002337716,
                1.805466153730951,
                1.8469495865211203,
                1.805466153730951,
                1.8884330193112897,
                1.9852276958216846
              ],
              "variance": 0.4355760442967771,
              "mean_reward": 1.971399884891628,
              "min_reward": 1.805466153730951,
              "max_reward": 2.4968567002337716,
              "num_responses": 6,
              "rvariance": 0.05895590949452783
            },
            {
              "id": "chat_hard_sample_61",
              "rewards": [
                1.6671880444303868,
                1.3906318258292585,
                1.3906318258292585,
                1.6948436662904995,
                1.3629762039691458,
                1.0311087416477918,
                1.473598691409597
              ],
              "variance": 0.44802107413382775,
              "mean_reward": 1.430139857057991,
              "min_reward": 1.0311087416477918,
              "max_reward": 1.6948436662904995,
              "num_responses": 7,
              "rvariance": 0.0421438823524038
            },
            {
              "id": "chat_hard_sample_133",
              "rewards": [
                0.8790028214171712,
                -0.019804889036495625,
                0.19452618037937877,
                0.07007588200887106,
                -0.12351347101191873,
                -0.27561939124253926
              ],
              "variance": 0.736330932025504,
              "mean_reward": 0.12077785541907793,
              "min_reward": -0.27561939124253926,
              "max_reward": 0.8790028214171712,
              "num_responses": 6,
              "rvariance": 0.1365811903289895
            },
            {
              "id": "chat_hard_sample_62",
              "rewards": [
                0.7960359558368327,
                0.2083539913094352,
                0.9619696869975097,
                1.0172809307177353
              ],
              "variance": 0.6160289769340132,
              "mean_reward": 0.7459101412153782,
              "min_reward": 0.2083539913094352,
              "max_reward": 1.0172809307177353,
              "num_responses": 4,
              "rvariance": 0.10295076107796966
            },
            {
              "id": "chat_hard_sample_84",
              "rewards": [
                0.021678543753673618,
                -0.99336920233078,
                -0.3309306349627649,
                -0.9829983441332376,
                -0.9829983441332376,
                -0.99336920233078
              ],
              "variance": 0.8387431567262343,
              "mean_reward": -0.7103311973561878,
              "min_reward": -0.99336920233078,
              "max_reward": 0.021678543753673618,
              "num_responses": 6,
              "rvariance": 0.1647831363678735
            },
            {
              "id": "chat_hard_sample_343",
              "rewards": [
                0.29132085688977366,
                -0.2168511947897995,
                -0.17882471473214437,
                0.436512871655366
              ],
              "variance": 0.5983985179981913,
              "mean_reward": 0.08303945475579895,
              "min_reward": -0.2168511947897995,
              "max_reward": 0.436512871655366,
              "num_responses": 4,
              "rvariance": 0.08170796096901023
            },
            {
              "id": "chat_hard_sample_87",
              "rewards": [
                1.0311087416477918,
                0.13230103119412492,
                -0.15808299833705974,
                -0.16499690380208795,
                -0.13042737647694694
              ],
              "variance": 0.8338169990824017,
              "mean_reward": 0.1419804988451644,
              "min_reward": -0.16499690380208795,
              "max_reward": 1.0311087416477918,
              "num_responses": 5,
              "rvariance": 0.20982440057161647
            },
            {
              "id": "chat_hard_sample_110",
              "rewards": [
                0.8928306323472277,
                -1.4993806585525318,
                -1.4181422693384504,
                -2.951300806208455,
                -1.4181422693384504,
                -1.3904866474783375,
                -1.4181422693384504
              ],
              "variance": 1.6029889820667904,
              "mean_reward": -1.3146806125582067,
              "min_reward": -2.951300806208455,
              "max_reward": 0.8928306323472277,
              "num_responses": 7,
              "rvariance": 1.0890864514056393
            },
            {
              "id": "chat_hard_sample_150",
              "rewards": [
                0.10464540933401209,
                0.13230103119412492,
                0.27057914049468906,
                0.471082398980507,
                0.07007588200887106,
                0.471082398980507,
                0.15304274758920955
              ],
              "variance": 0.3802648005765513,
              "mean_reward": 0.238972715511703,
              "min_reward": 0.07007588200887106,
              "max_reward": 0.471082398980507,
              "num_responses": 7,
              "rvariance": 0.024868792799247162
            },
            {
              "id": "chat_hard_sample_65",
              "rewards": [
                -0.8918212158131782,
                -0.6040299008313791,
                -0.5452617043786393,
                -0.7250232464693727,
                -0.45883788606578674,
                -1.003307941436758,
                -0.45883788606578674
              ],
              "variance": 0.4775780199968234,
              "mean_reward": -0.6695885401515573,
              "min_reward": -1.003307941436758,
              "max_reward": -0.45883788606578674,
              "num_responses": 7,
              "rvariance": 0.03891654018119972
            },
            {
              "id": "chat_hard_sample_46",
              "rewards": [
                0.24983742409960444,
                0.9066584432772841,
                1.1970424728084688,
                1.1693868509483558,
                1.100247796298074,
                0.9896253088576226,
                1.0449365525778482
              ],
              "variance": 0.5365190640861888,
              "mean_reward": 0.9511049784096083,
              "min_reward": 0.24983742409960444,
              "max_reward": 1.1970424728084688,
              "num_responses": 7,
              "rvariance": 0.09063080921997727
            },
            {
              "id": "chat_hard_sample_114",
              "rewards": [
                2.5245123220938845,
                2.0958501832621357,
                1.1693868509483558,
                1.1693868509483558
              ],
              "variance": 1.2265268294960043,
              "mean_reward": 1.7397840518131829,
              "min_reward": 1.1693868509483558,
              "max_reward": 2.5245123220938845,
              "num_responses": 4,
              "rvariance": 0.3483218704129062
            },
            {
              "id": "chat_hard_sample_371",
              "rewards": [
                0.2982347623548019,
                0.5609631700258737,
                0.29132085688977366,
                0.06316197654384285
              ],
              "variance": 0.35053500707693014,
              "mean_reward": 0.303420191453573,
              "min_reward": 0.06316197654384285,
              "max_reward": 0.5609631700258737,
              "num_responses": 4,
              "rvariance": 0.031056419553831937
            },
            {
              "id": "chat_hard_sample_223",
              "rewards": [
                0.18069836944932238,
                0.9896253088576226,
                0.4503406825854224,
                0.2290957077045198,
                0.9481418760674533
              ],
              "variance": 0.7729746309901535,
              "mean_reward": 0.5595803889328681,
              "min_reward": 0.18069836944932238,
              "max_reward": 0.9896253088576226,
              "num_responses": 5,
              "rvariance": 0.12012473701894759
            },
            {
              "id": "chat_hard_sample_52",
              "rewards": [
                -0.08203003822174948,
                0.06316197654384285,
                0.6439300356062122,
                0.39502943886519676,
                0.12538712572909672,
                0.33971819514497115,
                0.06316197654384285
              ],
              "variance": 0.48950450692399705,
              "mean_reward": 0.22119410145877333,
              "min_reward": -0.08203003822174948,
              "max_reward": 0.6439300356062122,
              "num_responses": 7,
              "rvariance": 0.05343493083265198
            },
            {
              "id": "chat_hard_sample_372",
              "rewards": [
                0.3051486678198301,
                -0.7077384828068022,
                -0.9246622667720622,
                -1.0743915319990793
              ],
              "variance": 1.0307552750628148,
              "mean_reward": -0.6004109034395284,
              "min_reward": -1.0743915319990793,
              "max_reward": 0.3051486678198301,
              "num_responses": 4,
              "rvariance": 0.29033848231624637
            },
            {
              "id": "chat_hard_sample_346",
              "rewards": [
                1.8192939646610076,
                1.7639827209407817,
                1.266181527458751,
                1.2800093383888071,
                1.833121775591064
              ],
              "variance": 0.5558779993882681,
              "mean_reward": 1.5925178654080825,
              "min_reward": 1.266181527458751,
              "max_reward": 1.833121775591064,
              "num_responses": 5,
              "rvariance": 0.06857496447929992
            },
            {
              "id": "chat_hard_sample_108",
              "rewards": [
                1.003453119787679,
                0.13921493665915313,
                1.3214927711789766,
                1.3214927711789766,
                1.1140756072281304
              ],
              "variance": 0.836582561268413,
              "mean_reward": 0.9799458412065831,
              "min_reward": 0.13921493665915313,
              "max_reward": 1.3214927711789766,
              "num_responses": 5,
              "rvariance": 0.19173609017751164
            },
            {
              "id": "chat_hard_sample_64",
              "rewards": [
                3.1882472467365925,
                2.2894395362829254,
                1.7916383428008946,
                1.9160886411714024,
                2.261783914422813,
                2.6904460532545618
              ],
              "variance": 1.0854831580094284,
              "mean_reward": 2.356273955778198,
              "min_reward": 1.7916383428008946,
              "max_reward": 3.1882472467365925,
              "num_responses": 6,
              "rvariance": 0.22163704029704082
            },
            {
              "id": "chat_hard_sample_233",
              "rewards": [
                -0.2963611076376239,
                -0.4173544532756175,
                -0.17191080926711616,
                -0.4104405478105893,
                0.021678543753673618,
                -0.27216243851002514,
                -0.25487767484745466
              ],
              "variance": 0.3187310419378004,
              "mean_reward": -0.2573469267992504,
              "min_reward": -0.4173544532756175,
              "max_reward": 0.021678543753673618,
              "num_responses": 7,
              "rvariance": 0.019420330231233855
            },
            {
              "id": "chat_hard_sample_47",
              "rewards": [
                -2.1078043394750137,
                -2.2875658815657474,
                -1.710254775235892,
                -2.0870626230799294
              ],
              "variance": 0.4103402893494241,
              "mean_reward": -2.048171904839146,
              "min_reward": -2.2875658815657474,
              "max_reward": -1.710254775235892,
              "num_responses": 4,
              "rvariance": 0.04414149444954097
            },
            {
              "id": "chat_hard_sample_26",
              "rewards": [
                0.36045991154005574,
                0.6854134683963815,
                0.671585657466325,
                1.2108702837385252,
                0.2636652350296608,
                1.5150821241997663,
                0.6439300356062122
              ],
              "variance": 1.010812978987124,
              "mean_reward": 0.7644295308538467,
              "min_reward": 0.2636652350296608,
              "max_reward": 1.5150821241997663,
              "num_responses": 7,
              "rvariance": 0.17230409233440427
            },
            {
              "id": "chat_hard_sample_379",
              "rewards": [
                0.9066584432772841,
                1.266181527458751,
                1.473598691409597,
                1.4874265023396533,
                1.5289099351298228,
                0.6093605082810711,
                1.2800093383888071
              ],
              "variance": 0.7162806061769221,
              "mean_reward": 1.2217349923264267,
              "min_reward": 0.6093605082810711,
              "max_reward": 1.5289099351298228,
              "num_responses": 7,
              "rvariance": 0.10114726875143361
            },
            {
              "id": "chat_hard_sample_247",
              "rewards": [
                0.7545525230466635,
                0.9066584432772841,
                0.6093605082810711,
                0.9757974979275661
              ],
              "variance": 0.30213766882173265,
              "mean_reward": 0.8115922431331462,
              "min_reward": 0.6093605082810711,
              "max_reward": 0.9757974979275661,
              "num_responses": 4,
              "rvariance": 0.02003803809019248
            },
            {
              "id": "chat_hard_sample_215",
              "rewards": [
                1.003453119787679,
                1.3214927711789766,
                1.0449365525778482,
                0.7822081449067764,
                1.141731229088243,
                1.0587643635079047,
                1.1555590400182996
              ],
              "variance": 0.3069774026472525,
              "mean_reward": 1.0725921744379612,
              "min_reward": 0.7822081449067764,
              "max_reward": 1.3214927711789766,
              "num_responses": 7,
              "rvariance": 0.02338205028292626
            },
            {
              "id": "chat_hard_sample_49",
              "rewards": [
                -0.39315578414801877,
                -0.7232947701031156,
                -0.635142475424006,
                -0.4761226497283573,
                -0.35858625682287776,
                -0.019804889036495625,
                -0.5348908461810971
              ],
              "variance": 0.4473296835873251,
              "mean_reward": -0.44871395306342404,
              "min_reward": -0.7232947701031156,
              "max_reward": -0.019804889036495625,
              "num_responses": 7,
              "rvariance": 0.04478580136619092
            },
            {
              "id": "chat_hard_sample_415",
              "rewards": [
                1.3214927711789766,
                1.542737746059879,
                1.9990555067517408,
                1.8746052083812332,
                1.7778105318708384,
                1.902260830241346,
                1.9437442630315152
              ],
              "variance": 0.5116290044120875,
              "mean_reward": 1.7659581225022183,
              "min_reward": 1.3214927711789766,
              "max_reward": 1.9990555067517408,
              "num_responses": 7,
              "rvariance": 0.05197745490129803
            },
            {
              "id": "chat_hard_sample_297",
              "rewards": [
                -1.0524074732157473,
                -0.5590895153086958,
                -0.7889768720208836,
                -0.7250232464693727,
                -0.7111954355393163,
                -0.88490731034815,
                -0.3758710204854483
              ],
              "variance": 0.4661052581157922,
              "mean_reward": -0.7282101247696591,
              "min_reward": -1.0524074732157473,
              "max_reward": -0.3758710204854483,
              "num_responses": 7,
              "rvariance": 0.04091354386776317
            },
            {
              "id": "chat_hard_sample_80",
              "rewards": [
                -0.012890983571467417,
                -0.012890983571467417,
                0.29132085688977366,
                0.29132085688977366,
                -0.24104986391739824
              ],
              "variance": 0.44110716866879957,
              "mean_reward": 0.06316197654384285,
              "min_reward": -0.24104986391739824,
              "max_reward": 0.29132085688977366,
              "num_responses": 5,
              "rvariance": 0.04164517974456702
            },
            {
              "id": "chat_hard_sample_413",
              "rewards": [
                -0.5210630352510406,
                -0.49340741339092775,
                -0.8589801648542942,
                -0.569460373506238,
                -0.5348908461810971,
                -0.4311822642056739
              ],
              "variance": 0.25192543038196535,
              "mean_reward": -0.5681640162315452,
              "min_reward": -0.8589801648542942,
              "max_reward": -0.4311822642056739,
              "num_responses": 6,
              "rvariance": 0.01870897819213858
            },
            {
              "id": "chat_hard_sample_306",
              "rewards": [
                -0.1822816674646585,
                -0.02671879450152383,
                -0.13734128194197515,
                -0.13042737647694694,
                -0.1027717546168341,
                -0.00597707810643921,
                -0.012890983571467417
              ],
              "variance": 0.14519201476559235,
              "mean_reward": -0.0854869909542636,
              "min_reward": -0.1822816674646585,
              "max_reward": -0.00597707810643921,
              "num_responses": 7,
              "rvariance": 0.004203169377669717
            },
            {
              "id": "chat_hard_sample_43",
              "rewards": [
                -1.2461588708958737,
                -1.8035924990137728,
                -1.5858044768653845,
                -1.8312481208738856,
                -0.8252748757122818,
                -1.6272879096555537,
                -1.4959237058200177
              ],
              "variance": 0.7368494749353811,
              "mean_reward": -1.4878986369766811,
              "min_reward": -1.8312481208738856,
              "max_reward": -0.8252748757122818,
              "num_responses": 7,
              "rvariance": 0.106305595809936
            },
            {
              "id": "chat_hard_sample_102",
              "rewards": [
                0.837519388627002,
                1.100247796298074,
                0.9066584432772841,
                0.8928306323472277,
                1.3906318258292585,
                1.1140756072281304
              ],
              "variance": 0.38717870604157956,
              "mean_reward": 1.0403272822678293,
              "min_reward": 0.837519388627002,
              "max_reward": 1.3906318258292585,
              "num_responses": 6,
              "rvariance": 0.03541603644229834
            },
            {
              "id": "chat_hard_sample_187",
              "rewards": [
                -1.152821147117993,
                -1.7932216408162305,
                -1.0054685368945793,
                -1.2452946327127452,
                -1.0080612514439649,
                -1.0054685368945793
              ],
              "variance": 0.5137895998699087,
              "mean_reward": -1.2017226243133485,
              "min_reward": -1.7932216408162305,
              "max_reward": -1.0054685368945793,
              "num_responses": 6,
              "rvariance": 0.07811617031842065
            },
            {
              "id": "chat_hard_sample_360",
              "rewards": [
                0.39502943886519676,
                -0.88490731034815,
                -0.88490731034815,
                -1.502837611285046,
                -0.7371225810331721,
                -0.7371225810331721
              ],
              "variance": 1.0228258897326103,
              "mean_reward": -0.7253113258637489,
              "min_reward": -1.502837611285046,
              "max_reward": 0.39502943886519676,
              "num_responses": 6,
              "rvariance": 0.3184885536098206
            },
            {
              "id": "chat_hard_sample_236",
              "rewards": [
                0.09081759840395569,
                -0.15808299833705974,
                -0.06128832182666486,
                0.20144008584440698,
                -0.13734128194197515,
                0.021678543753673618,
                0.0009368273585889964
              ],
              "variance": 0.28070456188014525,
              "mean_reward": -0.005977078106439211,
              "min_reward": -0.15808299833705974,
              "max_reward": 0.20144008584440698,
              "num_responses": 7,
              "rvariance": 0.013807974787405633
            },
            {
              "id": "chat_hard_sample_259",
              "rewards": [
                1.7224992881506125,
                1.5150821241997663,
                1.542737746059879,
                1.2108702837385252,
                1.5150821241997663,
                1.570393367919992,
                1.8192939646610076
              ],
              "variance": 0.36781977073950056,
              "mean_reward": 1.5565655569899355,
              "min_reward": 1.2108702837385252,
              "max_reward": 1.8192939646610076,
              "num_responses": 7,
              "rvariance": 0.03141280119785655
            },
            {
              "id": "chat_hard_sample_127",
              "rewards": [
                1.6948436662904995,
                1.570393367919992,
                1.2800093383888071,
                1.5980489897801047,
                1.3491483930390893
              ],
              "variance": 0.34846083543742146,
              "mean_reward": 1.4984887510836984,
              "min_reward": 1.2800093383888071,
              "max_reward": 1.6948436662904995,
              "num_responses": 5,
              "rvariance": 0.024734712817985262
            },
            {
              "id": "chat_hard_sample_280",
              "rewards": [
                -0.7820629665558554,
                -0.9661456995622314,
                -0.45192398060075856,
                -0.6506987627203195,
                -0.8382384484592096,
                -0.6818113373129464,
                -0.6455133336215483
              ],
              "variance": 0.32132375648718603,
              "mean_reward": -0.716627789833267,
              "min_reward": -0.9661456995622314,
              "max_reward": -0.45192398060075856,
              "num_responses": 7,
              "rvariance": 0.023144899486615966
            },
            {
              "id": "chat_hard_sample_421",
              "rewards": [
                -0.40352664234556107,
                -0.6420563808890343,
                -0.3274736822302508,
                -0.1027717546168341,
                -0.5245199879835547,
                -0.26524853304499696,
                -0.2030233838597431
              ],
              "variance": 0.40861181298316707,
              "mean_reward": -0.3526600521385678,
              "min_reward": -0.6420563808890343,
              "max_reward": -0.1027717546168341,
              "num_responses": 7,
              "rvariance": 0.02985484332478272
            },
            {
              "id": "chat_hard_sample_270",
              "rewards": [
                0.2221818022394916,
                0.021678543753673618,
                0.2290957077045198,
                -0.23067900571985592,
                0.2221818022394916,
                -0.18573862019717258
              ],
              "variance": 0.43384756793051993,
              "mean_reward": 0.04645337167002469,
              "min_reward": -0.23067900571985592,
              "max_reward": 0.2290957077045198,
              "num_responses": 6,
              "rvariance": 0.03774140888604366
            },
            {
              "id": "chat_hard_sample_276",
              "rewards": [
                1.3353205821090328,
                1.3491483930390893,
                2.0405389395419102,
                0.9896253088576226,
                1.404459636759315,
                1.5289099351298228
              ],
              "variance": 0.6222514918525386,
              "mean_reward": 1.4413337992394653,
              "min_reward": 0.9896253088576226,
              "max_reward": 2.0405389395419102,
              "num_responses": 6,
              "rvariance": 0.09864226586778124
            },
            {
              "id": "chat_hard_sample_349",
              "rewards": [
                0.2982347623548019,
                0.2982347623548019,
                0.007850732823617203,
                0.007850732823617203,
                -0.2030233838597431,
                0.007850732823617203,
                0.13921493665915313
              ],
              "variance": 0.3747336762045288,
              "mean_reward": 0.07945903942569507,
              "min_reward": -0.2030233838597431,
              "max_reward": 0.2982347623548019,
              "num_responses": 7,
              "rvariance": 0.027782281332706753
            },
            {
              "id": "chat_hard_sample_267",
              "rewards": [
                -0.7371225810331721,
                -0.9566390795478176,
                -0.6835398136792035,
                -0.8270033520785387,
                -0.6524272390865765,
                -0.6800828609466893,
                -0.635142475424006
              ],
              "variance": 0.23334430944470197,
              "mean_reward": -0.738851057399429,
              "min_reward": -0.9566390795478176,
              "max_reward": -0.635142475424006,
              "num_responses": 7,
              "rvariance": 0.01142043117462289
            },
            {
              "id": "chat_hard_sample_14",
              "rewards": [
                0.8513471995570584,
                0.5125658317706763,
                0.6923273738614096,
                0.6992412793264379,
                0.48491020991056344,
                0.6577578465362687
              ],
              "variance": 0.2765562186011283,
              "mean_reward": 0.6496916234937357,
              "min_reward": 0.48491020991056344,
              "max_reward": 0.8513471995570584,
              "num_responses": 6,
              "rvariance": 0.015159901322050098
            },
            {
              "id": "chat_hard_sample_13",
              "rewards": [
                1.7916383428008946,
                2.1511614269823616,
                2.2894395362829254,
                1.8607773974511768,
                1.929916452101459,
                -0.3205597767652226,
                2.206472670702587
              ],
              "variance": 1.2929003219602744,
              "mean_reward": 1.701263721365169,
              "min_reward": -0.3205597767652226,
              "max_reward": 2.2894395362829254,
              "num_responses": 7,
              "rvariance": 0.7110370473125568
            },
            {
              "id": "chat_hard_sample_147",
              "rewards": [
                -0.3205597767652226,
                -0.5072352243209842,
                -0.299818060370138,
                -0.36550016228790594,
                -0.24104986391739824
              ],
              "variance": 0.18598405700925874,
              "mean_reward": -0.34683261753232986,
              "min_reward": -0.5072352243209842,
              "max_reward": -0.24104986391739824,
              "num_responses": 5,
              "rvariance": 0.008033619040257043
            },
            {
              "id": "chat_hard_sample_173",
              "rewards": [
                0.29132085688977366,
                0.028592449218701823,
                0.0009368273585889964,
                0.028592449218701823,
                0.0009368273585889964,
                0.028592449218701823
              ],
              "variance": 0.15901982569564874,
              "mean_reward": 0.06316197654384285,
              "min_reward": 0.0009368273585889964,
              "max_reward": 0.29132085688977366,
              "num_responses": 6,
              "rvariance": 0.010564261620235662
            },
            {
              "id": "chat_hard_sample_345",
              "rewards": [
                0.7407247121166071,
                0.38120162793514034,
                -0.1891955729296867,
                0.10464540933401209,
                -0.12351347101191873,
                -0.05437441636163666
              ],
              "variance": 0.7173176919966764,
              "mean_reward": 0.14324804818041956,
              "min_reward": -0.1891955729296867,
              "max_reward": 0.7407247121166071,
              "num_responses": 6,
              "rvariance": 0.10597092360376477
            },
            {
              "id": "chat_hard_sample_412",
              "rewards": [
                -0.38969883141550465,
                -0.5763742789712663,
                -0.5106921770534983,
                -0.2687054857775111,
                -0.5763742789712663,
                -0.5106921770534983,
                -0.4069835950780752
              ],
              "variance": 0.23507278581095908,
              "mean_reward": -0.46278868918866,
              "min_reward": -0.5763742789712663,
              "max_reward": -0.2687054857775111,
              "num_responses": 7,
              "rvariance": 0.010931069485154736
            },
            {
              "id": "chat_hard_sample_21",
              "rewards": [
                1.3629762039691458,
                1.404459636759315,
                1.570393367919992,
                1.902260830241346,
                1.5842211788500484,
                1.805466153730951
              ],
              "variance": 0.47014557162191806,
              "mean_reward": 1.604962895245133,
              "min_reward": 1.3629762039691458,
              "max_reward": 1.902260830241346,
              "num_responses": 6,
              "rvariance": 0.03816200087551196
            },
            {
              "id": "chat_hard_sample_357",
              "rewards": [
                -1.537407138610187,
                -1.404314458408394,
                -1.2988774000667138,
                -1.1640562434986639,
                -1.3766588365482813,
                -1.1994900090069334,
                -1.215046296303247
              ],
              "variance": 0.27223502768548546,
              "mean_reward": -1.3136929117774885,
              "min_reward": -1.537407138610187,
              "max_reward": -1.1640562434986639,
              "num_responses": 7,
              "rvariance": 0.015372731044279069
            },
            {
              "id": "chat_hard_sample_184",
              "rewards": [
                -0.42772531147315984,
                -0.13734128194197515,
                -0.05437441636163666,
                -0.15116909287203156,
                0.09081759840395569,
                0.20144008584440698
              ],
              "variance": 0.435576044296777,
              "mean_reward": -0.0797254030667401,
              "min_reward": -0.42772531147315984,
              "max_reward": 0.20144008584440698,
              "num_responses": 6,
              "rvariance": 0.039718224432439574
            },
            {
              "id": "chat_hard_sample_348",
              "rewards": [
                0.27057914049468906,
                0.7960359558368327,
                0.9757974979275661,
                0.7960359558368327,
                0.7960359558368327,
                0.837519388627002
              ],
              "variance": 0.3733508951115232,
              "mean_reward": 0.7453339824266259,
              "min_reward": 0.27057914049468906,
              "max_reward": 0.9757974979275661,
              "num_responses": 6,
              "rvariance": 0.049119301892377794
            },
            {
              "id": "chat_hard_sample_283",
              "rewards": [
                -1.9626123247094216,
                -1.914214986454224,
                -2.073234812149873,
                -1.9764401356394778,
                -2.1354599613351266,
                -1.9902679465695343
              ],
              "variance": 0.16593373116067722,
              "mean_reward": -2.0087050278096097,
              "min_reward": -2.1354599613351266,
              "max_reward": -1.914214986454224,
              "num_responses": 6,
              "rvariance": 0.005444126777647845
            },
            {
              "id": "chat_hard_sample_0",
              "rewards": [
                -0.7042815300742881,
                -0.04054660543158024,
                0.5540492645608456,
                0.5333075481657609,
                0.6646717520012968,
                -0.14425518740700335,
                1.1279034181581866
              ],
              "variance": 1.21823014293797,
              "mean_reward": 0.2844069514247454,
              "min_reward": -0.7042815300742881,
              "max_reward": 1.1279034181581866,
              "num_responses": 7,
              "rvariance": 0.32251386412442795
            },
            {
              "id": "chat_hard_sample_258",
              "rewards": [
                0.13230103119412492,
                0.021678543753673618,
                0.38120162793514034,
                0.3673738170050839,
                0.2636652350296608,
                0.32589038421491473,
                0.4295989661903378
              ],
              "variance": 0.3125085270192749,
              "mean_reward": 0.27452994361756233,
              "min_reward": 0.021678543753673618,
              "max_reward": 0.4295989661903378,
              "num_responses": 7,
              "rvariance": 0.01870915221653704
            },
            {
              "id": "chat_hard_sample_161",
              "rewards": [
                -0.26524853304499696,
                -0.37932797321796236,
                -0.3758710204854483,
                -0.3862418786829906,
                -0.3032750131026521
              ],
              "variance": 0.10301719142892024,
              "mean_reward": -0.3419928837068101,
              "min_reward": -0.3862418786829906,
              "max_reward": -0.26524853304499696,
              "num_responses": 5,
              "rvariance": 0.0023776758958847155
            },
            {
              "id": "chat_hard_sample_4",
              "rewards": [
                0.2221818022394916,
                0.8236915776969456,
                0.7407247121166071,
                0.8236915776969456,
                0.9204862542073404,
                0.7683803339767199,
                0.9343140651373969
              ],
              "variance": 0.3927098304136021,
              "mean_reward": 0.7476386175816353,
              "min_reward": 0.2221818022394916,
              "max_reward": 0.9343140651373969,
              "num_responses": 7,
              "rvariance": 0.05041071705273413
            },
            {
              "id": "chat_hard_sample_238",
              "rewards": [
                0.15995665305423776,
                -0.22722205298734183,
                -0.033632699966552035,
                -0.17882471473214437,
                0.23600961316954802,
                0.07007588200887106
              ],
              "variance": 0.40100651697163603,
              "mean_reward": 0.0043937800911031,
              "min_reward": -0.22722205298734183,
              "max_reward": 0.23600961316954802,
              "num_responses": 6,
              "rvariance": 0.028470127375499355
            },
            {
              "id": "chat_hard_sample_8",
              "rewards": [
                -0.733665628300658,
                0.27749304595971724,
                0.4295989661903378,
                -0.48303655519338545,
                0.5540492645608456,
                0.6439300356062122,
                0.6093605082810711
              ],
              "variance": 1.206476503647422,
              "mean_reward": 0.18538994815773435,
              "min_reward": -0.733665628300658,
              "max_reward": 0.6439300356062122,
              "num_responses": 7,
              "rvariance": 0.269356843904858
            },
            {
              "id": "chat_hard_sample_32",
              "rewards": [
                -0.12351347101191873,
                0.7130690902564942,
                0.5747909809559302,
                0.602446602816043,
                0.7130690902564942,
                1.1140756072281304,
                0.6992412793264379
              ],
              "variance": 0.5780024968763582,
              "mean_reward": 0.6133113114039446,
              "min_reward": -0.12351347101191873,
              "max_reward": 1.1140756072281304,
              "num_responses": 7,
              "rvariance": 0.1175092408536215
            },
            {
              "id": "chat_hard_sample_109",
              "rewards": [
                -0.04746051089660845,
                -0.4138975005431034,
                -0.13734128194197515,
                0.0977315038689839,
                -0.13734128194197515,
                -0.13734128194197515,
                -0.1027717546168341
              ],
              "variance": 0.25858006439205494,
              "mean_reward": -0.12548887257335536,
              "min_reward": -0.4138975005431034,
              "max_reward": 0.0977315038689839,
              "num_responses": 7,
              "rvariance": 0.020004686377740572
            },
            {
              "id": "chat_hard_sample_188",
              "rewards": [
                -0.5521756098436675,
                -0.8270033520785387,
                -1.2608509200090587,
                -0.766506679259542,
                -0.7440364864982003,
                -0.7319371519344009,
                -0.6144007590289214
              ],
              "variance": 0.4110316798959268,
              "mean_reward": -0.7852729940931901,
              "min_reward": -1.2608509200090587,
              "max_reward": -0.5521756098436675,
              "num_responses": 7,
              "rvariance": 0.04519211912081537
            },
            {
              "id": "chat_hard_sample_53",
              "rewards": [
                -1.7897646880837164,
                -1.8589037427339985,
                -1.672228295178237,
                -1.8485328845364561,
                -1.9349567028493087,
                -1.568519713202814,
                -1.8554467900014844
              ],
              "variance": 0.25858006439205483,
              "mean_reward": -1.7897646880837164,
              "min_reward": -1.9349567028493087,
              "max_reward": -1.568519713202814,
              "num_responses": 7,
              "rvariance": 0.013770416003364705
            },
            {
              "id": "chat_hard_sample_356",
              "rewards": [
                -1.2936919709679426,
                -1.1614635289492783,
                -0.733665628300658,
                -0.9963940359717298,
                -0.8598444030374227,
                -0.766506679259542,
                -0.7647782028932849
              ],
              "variance": 0.46202173270050984,
              "mean_reward": -0.9394777784828369,
              "min_reward": -1.2936919709679426,
              "max_reward": -0.733665628300658,
              "num_responses": 7,
              "rvariance": 0.04101769806567047
            },
            {
              "id": "chat_hard_sample_63",
              "rewards": [
                1.0449365525778482,
                1.3214927711789766,
                2.3170951581430383,
                2.0543667504719667,
                1.8607773974511768,
                1.8746052083812332,
                1.8192939646610076
              ],
              "variance": 0.9485878298018704,
              "mean_reward": 1.7560811146950353,
              "min_reward": 1.0449365525778482,
              "max_reward": 2.3170951581430383,
              "num_responses": 7,
              "rvariance": 0.16104426154478751
            },
            {
              "id": "chat_hard_sample_159",
              "rewards": [
                -0.5037782715884701,
                -0.5487186571111534,
                -0.5348908461810971,
                -0.3413014931603072
              ],
              "variance": 0.15452578714338044,
              "mean_reward": -0.482172317010257,
              "min_reward": -0.5487186571111534,
              "max_reward": -0.3413014931603072,
              "num_responses": 4,
              "rvariance": 0.006879766246040068
            },
            {
              "id": "chat_hard_sample_152",
              "rewards": [
                -0.5902020899013227,
                -0.6213146644939496,
                -0.5348908461810971,
                -0.5487186571111534,
                -0.5798312317037804,
                -0.5279769407160688
              ],
              "variance": 0.0743244837490532,
              "mean_reward": -0.5671557383512286,
              "min_reward": -0.6213146644939496,
              "max_reward": -0.5279769407160688,
              "num_responses": 6,
              "rvariance": 0.001090153191328994
            },
            {
              "id": "chat_hard_sample_318",
              "rewards": [
                0.2221818022394916,
                0.9757974979275661,
                1.0311087416477918,
                0.10464540933401209,
                0.9896253088576226,
                1.100247796298074
              ],
              "variance": 0.902264663186181,
              "mean_reward": 0.7372677593840931,
              "min_reward": 0.10464540933401209,
              "max_reward": 1.100247796298074,
              "num_responses": 6,
              "rvariance": 0.16736706333868834
            },
            {
              "id": "chat_hard_sample_176",
              "rewards": [
                -1.6756852479107511,
                -1.1847979598937484,
                -1.3732018838157671,
                -1.1951688180912907,
                -1.139857574371065,
                -1.0730951747243864,
                -0.7699636319920561
              ],
              "variance": 0.5423526718223066,
              "mean_reward": -1.201681470114152,
              "min_reward": -1.6756852479107511,
              "max_reward": -0.7699636319920561,
              "num_responses": 7,
              "rvariance": 0.06588046034789809
            },
            {
              "id": "chat_hard_sample_274",
              "rewards": [
                -0.45192398060075856,
                -0.25142072211494054,
                -0.11659956554689052,
                -0.199566431127229,
                -0.20993728932477132,
                -0.27561939124253926
              ],
              "variance": 0.20568868758458914,
              "mean_reward": -0.2508445633261882,
              "min_reward": -0.45192398060075856,
              "max_reward": -0.11659956554689052,
              "num_responses": 6,
              "rvariance": 0.010561937907586671
            },
            {
              "id": "chat_hard_sample_389",
              "rewards": [
                -0.2963611076376239,
                -0.3516723513578495,
                -0.033632699966552035,
                -0.23067900571985592,
                -0.14425518740700335,
                -0.2790763439750534,
                -0.2030233838597431
              ],
              "variance": 0.21847941269489138,
              "mean_reward": -0.21981429713195447,
              "min_reward": -0.3516723513578495,
              "max_reward": -0.033632699966552035,
              "num_responses": 7,
              "rvariance": 0.009647241957937992
            },
            {
              "id": "chat_hard_sample_42",
              "rewards": [
                -1.4527117966635914,
                -1.3956720765771087,
                -1.2936919709679426,
                -1.1303509543566512,
                -1.056512604585608,
                -1.1472035989276577,
                -1.1338079070891653
              ],
              "variance": 0.31767235016346773,
              "mean_reward": -1.2299929870239608,
              "min_reward": -1.4527117966635914,
              "max_reward": -1.056512604585608,
              "num_responses": 7,
              "rvariance": 0.019605774226629045
            },
            {
              "id": "chat_hard_sample_5",
              "rewards": [
                -0.28599024944008156,
                -0.1027717546168341,
                -0.00597707810643921,
                0.06316197654384285,
                0.24983742409960444,
                0.13921493665915313,
                0.05624807107881465
              ],
              "variance": 0.3595230841814668,
              "mean_reward": 0.016246189459722893,
              "min_reward": -0.28599024944008156,
              "max_reward": 0.24983742409960444,
              "num_responses": 7,
              "rvariance": 0.025641918418790686
            },
            {
              "id": "chat_hard_sample_17",
              "rewards": [
                1.736327099080669,
                1.266181527458751,
                1.7778105318708384,
                1.805466153730951,
                1.8192939646610076,
                1.6118768007101612
              ],
              "variance": 0.3733508951115234,
              "mean_reward": 1.6694926795853966,
              "min_reward": 1.266181527458751,
              "max_reward": 1.8192939646610076,
              "num_responses": 6,
              "rvariance": 0.03718471372713421
            },
            {
              "id": "chat_hard_sample_182",
              "rewards": [
                -0.08894394368677769,
                -0.019804889036495625,
                -0.26524853304499696,
                -0.06820222729169308
              ],
              "variance": 0.1780330657244763,
              "mean_reward": -0.11054989826499083,
              "min_reward": -0.26524853304499696,
              "max_reward": -0.019804889036495625,
              "num_responses": 4,
              "rvariance": 0.008606616703193974
            },
            {
              "id": "chat_hard_sample_140",
              "rewards": [
                -0.799347730218426,
                -0.7768775374570842,
                -0.7388510573994291,
                -0.43809616967070214,
                -0.7094669591730592
              ],
              "variance": 0.2437151676422442,
              "mean_reward": -0.6925278907837401,
              "min_reward": -0.799347730218426,
              "max_reward": -0.43809616967070214,
              "num_responses": 5,
              "rvariance": 0.01713872190050314
            },
            {
              "id": "chat_hard_sample_251",
              "rewards": [
                -0.8278675902616672,
                -0.4173544532756175,
                -1.0319358312528903,
                -0.7474934392307143,
                -0.7630497265270278,
                -0.6904537191442317
              ],
              "variance": 0.3759976245473542,
              "mean_reward": -0.7463591266153582,
              "min_reward": -1.0319358312528903,
              "max_reward": -0.4173544532756175,
              "num_responses": 6,
              "rvariance": 0.033307839388672815
            },
            {
              "id": "chat_hard_sample_98",
              "rewards": [
                0.8098637667668892,
                0.671585657466325,
                1.3491483930390893,
                1.100247796298074,
                0.8651750104871149,
                1.1279034181581866,
                1.404459636759315
              ],
              "variance": 0.6167203674805161,
              "mean_reward": 1.0469119541392848,
              "min_reward": 0.671585657466325,
              "max_reward": 1.404459636759315,
              "num_responses": 7,
              "rvariance": 0.06552593263533005
            },
            {
              "id": "chat_hard_sample_409",
              "rewards": [
                0.03550635468373003,
                -0.15116909287203156,
                -0.02671879450152383,
                -0.2064803365922572,
                -0.019804889036495625,
                -0.18573862019717258
              ],
              "variance": 0.20396021121833208,
              "mean_reward": -0.09240089641929179,
              "min_reward": -0.2064803365922572,
              "max_reward": 0.03550635468373003,
              "num_responses": 6,
              "rvariance": 0.008520722324918585
            },
            {
              "id": "chat_hard_sample_248",
              "rewards": [
                -0.6766259082141752,
                -0.9255265049551907,
                -0.6627980972841189,
                -0.8952781685456923,
                -0.8468808302904949,
                -0.6576126681853477,
                -0.7716921083583131
              ],
              "variance": 0.24665357746488137,
              "mean_reward": -0.7766306122619048,
              "min_reward": -0.9255265049551907,
              "max_reward": -0.6576126681853477,
              "num_responses": 7,
              "rvariance": 0.011190109248138225
            },
            {
              "id": "chat_hard_sample_382",
              "rewards": [
                -0.8546589739386515,
                -0.6092153299301503,
                -0.45192398060075856,
                -0.8183609702472535,
                -0.600572948098865,
                -0.6887252427779746,
                -0.6506987627203195
              ],
              "variance": 0.2917668106241903,
              "mean_reward": -0.6677366011877103,
              "min_reward": -0.8546589739386515,
              "max_reward": -0.45192398060075856,
              "num_responses": 7,
              "rvariance": 0.016124181099331437
            },
            {
              "id": "chat_hard_sample_254",
              "rewards": [
                -0.48303655519338545,
                -0.6195861881276925,
                -0.2963611076376239,
                -0.45192398060075856,
                -0.4069835950780752,
                -0.4450100751357303
              ],
              "variance": 0.19963902030268943,
              "mean_reward": -0.4504835836288777,
              "min_reward": -0.6195861881276925,
              "max_reward": -0.2963611076376239,
              "num_responses": 6,
              "rvariance": 0.00922223457570299
            },
            {
              "id": "chat_hard_sample_2",
              "rewards": [
                -0.35858625682287776,
                0.3328042896799429,
                0.15995665305423776,
                -0.24450681664991233,
                0.3673738170050839,
                0.20144008584440698,
                -0.1027717546168341
              ],
              "variance": 0.6367706933290977,
              "mean_reward": 0.050815716784863914,
              "min_reward": -0.35858625682287776,
              "max_reward": 0.3673738170050839,
              "num_responses": 7,
              "rvariance": 0.070391502386085
            },
            {
              "id": "chat_hard_sample_203",
              "rewards": [
                -0.08894394368677769,
                0.16687055851926597,
                0.2844069514247455,
                -0.18573862019717258,
                0.20144008584440698,
                0.23600961316954802,
                0.20144008584440698
              ],
              "variance": 0.3830303627625627,
              "mean_reward": 0.11649781870263189,
              "min_reward": -0.18573862019717258,
              "max_reward": 0.2844069514247455,
              "num_responses": 7,
              "rvariance": 0.027571074144528616
            },
            {
              "id": "chat_hard_sample_68",
              "rewards": [
                -0.6645265736503759,
                -0.7146523882718304,
                -0.6368709517902631,
                -0.6627980972841189,
                -0.6420563808890343
              ],
              "variance": 0.05565693899347701,
              "mean_reward": -0.6641808783771246,
              "min_reward": -0.7146523882718304,
              "max_reward": -0.6368709517902631,
              "num_responses": 5,
              "rvariance": 0.0007569460758209579
            },
            {
              "id": "chat_hard_sample_220",
              "rewards": [
                -0.6178577117614354,
                -0.6489702863540624,
                -0.5176060825185265,
                -0.4899504606584137,
                -0.4553809333332726,
                -0.4899504606584137,
                -0.4311822642056739
              ],
              "variance": 0.18460127591625308,
              "mean_reward": -0.5215568856413998,
              "min_reward": -0.6489702863540624,
              "max_reward": -0.4311822642056739,
              "num_responses": 7,
              "rvariance": 0.005724056243118732
            },
            {
              "id": "chat_hard_sample_11",
              "rewards": [
                0.15304274758920955,
                0.7683803339767199,
                0.8236915776969456,
                0.7822081449067764
              ],
              "variance": 0.4736025243544321,
              "mean_reward": 0.6318307010424129,
              "min_reward": 0.15304274758920955,
              "max_reward": 0.8236915776969456,
              "num_responses": 4,
              "rvariance": 0.07682691956005659
            },
            {
              "id": "chat_hard_sample_6",
              "rewards": [
                0.07698978747389927,
                0.2982347623548019,
                0.5540492645608456,
                0.20144008584440698,
                0.602446602816043,
                0.5609631700258737
              ],
              "variance": 0.4424899497618053,
              "mean_reward": 0.38235394551264507,
              "min_reward": 0.07698978747389927,
              "max_reward": 0.602446602816043,
              "num_responses": 6,
              "rvariance": 0.04047907434551084
            },
            {
              "id": "chat_hard_sample_286",
              "rewards": [
                -2.7991948859778346,
                -2.709314114932468,
                -2.882161751558173,
                -2.4880691400515653,
                -2.481155234586537,
                -2.806108791442863
              ],
              "variance": 0.3595230841814665,
              "mean_reward": -2.694333986424907,
              "min_reward": -2.882161751558173,
              "max_reward": -2.481155234586537,
              "num_responses": 6,
              "rvariance": 0.024497242663615856
            },
            {
              "id": "chat_hard_sample_400",
              "rewards": [
                -0.0958578491518059,
                0.5333075481657609,
                0.06316197654384285,
                -0.46920874426332904,
                0.18069836944932238,
                -0.3516723513578495,
                -0.17882471473214437
              ],
              "variance": 0.7204289494559392,
              "mean_reward": -0.04548510933517182,
              "min_reward": -0.46920874426332904,
              "max_reward": 0.5333075481657609,
              "num_responses": 7,
              "rvariance": 0.0987961864257555
            },
            {
              "id": "chat_hard_sample_209",
              "rewards": [
                -0.48649350792589957,
                -0.2790763439750534,
                -0.43809616967070214,
                -0.4553809333332726,
                -0.3032750131026521,
                -0.24104986391739824,
                -0.3827849259504765
              ],
              "variance": 0.20396021121833208,
              "mean_reward": -0.3694509654107792,
              "min_reward": -0.48649350792589957,
              "max_reward": -0.24104986391739824,
              "num_responses": 7,
              "rvariance": 0.007858078063625292
            },
            {
              "id": "chat_hard_sample_337",
              "rewards": [
                2.068194561402023,
                1.7916383428008946,
                1.7501549100107252,
                1.805466153730951,
                1.4597708804795406,
                1.6257046116402176,
                1.8607773974511768
              ],
              "variance": 0.38441314385556846,
              "mean_reward": 1.7659581225022183,
              "min_reward": 1.4597708804795406,
              "max_reward": 2.068194561402023,
              "num_responses": 7,
              "rvariance": 0.03088990487978045
            },
            {
              "id": "chat_hard_sample_268",
              "rewards": [
                -0.28599024944008156,
                0.2290957077045198,
                -0.6195861881276925,
                0.2290957077045198,
                0.2290957077045198,
                0.15995665305423776
              ],
              "variance": 0.6818839264884069,
              "mean_reward": -0.009722110233329478,
              "min_reward": -0.6195861881276925,
              "max_reward": 0.2290957077045198,
              "num_responses": 6,
              "rvariance": 0.10802516857521478
            },
            {
              "id": "chat_hard_sample_249",
              "rewards": [
                0.0009368273585889964,
                0.27057914049468906,
                0.38120162793514034,
                0.1115593147990403,
                0.25675132956463265,
                0.3120625732848583,
                0.03550635468373003
              ],
              "variance": 0.31803965139129753,
              "mean_reward": 0.1955138811600971,
              "min_reward": 0.0009368273585889964,
              "max_reward": 0.38120162793514034,
              "num_responses": 7,
              "rvariance": 0.018279908970355148
            },
            {
              "id": "chat_hard_sample_295",
              "rewards": [
                0.13921493665915313,
                1.266181527458751,
                1.4321152586194277,
                1.4321152586194277,
                1.3906318258292585,
                1.2246980946685815,
                1.5289099351298228
              ],
              "variance": 0.6803282977587755,
              "mean_reward": 1.2019809767120602,
              "min_reward": 0.13921493665915313,
              "max_reward": 1.5289099351298228,
              "num_responses": 7,
              "rvariance": 0.1975006708852812
            },
            {
              "id": "chat_hard_sample_153",
              "rewards": [
                -1.9349567028493087,
                -1.9349567028493087,
                -1.9349567028493087,
                -1.6272879096555537,
                -1.9349567028493087,
                -1.9626123247094216
              ],
              "variance": 0.16766220752693384,
              "mean_reward": -1.8882878409603683,
              "min_reward": -1.9626123247094216,
              "max_reward": -1.6272879096555537,
              "num_responses": 6,
              "rvariance": 0.01372617061761953
            },
            {
              "id": "chat_hard_sample_192",
              "rewards": [
                -0.3136458713001944,
                -0.38969883141550465,
                -0.27561939124253926,
                -0.3309306349627649,
                -0.2687054857775111
              ],
              "variance": 0.0947205048708864,
              "mean_reward": -0.31572004293970285,
              "min_reward": -0.38969883141550465,
              "max_reward": -0.2687054857775111,
              "num_responses": 5,
              "rvariance": 0.001905391258744767
            },
            {
              "id": "chat_hard_sample_363",
              "rewards": [
                -1.1260297634410086,
                -1.5097515167500741,
                -1.0291270571577227,
                -1.1221406916169303,
                -1.267764825474087,
                -1.3248045455605697
              ],
              "variance": 0.34164415676799553,
              "mean_reward": -1.2299364000000654,
              "min_reward": -1.5097515167500741,
              "max_reward": -1.0291270571577227,
              "num_responses": 6,
              "rvariance": 0.025244725069560835
            },
            {
              "id": "chat_hard_sample_129",
              "rewards": [
                -0.48649350792589957,
                -0.6299570463252349,
                -0.7077384828068022,
                -0.7250232464693727,
                -0.7250232464693727
              ],
              "variance": 0.18114432318373896,
              "mean_reward": -0.6548471059993364,
              "min_reward": -0.7250232464693727,
              "max_reward": -0.48649350792589957,
              "num_responses": 5,
              "rvariance": 0.0083218656355965
            },
            {
              "id": "chat_hard_sample_359",
              "rewards": [
                -0.9108344558420057,
                -1.0847623901966217,
                -0.9940173809681264,
                -0.8944139303625638,
                -0.8970066449119494,
                -0.5106921770534983,
                -0.8382384484592096
              ],
              "variance": 0.32309544476259955,
              "mean_reward": -0.8757093468277108,
              "min_reward": -1.0847623901966217,
              "max_reward": -0.5106921770534983,
              "num_responses": 7,
              "rvariance": 0.027768396853237086
            },
            {
              "id": "chat_hard_sample_7",
              "rewards": [
                1.072592174437961,
                1.5150821241997663,
                1.5565655569899355,
                1.5012543132697098,
                1.3629762039691458,
                1.6257046116402176
              ],
              "variance": 0.3733508951115234,
              "mean_reward": 1.4390291640844561,
              "min_reward": 1.072592174437961,
              "max_reward": 1.6257046116402176,
              "num_responses": 6,
              "rvariance": 0.033063111405714954
            },
            {
              "id": "chat_hard_sample_316",
              "rewards": [
                -0.9354652440611687,
                -0.8624371175868083,
                -0.7492219155969714,
                -0.8131755411484823,
                -0.8563874503049086,
                -0.7181093410043445,
                -0.7492219155969714
              ],
              "variance": 0.15487148241663184,
              "mean_reward": -0.8120026464713793,
              "min_reward": -0.9354652440611687,
              "max_reward": -0.7181093410043445,
              "num_responses": 7,
              "rvariance": 0.0052081183604787635
            },
            {
              "id": "chat_hard_sample_41",
              "rewards": [
                -1.1243012870747517,
                -0.3966127368805329,
                -0.1027717546168341,
                -0.2064803365922572,
                -0.2790763439750534,
                -0.9004635976444635
              ],
              "variance": 0.8577563967550621,
              "mean_reward": -0.5016176761306488,
              "min_reward": -1.1243012870747517,
              "max_reward": -0.1027717546168341,
              "num_responses": 6,
              "rvariance": 0.14225795808818376
            },
            {
              "id": "chat_hard_sample_143",
              "rewards": [
                0.3535460060750275,
                -0.012890983571467417,
                0.07698978747389927,
                0.15995665305423776
              ],
              "variance": 0.28139595242664805,
              "mean_reward": 0.14440036575792428,
              "min_reward": -0.012890983571467417,
              "max_reward": 0.3535460060750275,
              "num_responses": 4,
              "rvariance": 0.01831716289413599
            },
            {
              "id": "chat_hard_sample_370",
              "rewards": [
                0.3328042896799429,
                0.16687055851926597,
                0.7199829957215225,
                0.36045991154005574,
                0.19452618037937877,
                0.4157711552602814,
                0.6923273738614096
              ],
              "variance": 0.5199256909701211,
              "mean_reward": 0.4118203521374081,
              "min_reward": 0.16687055851926597,
              "max_reward": 0.7199829957215225,
              "num_responses": 7,
              "rvariance": 0.041394657777249946
            },
            {
              "id": "chat_hard_sample_91",
              "rewards": [
                0.7130690902564942,
                0.5194797372357045,
                0.2844069514247455,
                0.6162744137460994,
                0.2290957077045198,
                0.5886187918859865,
                0.2844069514247455
              ],
              "variance": 0.39270983041360213,
              "mean_reward": 0.4621930919540422,
              "min_reward": 0.2290957077045198,
              "max_reward": 0.7130690902564942,
              "num_responses": 7,
              "rvariance": 0.031927893093274796
            },
            {
              "id": "chat_hard_sample_245",
              "rewards": [
                0.021678543753673618,
                -0.3620432095553919,
                -0.07511613275672127,
                0.049334165613786445,
                0.06316197654384285,
                -0.0958578491518059,
                -0.15116909287203156
              ],
              "variance": 0.2903840295311847,
              "mean_reward": -0.07857308548923538,
              "min_reward": -0.3620432095553919,
              "max_reward": 0.06316197654384285,
              "num_responses": 7,
              "rvariance": 0.018919383851882944
            },
            {
              "id": "chat_hard_sample_131",
              "rewards": [
                0.18069836944932238,
                0.25675132956463265,
                0.2290957077045198,
                0.10464540933401209,
                0.3328042896799429,
                0.18069836944932238
              ],
              "variance": 0.15210592023062053,
              "mean_reward": 0.21411557919695867,
              "min_reward": 0.10464540933401209,
              "max_reward": 0.3328042896799429,
              "num_responses": 6,
              "rvariance": 0.005057726560014787
            },
            {
              "id": "chat_hard_sample_171",
              "rewards": [
                -0.12351347101191873,
                0.4157711552602814,
                0.33971819514497115,
                0.18761227491435056,
                0.049334165613786445,
                -0.13042737647694694,
                0.2636652350296608
              ],
              "variance": 0.4964184123890253,
              "mean_reward": 0.14316573978202637,
              "min_reward": -0.13042737647694694,
              "max_reward": 0.4157711552602814,
              "num_responses": 7,
              "rvariance": 0.04060250887747791
            },
            {
              "id": "chat_hard_sample_329",
              "rewards": [
                2.4968567002337716,
                2.137333616052305,
                2.303267347212982,
                1.708671477220556,
                1.708671477220556
              ],
              "variance": 0.7107494818048996,
              "mean_reward": 2.070960123588034,
              "min_reward": 1.708671477220556,
              "max_reward": 2.4968567002337716,
              "num_responses": 5,
              "rvariance": 0.1004532214444708
            },
            {
              "id": "chat_hard_sample_384",
              "rewards": [
                -1.2764072073053723,
                -1.2608509200090587,
                -1.1057201661374882,
                -1.1951688180912907,
                -1.267764825474087,
                -1.3144336873630273,
                -1.2435661563464881
              ],
              "variance": 0.13222844201866457,
              "mean_reward": -1.237701682960973,
              "min_reward": -1.3144336873630273,
              "max_reward": -1.1057201661374882,
              "num_responses": 7,
              "rvariance": 0.0040125936075919855
            },
            {
              "id": "chat_hard_sample_29",
              "rewards": [
                -0.14425518740700335,
                -0.42772531147315984,
                0.671585657466325,
                0.6231883192111276,
                0.9757974979275661,
                0.15995665305423776,
                0.47799630444553526
              ],
              "variance": 1.0509136306842874,
              "mean_reward": 0.3337919904606612,
              "min_reward": -0.42772531147315984,
              "max_reward": 0.9757974979275661,
              "num_responses": 7,
              "rvariance": 0.2099253117565825
            },
            {
              "id": "chat_hard_sample_106",
              "rewards": [
                -1.5754336186678422,
                -1.668771342445723,
                -1.7448243025610333,
                -1.6307448623880678,
                -1.471725036692419,
                -1.3887581711120804,
                -1.6514865787831523
              ],
              "variance": 0.26065423603156357,
              "mean_reward": -1.5902491303786168,
              "min_reward": -1.7448243025610333,
              "max_reward": -1.3887581711120804,
              "num_responses": 7,
              "rvariance": 0.01290217398267863
            },
            {
              "id": "chat_hard_sample_320",
              "rewards": [
                -0.3378445404277931,
                -0.3171028240327085,
                -0.5452617043786393,
                -0.4069835950780752,
                -0.3620432095553919,
                -0.5210630352510406
              ],
              "variance": 0.2056886875845892,
              "mean_reward": -0.4150498181206081,
              "min_reward": -0.5452617043786393,
              "max_reward": -0.3171028240327085,
              "num_responses": 6,
              "rvariance": 0.007770495098242723
            },
            {
              "id": "chat_hard_sample_23",
              "rewards": [
                1.3214927711789766,
                1.833121775591064,
                2.1511614269823616,
                1.6810158553604433,
                2.1511614269823616,
                1.8746052083812332,
                2.261783914422813
              ],
              "variance": 0.6582038002706856,
              "mean_reward": 1.8963346255570361,
              "min_reward": 1.3214927711789766,
              "max_reward": 2.261783914422813,
              "num_responses": 7,
              "rvariance": 0.09209999178531805
            },
            {
              "id": "chat_hard_sample_235",
              "rewards": [
                -1.3230760691943126,
                -1.3127052109967703,
                -0.944107625892454,
                -1.304062829165485,
                -1.34208930922314,
                -1.0141109187258646,
                -1.3576455965194536
              ],
              "variance": 0.3622022225491651,
              "mean_reward": -1.2282567942453544,
              "min_reward": -1.3576455965194536,
              "max_reward": -0.944107625892454,
              "num_responses": 7,
              "rvariance": 0.025452470631675217
            },
            {
              "id": "chat_hard_sample_202",
              "rewards": [
                0.7130690902564942,
                0.6992412793264379,
                0.505651926305648,
                0.5817048864209583,
                0.4918241153755917,
                0.505651926305648,
                0.6093605082810711
              ],
              "variance": 0.20465160176483488,
              "mean_reward": 0.5866433903245498,
              "min_reward": 0.4918241153755917,
              "max_reward": 0.7130690902564942,
              "num_responses": 7,
              "rvariance": 0.007330303981388013
            },
            {
              "id": "chat_hard_sample_304",
              "rewards": [
                -0.02671879450152383,
                -0.15808299833705974,
                -0.07511613275672127,
                0.10464540933401209,
                -0.033632699966552035,
                0.07007588200887106,
                0.15304274758920955
              ],
              "variance": 0.23230722362494774,
              "mean_reward": 0.004887630481462261,
              "min_reward": -0.15808299833705974,
              "max_reward": 0.15304274758920955,
              "num_responses": 7,
              "rvariance": 0.010227695893115772
            },
            {
              "id": "chat_hard_sample_277",
              "rewards": [
                -0.3724140677529342,
                -0.19265252566220079,
                -0.3378445404277931,
                -0.3724140677529342,
                -0.299818060370138,
                -0.2894472021725957
              ],
              "variance": 0.13136420383553593,
              "mean_reward": -0.3107650773564326,
              "min_reward": -0.3724140677529342,
              "max_reward": -0.19265252566220079,
              "num_responses": 6,
              "rvariance": 0.0038098928675039203
            },
            {
              "id": "chat_hard_sample_196",
              "rewards": [
                0.8236915776969456,
                1.1832146618784123,
                0.9757974979275661,
                1.266181527458751,
                1.0864199853680174,
                1.1970424728084688,
                1.3491483930390893
              ],
              "variance": 0.38441314385556835,
              "mean_reward": 1.12592801659675,
              "min_reward": 0.8236915776969456,
              "max_reward": 1.3491483930390893,
              "num_responses": 7,
              "rvariance": 0.02761204736348235
            },
            {
              "id": "chat_hard_sample_185",
              "rewards": [
                -1.9418706083143369,
                -2.3843605580761422,
                -1.8001355462812587,
                -2.2391685433105497,
                -1.8934732700591395,
                -1.634201815120582,
                -1.8347050736063997
              ],
              "variance": 0.5634832953997988,
              "mean_reward": -1.9611307735383439,
              "min_reward": -2.3843605580761422,
              "max_reward": -1.634201815120582,
              "num_responses": 7,
              "rvariance": 0.05859462976232473
            },
            {
              "id": "chat_hard_sample_160",
              "rewards": [
                -0.36550016228790594,
                -0.4242683587406457,
                -0.4173544532756175,
                -0.4450100751357303,
                -0.42772531147315984,
                -0.465751791530815,
                -0.3205597767652226
              ],
              "variance": 0.10578275361493156,
              "mean_reward": -0.409452847029871,
              "min_reward": -0.465751791530815,
              "max_reward": -0.3205597767652226,
              "num_responses": 7,
              "rvariance": 0.002126217397848706
            },
            {
              "id": "chat_hard_sample_163",
              "rewards": [
                -0.49340741339092775,
                -0.48303655519338545,
                -0.48303655519338545,
                -0.6818113373129464,
                -0.48303655519338545,
                -0.4069835950780752
              ],
              "variance": 0.14259930021620681,
              "mean_reward": -0.5052186685603509,
              "min_reward": -0.6818113373129464,
              "max_reward": -0.4069835950780752,
              "num_responses": 6,
              "rvariance": 0.007075124088030662
            },
            {
              "id": "chat_hard_sample_266",
              "rewards": [
                -0.10968566008186231,
                -0.2237651002548277,
                0.08390369293892748,
                -0.07511613275672127,
                0.07698978747389927,
                -0.3032750131026521,
                -0.07511613275672127
              ],
              "variance": 0.335324415053868,
              "mean_reward": -0.08943779407713684,
              "min_reward": -0.3032750131026521,
              "max_reward": 0.08390369293892748,
              "num_responses": 7,
              "rvariance": 0.01747654121301245
            },
            {
              "id": "chat_hard_sample_289",
              "rewards": [
                -1.185662198076877,
                -1.1839337217106198,
                -0.7042815300742881,
                -0.8754006903337362,
                -0.7803344901895983,
                -0.7094669591730592,
                -0.5487186571111534
              ],
              "variance": 0.5425687313680886,
              "mean_reward": -0.8553997495241903,
              "min_reward": -1.185662198076877,
              "max_reward": -0.5487186571111534,
              "num_responses": 7,
              "rvariance": 0.0516041535128394
            },
            {
              "id": "chat_hard_sample_69",
              "rewards": [
                0.8651750104871149,
                0.6231883192111276,
                0.5678770754909019,
                0.5955326973510148,
                0.6923273738614096,
                0.7061551847914661,
                0.8236915776969456
              ],
              "variance": 0.25581450220604374,
              "mean_reward": 0.6962781769842828,
              "min_reward": 0.5678770754909019,
              "max_reward": 0.8651750104871149,
              "num_responses": 7,
              "rvariance": 0.010978871573934084
            },
            {
              "id": "chat_hard_sample_40",
              "rewards": [
                -1.1787482926118487,
                -1.2764072073053723,
                -1.304062829165485,
                -1.3282614982930838,
                -1.2625793963753158,
                -1.256529729093416,
                -1.1752913398793348
              ],
              "variance": 0.13637678529768138,
              "mean_reward": -1.2545543275319793,
              "min_reward": -1.3282614982930838,
              "max_reward": -1.1752913398793348,
              "num_responses": 7,
              "rvariance": 0.00292269531331377
            },
            {
              "id": "chat_hard_sample_313",
              "rewards": [
                -0.3205597767652226,
                -0.4208114060081316,
                -0.24796376938242645,
                -0.48303655519338545,
                -0.2168511947897995,
                -0.14425518740700335,
                -0.08203003822174948
              ],
              "variance": 0.32633633794933137,
              "mean_reward": -0.27364398968110265,
              "min_reward": -0.48303655519338545,
              "max_reward": -0.08203003822174948,
              "num_responses": 7,
              "rvariance": 0.017863835687408382
            },
            {
              "id": "chat_hard_sample_226",
              "rewards": [
                1.376804014899202,
                1.0864199853680174,
                1.0172809307177353,
                1.141731229088243,
                1.0172809307177353,
                1.570393367919992,
                1.0172809307177353
              ],
              "variance": 0.4369588253897827,
              "mean_reward": 1.1753130556326659,
              "min_reward": 1.0172809307177353,
              "max_reward": 1.570393367919992,
              "num_responses": 7,
              "rvariance": 0.04009131919338859
            },
            {
              "id": "chat_hard_sample_28",
              "rewards": [
                0.2844069514247455,
                0.7199829957215225,
                0.6854134683963815,
                0.7268969011865507,
                0.8236915776969456,
                0.7130690902564942,
                0.8928306323472277
              ],
              "variance": 0.32633633794933126,
              "mean_reward": 0.6923273738614096,
              "min_reward": 0.2844069514247455,
              "max_reward": 0.8928306323472277,
              "num_responses": 7,
              "rvariance": 0.03232786975448975
            },
            {
              "id": "chat_hard_sample_323",
              "rewards": [
                1.4321152586194277,
                1.9437442630315152,
                1.8192939646610076,
                2.2203004816326435
              ],
              "variance": 0.5890647456204035,
              "mean_reward": 1.8538634919861483,
              "min_reward": 1.4321152586194277,
              "max_reward": 2.2203004816326435,
              "num_responses": 4,
              "rvariance": 0.08035531123808219
            },
            {
              "id": "chat_hard_sample_116",
              "rewards": [
                -0.6524272390865765,
                0.028592449218701823,
                -0.15808299833705974,
                0.09081759840395569,
                0.27057914049468906,
                0.11847322026406851,
                0.09081759840395569
              ],
              "variance": 0.5351362829931832,
              "mean_reward": -0.030175747234037924,
              "min_reward": -0.6524272390865765,
              "max_reward": 0.27057914049468906,
              "num_responses": 7,
              "rvariance": 0.07840566890286735
            },
            {
              "id": "chat_hard_sample_36",
              "rewards": [
                0.4088572497952532,
                0.5194797372357045,
                0.8651750104871149,
                0.7061551847914661,
                0.8928306323472277,
                1.0311087416477918,
                0.8928306323472277
              ],
              "variance": 0.4729111338079294,
              "mean_reward": 0.7594910269502552,
              "min_reward": 0.4088572497952532,
              "max_reward": 1.0311087416477918,
              "num_responses": 7,
              "rvariance": 0.0434140521399693
            },
            {
              "id": "chat_hard_sample_351",
              "rewards": [
                -0.3724140677529342,
                -0.4450100751357303,
                0.24292351863457623,
                0.01476463828864541,
                0.2844069514247455,
                0.19452618037937877,
                0.2221818022394916
              ],
              "variance": 0.6609693624566966,
              "mean_reward": 0.020196992582596145,
              "min_reward": -0.4450100751357303,
              "max_reward": 0.2844069514247455,
              "num_responses": 7,
              "rvariance": 0.08017044397637428
            },
            {
              "id": "chat_hard_sample_296",
              "rewards": [
                -0.5418047516461252,
                -0.1027717546168341,
                -0.24796376938242645,
                -0.465751791530815,
                -0.5348908461810971,
                -0.16499690380208795
              ],
              "variance": 0.40446346970415015,
              "mean_reward": -0.3430299695265642,
              "min_reward": -0.5418047516461252,
              "max_reward": -0.1027717546168341,
              "num_responses": 6,
              "rvariance": 0.0316400033876798
            },
            {
              "id": "chat_hard_sample_338",
              "rewards": [
                -1.3455462619556542,
                -1.5201223749476165,
                -1.2781356836716293,
                -1.185662198076877,
                -1.4578972257623626,
                -1.1718343871468206,
                -1.333446927391855
              ],
              "variance": 0.3026562117316096,
              "mean_reward": -1.3275207227075452,
              "min_reward": -1.5201223749476165,
              "max_reward": -1.1718343871468206,
              "num_responses": 7,
              "rvariance": 0.014464918161835575
            },
            {
              "id": "chat_hard_sample_354",
              "rewards": [
                0.15304274758920955,
                0.2152678967744634,
                0.3881155334001686,
                0.2221818022394916,
                0.3466321006099993,
                0.12538712572909672,
                0.049334165613786445
              ],
              "variance": 0.26825953204309444,
              "mean_reward": 0.2142801959937451,
              "min_reward": 0.049334165613786445,
              "max_reward": 0.3881155334001686,
              "num_responses": 7,
              "rvariance": 0.012379765441018617
            },
            {
              "id": "chat_hard_sample_186",
              "rewards": [
                0.4918241153755917,
                0.38120162793514034,
                0.2290957077045198,
                0.39502943886519676,
                0.3535460060750275,
                0.47799630444553526
              ],
              "variance": 0.19358935302078978,
              "mean_reward": 0.3881155334001685,
              "min_reward": 0.2290957077045198,
              "max_reward": 0.4918241153755917,
              "num_responses": 6,
              "rvariance": 0.007568664056729926
            },
            {
              "id": "chat_hard_sample_54",
              "rewards": [
                0.637016130141184,
                1.100247796298074,
                0.837519388627002,
                0.9757974979275661,
                0.9481418760674533,
                1.0172809307177353,
                1.1279034181581866
              ],
              "variance": 0.3539919598094441,
              "mean_reward": 0.9491295768481715,
              "min_reward": 0.637016130141184,
              "max_reward": 1.1279034181581866,
              "num_responses": 7,
              "rvariance": 0.024289314416901613
            },
            {
              "id": "chat_hard_sample_241",
              "rewards": [
                -0.3101889185676803,
                -0.299818060370138,
                -0.25142072211494054,
                -0.26524853304499696,
                -0.25487767484745466,
                -0.20993728932477132,
                -0.24450681664991233
              ],
              "variance": 0.07328739792929898,
              "mean_reward": -0.262285430702842,
              "min_reward": -0.3101889185676803,
              "max_reward": -0.20993728932477132,
              "num_responses": 7,
              "rvariance": 0.0009916494539633901
            },
            {
              "id": "chat_hard_sample_67",
              "rewards": [
                0.38120162793514034,
                0.6784995629313533,
                0.5609631700258737,
                0.5194797372357045,
                0.5194797372357045,
                0.7061551847914661,
                0.7683803339767199
              ],
              "variance": 0.2668767509500888,
              "mean_reward": 0.5905941934474231,
              "min_reward": 0.38120162793514034,
              "max_reward": 0.7683803339767199,
              "num_responses": 7,
              "rvariance": 0.015361054896318295
            },
            {
              "id": "chat_hard_sample_262",
              "rewards": [
                0.6646717520012968,
                0.837519388627002,
                1.003453119787679,
                0.7130690902564942,
                1.0311087416477918,
                1.1693868509483558,
                1.1279034181581866
              ],
              "variance": 0.45078663631983906,
              "mean_reward": 0.935301765918115,
              "min_reward": 0.6646717520012968,
              "max_reward": 1.1693868509483558,
              "num_responses": 7,
              "rvariance": 0.03398630956928341
            },
            {
              "id": "chat_hard_sample_244",
              "rewards": [
                -1.0305314442053066,
                -1.0342584713700484,
                -1.033718322505593,
                -0.8261391138954102,
                -1.1251655252578803,
                -0.766506679259542,
                -0.7837914429221124
              ],
              "variance": 0.29374375546809706,
              "mean_reward": -0.942872999916556,
              "min_reward": -1.1251655252578803,
              "max_reward": -0.766506679259542,
              "num_responses": 7,
              "rvariance": 0.01822250938042737
            },
            {
              "id": "chat_hard_sample_85",
              "rewards": [
                1.2246980946685815,
                1.5289099351298228,
                1.4874265023396533,
                1.6118768007101612,
                1.1970424728084688,
                1.3906318258292585,
                1.6257046116402176
              ],
              "variance": 0.40377207915764735,
              "mean_reward": 1.438041463303738,
              "min_reward": 1.1970424728084688,
              "max_reward": 1.6257046116402176,
              "num_responses": 7,
              "rvariance": 0.02599653187330687
            },
            {
              "id": "chat_hard_sample_398",
              "rewards": [
                0.37428772247011216,
                -0.9510215313574822,
                -0.9510215313574822,
                -1.0815214970098896,
                -1.0864908665628785,
                -0.9510215313574822,
                -1.3092482582642562
              ],
              "variance": 0.7546959934169855,
              "mean_reward": -0.8508624990627656,
              "min_reward": -1.3092482582642562,
              "max_reward": 0.37428772247011216,
              "num_responses": 7,
              "rvariance": 0.2642757665308812
            },
            {
              "id": "chat_hard_sample_319",
              "rewards": [
                -1.0370132305787705,
                -0.9531821268153036,
                -0.968738414111617,
                -1.034420516029385,
                -1.3974005529433657,
                -1.3870296947458234,
                -0.9909925473271766
              ],
              "variance": 0.42866213883174875,
              "mean_reward": -1.1098252975073488,
              "min_reward": -1.3974005529433657,
              "max_reward": -0.9531821268153036,
              "num_responses": 7,
              "rvariance": 0.032727585379106985
            },
            {
              "id": "chat_hard_sample_190",
              "rewards": [
                -0.08203003822174948,
                -0.24796376938242645,
                0.08390369293892748,
                0.028592449218701823,
                -0.019804889036495625,
                0.14612884212418134
              ],
              "variance": 0.2800131713336424,
              "mean_reward": -0.015195618726476826,
              "min_reward": -0.24796376938242645,
              "max_reward": 0.14612884212418134,
              "num_responses": 6,
              "rvariance": 0.016072124516255972
            },
            {
              "id": "chat_hard_sample_20",
              "rewards": [
                0.5540492645608456,
                0.5747909809559302,
                0.5817048864209583,
                0.9619696869975097,
                0.5333075481657609,
                0.837519388627002,
                0.8651750104871149
              ],
              "variance": 0.3581403030884611,
              "mean_reward": 0.7012166808878745,
              "min_reward": 0.5333075481657609,
              "max_reward": 0.9619696869975097,
              "num_responses": 7,
              "rvariance": 0.027653020582436072
            },
            {
              "id": "chat_hard_sample_264",
              "rewards": [
                0.049334165613786445,
                0.505651926305648,
                0.4226850607253096,
                0.028592449218701823,
                0.27057914049468906,
                0.37428772247011216,
                0.3328042896799429
              ],
              "variance": 0.4148343279016924,
              "mean_reward": 0.2834192506440272,
              "min_reward": 0.028592449218701823,
              "max_reward": 0.505651926305648,
              "num_responses": 7,
              "rvariance": 0.028482240489832895
            },
            {
              "id": "chat_hard_sample_27",
              "rewards": [
                0.837519388627002,
                1.0449365525778482,
                1.1970424728084688,
                1.1693868509483558,
                1.1832146618784123,
                1.238525905598638,
                1.2108702837385252
              ],
              "variance": 0.25996284548506055,
              "mean_reward": 1.12592801659675,
              "min_reward": 0.837519388627002,
              "max_reward": 1.238525905598638,
              "num_responses": 7,
              "rvariance": 0.017122903311328496
            },
            {
              "id": "chat_hard_sample_115",
              "rewards": [
                -0.8097185884159682,
                -0.8408311630085952,
                -0.7388510573994291,
                -1.0039561200741045,
                -0.5383477989136112,
                -0.8114470647822253,
                -0.8702152612349651
              ],
              "variance": 0.265061850765519,
              "mean_reward": -0.8019095791184141,
              "min_reward": -1.0039561200741045,
              "max_reward": -0.5383477989136112,
              "num_responses": 7,
              "rvariance": 0.017228070574170345
            },
            {
              "id": "chat_hard_sample_260",
              "rewards": [
                0.29132085688977366,
                0.6301022246761558,
                0.6992412793264379,
                0.5194797372357045,
                0.7407247121166071,
                0.5817048864209583,
                0.7960359558368327
              ],
              "variance": 0.3346330245073652,
              "mean_reward": 0.6083728075003528,
              "min_reward": 0.29132085688977366,
              "max_reward": 0.7960359558368327,
              "num_responses": 7,
              "rvariance": 0.024371260854809063
            },
            {
              "id": "chat_hard_sample_175",
              "rewards": [
                -0.019804889036495625,
                0.8513471995570584,
                0.5194797372357045,
                0.5609631700258737,
                0.7683803339767199,
                0.5471353590958173,
                0.3466321006099993
              ],
              "variance": 0.601509775457454,
              "mean_reward": 0.5105904302092397,
              "min_reward": -0.019804889036495625,
              "max_reward": 0.8513471995570584,
              "num_responses": 7,
              "rvariance": 0.07067490048384827
            },
            {
              "id": "chat_hard_sample_200",
              "rewards": [
                0.8651750104871149,
                1.0311087416477918,
                0.8790028214171712,
                0.837519388627002
              ],
              "variance": 0.13966089039356977,
              "mean_reward": 0.9032014905447701,
              "min_reward": 0.837519388627002,
              "max_reward": 1.0311087416477918,
              "num_responses": 4,
              "rvariance": 0.005676498042547442
            },
            {
              "id": "chat_hard_sample_240",
              "rewards": [
                -0.5210630352510406,
                -0.5452617043786393,
                -0.7077384828068022,
                -0.4899504606584137
              ],
              "variance": 0.15971121624215157,
              "mean_reward": -0.5660034207737239,
              "min_reward": -0.7077384828068022,
              "max_reward": -0.4899504606584137,
              "num_responses": 4,
              "rvariance": 0.00708068440044076
            },
            {
              "id": "chat_hard_sample_130",
              "rewards": [
                0.10464540933401209,
                -0.04746051089660845,
                0.2152678967744634,
                0.45725458805045066,
                0.2083539913094352,
                0.3189764787498865,
                0.13921493665915313
              ],
              "variance": 0.33048468122834834,
              "mean_reward": 0.19946468428297037,
              "min_reward": -0.04746051089660845,
              "max_reward": 0.45725458805045066,
              "num_responses": 7,
              "rvariance": 0.02209432054438058
            },
            {
              "id": "chat_hard_sample_374",
              "rewards": [
                0.8513471995570584,
                0.671585657466325,
                0.7822081449067764,
                0.7130690902564942,
                0.9619696869975097,
                1.003453119787679,
                0.837519388627002
              ],
              "variance": 0.28208734297315097,
              "mean_reward": 0.8315931839426921,
              "min_reward": 0.671585657466325,
              "max_reward": 1.003453119787679,
              "num_responses": 7,
              "rvariance": 0.012721208932299671
            },
            {
              "id": "chat_hard_sample_257",
              "rewards": [
                -0.7405795337656862,
                -0.7958907774859119,
                -0.8287318284447958,
                -0.919476837673291,
                -0.8097185884159682,
                -0.766506679259542,
                -0.8295960666279243
              ],
              "variance": 0.10941255398407135,
              "mean_reward": -0.8129286159533028,
              "min_reward": -0.919476837673291,
              "max_reward": -0.7405795337656862,
              "num_responses": 7,
              "rvariance": 0.0027957210149936263
            },
            {
              "id": "chat_hard_sample_237",
              "rewards": [
                -0.11659956554689052,
                -0.2583346275799688,
                0.18069836944932238,
                -0.1027717546168341,
                0.07007588200887106,
                0.07698978747389927,
                0.18761227491435056
              ],
              "variance": 0.35675752199545546,
              "mean_reward": 0.005381480871821419,
              "min_reward": -0.2583346275799688,
              "max_reward": 0.18761227491435056,
              "num_responses": 7,
              "rvariance": 0.02419712467425574
            },
            {
              "id": "chat_hard_sample_22",
              "rewards": [
                0.24983742409960444,
                0.837519388627002,
                0.7061551847914661,
                0.6508439410712404,
                0.9066584432772841
              ],
              "variance": 0.46876279052891234,
              "mean_reward": 0.6702028763733194,
              "min_reward": 0.24983742409960444,
              "max_reward": 0.9066584432772841,
              "num_responses": 5,
              "rvariance": 0.052456100142904125
            },
            {
              "id": "chat_hard_sample_292",
              "rewards": [
                -0.5936590426338367,
                -0.5625464680412099,
                -0.5832881844362945,
                -0.5902020899013227,
                -0.4208114060081316,
                -0.49340741339092775,
                -0.5625464680412099
              ],
              "variance": 0.12721586055651907,
              "mean_reward": -0.5437801532075619,
              "min_reward": -0.5936590426338367,
              "max_reward": -0.4208114060081316,
              "num_responses": 7,
              "rvariance": 0.0035095513139530724
            },
            {
              "id": "chat_hard_sample_92",
              "rewards": [
                0.837519388627002,
                1.1970424728084688,
                0.671585657466325,
                0.837519388627002,
                1.0864199853680174,
                0.7545525230466635
              ],
              "variance": 0.42866213883174886,
              "mean_reward": 0.8974399026572465,
              "min_reward": 0.671585657466325,
              "max_reward": 1.1970424728084688,
              "num_responses": 6,
              "rvariance": 0.03401384183810417
            },
            {
              "id": "chat_hard_sample_407",
              "rewards": [
                -0.7613212501607708,
                -0.5106921770534983,
                -0.6368709517902631,
                -0.8486093066567519,
                -0.6506987627203195
              ],
              "variance": 0.25253039711015535,
              "mean_reward": -0.6816384896763208,
              "min_reward": -0.8486093066567519,
              "max_reward": -0.5106921770534983,
              "num_responses": 5,
              "rvariance": 0.013282527398673227
            },
            {
              "id": "chat_hard_sample_44",
              "rewards": [
                -2.0317513793597035,
                -1.9626123247094216,
                -2.0248374738946753,
                -1.8900163173266253,
                -1.8658176481990265,
                -1.9971818520345626
              ],
              "variance": 0.15037744386436347,
              "mean_reward": -1.9620361659206693,
              "min_reward": -2.0317513793597035,
              "max_reward": -1.8658176481990265,
              "num_responses": 6,
              "rvariance": 0.004080771370586885
            },
            {
              "id": "chat_hard_sample_119",
              "rewards": [
                -0.16499690380208795,
                0.07698978747389927,
                0.007850732823617203,
                -0.23413595845237004,
                0.2152678967744634
              ],
              "variance": 0.36643698964649496,
              "mean_reward": -0.01980488903649562,
              "min_reward": -0.23413595845237004,
              "max_reward": 0.2152678967744634,
              "num_responses": 5,
              "rvariance": 0.02648235718375818
            },
            {
              "id": "chat_hard_sample_303",
              "rewards": [
                -0.5383477989136112,
                -0.6921821955104888,
                -0.1822816674646585,
                -0.3240167294977367,
                -0.34821539862533546,
                -0.4138975005431034,
                -0.3620432095553919
              ],
              "variance": 0.3325588528678568,
              "mean_reward": -0.4087120714443323,
              "min_reward": -0.6921821955104888,
              "max_reward": -0.1822816674646585,
              "num_responses": 7,
              "rvariance": 0.02306706866221949
            },
            {
              "id": "chat_hard_sample_365",
              "rewards": [
                -1.7517382080260613,
                -1.6480296260506382,
                -1.7932216408162305,
                -1.6549435315156664,
                -1.6134600987254972
              ],
              "variance": 0.1493403580446091,
              "mean_reward": -1.6922786210268188,
              "min_reward": -1.7932216408162305,
              "max_reward": -1.6134600987254972,
              "num_responses": 5,
              "rvariance": 0.004657835530659558
            },
            {
              "id": "chat_hard_sample_45",
              "rewards": [
                -0.3413014931603072,
                -0.23067900571985592,
                -0.08894394368677769,
                -0.04746051089660845,
                -0.11659956554689052,
                -0.15116909287203156,
                -0.15116909287203156
              ],
              "variance": 0.20257743012532642,
              "mean_reward": -0.1610461006792147,
              "min_reward": -0.3413014931603072,
              "max_reward": -0.04746051089660845,
              "num_responses": 7,
              "rvariance": 0.008230251469121635
            },
            {
              "id": "chat_hard_sample_78",
              "rewards": [
                -0.08203003822174948,
                0.436512871655366,
                -0.14425518740700335,
                0.505651926305648
              ],
              "variance": 0.6104978525619906,
              "mean_reward": 0.1789698930830653,
              "min_reward": -0.14425518740700335,
              "max_reward": 0.505651926305648,
              "num_responses": 4,
              "rvariance": 0.08641123836031564
            },
            {
              "id": "chat_hard_sample_189",
              "rewards": [
                1.0172809307177353,
                1.072592174437961,
                1.1970424728084688,
                1.266181527458751
              ],
              "variance": 0.21156550722986323,
              "mean_reward": 1.138274276355729,
              "min_reward": 1.0172809307177353,
              "max_reward": 1.266181527458751,
              "num_responses": 4,
              "rvariance": 0.009691873500012597
            },
            {
              "id": "chat_hard_sample_39",
              "rewards": [
                0.436512871655366,
                0.39502943886519676,
                -0.16845385653460207,
                0.5540492645608456,
                1.0449365525778482
              ],
              "variance": 0.7916421757457297,
              "mean_reward": 0.4524148542249309,
              "min_reward": -0.16845385653460207,
              "max_reward": 1.0449365525778482,
              "num_responses": 5,
              "rvariance": 0.15008708626584225
            },
            {
              "id": "chat_hard_sample_387",
              "rewards": [
                -0.8633013557699368,
                -0.8572516884880371,
                -0.5660034207737239,
                -0.8010762065846829,
                -0.8883642630806641,
                -0.7198378173706016,
                -0.6144007590289214
              ],
              "variance": 0.2782846949673853,
              "mean_reward": -0.7586050730137953,
              "min_reward": -0.8883642630806641,
              "max_reward": -0.5660034207737239,
              "num_responses": 7,
              "rvariance": 0.01410384166980586
            },
            {
              "id": "chat_hard_sample_118",
              "rewards": [
                -0.1027717546168341,
                0.15304274758920955,
                0.10464540933401209,
                0.1115593147990403,
                0.12538712572909672,
                0.16687055851926597
              ],
              "variance": 0.15901982569564876,
              "mean_reward": 0.0931222335589651,
              "min_reward": -0.1027717546168341,
              "max_reward": 0.16687055851926597,
              "num_responses": 6,
              "rvariance": 0.0081529118084775
            },
            {
              "id": "chat_hard_sample_154",
              "rewards": [
                -0.6558841918190906,
                -0.6835398136792035,
                -0.6057583771976361,
                -0.6057583771976361,
                -0.66798352638289,
                -0.6627980972841189,
                -0.6316855226914919
              ],
              "variance": 0.06844766410377923,
              "mean_reward": -0.6447725580360096,
              "min_reward": -0.6835398136792035,
              "max_reward": -0.6057583771976361,
              "num_responses": 7,
              "rvariance": 0.0008150743913294766
            },
            {
              "id": "chat_hard_sample_103",
              "rewards": [
                -0.13734128194197515,
                -0.600572948098865,
                -0.17882471473214437,
                -0.12351347101191873,
                -0.4795796024608714,
                -0.3032750131026521,
                -0.1961094783947149
              ],
              "variance": 0.39616678314611625,
              "mean_reward": -0.28845950139187737,
              "min_reward": -0.600572948098865,
              "max_reward": -0.12351347101191873,
              "num_responses": 7,
              "rvariance": 0.02925048834521526
            },
            {
              "id": "chat_hard_sample_162",
              "rewards": [
                0.6923273738614096,
                0.5817048864209583,
                0.5678770754909019,
                0.6577578465362687
              ],
              "variance": 0.10993109689394853,
              "mean_reward": 0.6249167955773847,
              "min_reward": 0.5678770754909019,
              "max_reward": 0.6923273738614096,
              "num_responses": 4,
              "rvariance": 0.0026858798632895553
            },
            {
              "id": "chat_hard_sample_321",
              "rewards": [
                0.7960359558368327,
                1.1279034181581866,
                1.238525905598638,
                1.2108702837385252,
                1.4321152586194277,
                1.1970424728084688,
                1.266181527458751
              ],
              "variance": 0.3373985866933765,
              "mean_reward": 1.181239260316976,
              "min_reward": 0.7960359558368327,
              "max_reward": 1.4321152586194277,
              "num_responses": 7,
              "rvariance": 0.032255678844904614
            },
            {
              "id": "chat_hard_sample_273",
              "rewards": [
                0.33971819514497115,
                0.33971819514497115,
                0.33971819514497115,
                -0.1891955729296867,
                0.33971819514497115,
                -0.1891955729296867,
                0.33971819514497115
              ],
              "variance": 0.5289137680746578,
              "mean_reward": 0.1885999756950689,
              "min_reward": -0.1891955729296867,
              "max_reward": 0.33971819514497115,
              "num_responses": 7,
              "rvariance": 0.05709179062427204
            },
            {
              "id": "chat_hard_sample_291",
              "rewards": [
                1.2246980946685815,
                1.3629762039691458,
                1.473598691409597,
                1.5289099351298228,
                1.5150821241997663,
                1.708671477220556,
                2.2203004816326435
              ],
              "variance": 0.6056581187364711,
              "mean_reward": 1.5763195726043018,
              "min_reward": 1.2246980946685815,
              "max_reward": 2.2203004816326435,
              "num_responses": 7,
              "rvariance": 0.08827582468297028
            },
            {
              "id": "chat_hard_sample_312",
              "rewards": [
                -0.2790763439750534,
                -0.6541557154528336,
                0.03550635468373003,
                0.007850732823617203,
                -0.2030233838597431,
                0.25675132956463265,
                -0.2237651002548277
              ],
              "variance": 0.5531124372022566,
              "mean_reward": -0.1514160180672111,
              "min_reward": -0.6541557154528336,
              "max_reward": 0.25675132956463265,
              "num_responses": 7,
              "rvariance": 0.07197836101181367
            },
            {
              "id": "chat_hard_sample_314",
              "rewards": [
                -1.6307448623880678,
                -1.437155509367278,
                -1.3870296947458234,
                -1.568519713202814,
                -1.606546193260469,
                -1.4959237058200177
              ],
              "variance": 0.20655292576771767,
              "mean_reward": -1.5209866131307448,
              "min_reward": -1.6307448623880678,
              "max_reward": -1.3870296947458234,
              "num_responses": 6,
              "rvariance": 0.007871161649786731
            },
            {
              "id": "chat_hard_sample_399",
              "rewards": [
                0.24983742409960444,
                0.8651750104871149,
                0.8651750104871149,
                0.4503406825854224,
                0.7683803339767199,
                0.4226850607253096,
                0.7960359558368327
              ],
              "variance": 0.5116290044120873,
              "mean_reward": 0.6310899254568741,
              "min_reward": 0.24983742409960444,
              "max_reward": 0.8651750104871149,
              "num_responses": 7,
              "rvariance": 0.05387197850149173
            },
            {
              "id": "chat_hard_sample_219",
              "rewards": [
                -1.2141820581201184,
                -1.3075197818979991,
                -1.2608509200090587,
                -1.3438177855893971,
                -1.2591224436428017,
                -1.2115893435707328,
                -1.2210959635851466
              ],
              "variance": 0.10889401107419405,
              "mean_reward": -1.2597397566307507,
              "min_reward": -1.3438177855893971,
              "max_reward": -1.2115893435707328,
              "num_responses": 7,
              "rvariance": 0.002177281491410823
            },
            {
              "id": "chat_hard_sample_406",
              "rewards": [
                -1.0765521274569005,
                -1.0988062606724602,
                -1.0063327750777078,
                -1.2357880126983314,
                -0.9030563121938491,
                -1.0923244742989962,
                -0.9957458573343834
              ],
              "variance": 0.19492892220463898,
              "mean_reward": -1.058372259961804,
              "min_reward": -1.2357880126983314,
              "max_reward": -0.9030563121938491,
              "num_responses": 7,
              "rvariance": 0.009335390871026836
            },
            {
              "id": "chat_hard_sample_253",
              "rewards": [
                0.8651750104871149,
                1.2246980946685815,
                1.0587643635079047,
                0.837519388627002,
                0.8651750104871149,
                0.9481418760674533,
                0.9343140651373969
              ],
              "variance": 0.2710250942291057,
              "mean_reward": 0.9619696869975096,
              "min_reward": 0.837519388627002,
              "max_reward": 1.2246980946685815,
              "num_responses": 7,
              "rvariance": 0.016225394705675456
            },
            {
              "id": "chat_hard_sample_24",
              "rewards": [
                1.1555590400182996,
                1.5150821241997663,
                1.5842211788500484,
                1.4321152586194277,
                1.3214927711789766,
                1.2800093383888071
              ],
              "variance": 0.331867462321354,
              "mean_reward": 1.381413285209221,
              "min_reward": 1.1555590400182996,
              "max_reward": 1.5842211788500484,
              "num_responses": 6,
              "rvariance": 0.021075409808494285
            },
            {
              "id": "chat_hard_sample_60",
              "rewards": [
                1.003453119787679,
                1.003453119787679,
                1.0864199853680174,
                1.3906318258292585,
                1.2800093383888071,
                1.2800093383888071,
                1.266181527458751
              ],
              "variance": 0.32080521357730873,
              "mean_reward": 1.1871654650012857,
              "min_reward": 1.003453119787679,
              "max_reward": 1.3906318258292585,
              "num_responses": 7,
              "rvariance": 0.020361738714337305
            },
            {
              "id": "chat_hard_sample_386",
              "rewards": [
                -1.3213475928280556,
                -1.2850495891366573,
                -1.253072776360902,
                -1.189119150809391,
                -1.1951688180912907,
                -1.141153931645758
              ],
              "variance": 0.13806204975478198,
              "mean_reward": -1.2308186431453425,
              "min_reward": -1.3213475928280556,
              "max_reward": -1.141153931645758,
              "num_responses": 6,
              "rvariance": 0.0037802084757847126
            },
            {
              "id": "chat_hard_sample_216",
              "rewards": [
                -1.9245858446517663,
                -1.5166654222151024,
                -1.9418706083143369,
                -1.5166654222151024,
                -1.6307448623880678,
                -1.6411157205856102
              ],
              "variance": 0.4165628042679492,
              "mean_reward": -1.6952746467283308,
              "min_reward": -1.9418706083143369,
              "max_reward": -1.5166654222151024,
              "num_responses": 6,
              "rvariance": 0.0307154977123292
            },
            {
              "id": "chat_hard_sample_300",
              "rewards": [
                1.2246980946685815,
                1.1832146618784123,
                1.4597708804795406,
                1.6810158553604433,
                1.5565655569899355,
                1.4597708804795406,
                1.6257046116402176
              ],
              "variance": 0.43972438757579413,
              "mean_reward": 1.4558200773566674,
              "min_reward": 1.1832146618784123,
              "max_reward": 1.6810158553604433,
              "num_responses": 7,
              "rvariance": 0.03106940660091104
            },
            {
              "id": "chat_hard_sample_352",
              "rewards": [
                -0.8961424067288208,
                -0.5763742789712663,
                -0.7872483956546266,
                -0.3966127368805329,
                -0.36895711502042006,
                -0.5971159953663508
              ],
              "variance": 0.45891047524124723,
              "mean_reward": -0.6037418214370028,
              "min_reward": -0.8961424067288208,
              "max_reward": -0.36895711502042006,
              "num_responses": 6,
              "rvariance": 0.03633199417469011
            },
            {
              "id": "chat_hard_sample_311",
              "rewards": [
                -1.734453444363491,
                -1.8519898372689703,
                -1.737910397096005,
                -1.6860561061082935,
                -1.5546919022727574,
                -1.7033408697708639,
                -1.4665396075936479
              ],
              "variance": 0.26411118876407746,
              "mean_reward": -1.67642602349629,
              "min_reward": -1.8519898372689703,
              "max_reward": -1.4665396075936479,
              "num_responses": 7,
              "rvariance": 0.013951259109639642
            },
            {
              "id": "chat_hard_sample_419",
              "rewards": [
                -0.22030814752231362,
                -0.4795796024608714,
                -0.3620432095553919,
                -0.3067319658351662,
                -0.3378445404277931,
                -0.35858625682287776,
                -0.26524853304499696
              ],
              "variance": 0.16178538788166005,
              "mean_reward": -0.33290603652420153,
              "min_reward": -0.4795796024608714,
              "max_reward": -0.22030814752231362,
              "num_responses": 7,
              "rvariance": 0.005855268099053881
            },
            {
              "id": "chat_hard_sample_287",
              "rewards": [
                -2.301393692495804,
                -2.2322546378455215,
                -2.1008904340099854,
                -2.4673274236564806,
                -2.252996354240606,
                -2.3083075979608316,
                -2.1838572995903243
              ],
              "variance": 0.22124497488090222,
              "mean_reward": -2.2638610628285076,
              "min_reward": -2.4673274236564806,
              "max_reward": -2.1008904340099854,
              "num_responses": 7,
              "rvariance": 0.011265684106610174
            },
            {
              "id": "chat_hard_sample_55",
              "rewards": [
                -1.2271456308670463,
                -1.3628310256182248,
                -1.1580065762167642,
                -1.0647768822117745,
                -1.3006058764329709,
                -1.1234370488916232,
                -1.2081323908382187
              ],
              "variance": 0.22552295388738863,
              "mean_reward": -1.2064193472966604,
              "min_reward": -1.3628310256182248,
              "max_reward": -1.0647768822117745,
              "num_responses": 7,
              "rvariance": 0.009008667843209875
            }
          ]
        },
        "semantic_benchmark_reasoning_filtered.json": {
          "file_name": "semantic_benchmark_reasoning_filtered.json",
          "processed_samples": 200,
          "global_mean": 1.9668792564895803,
          "global_std": 1.6843877269424294,
          "mean_variance": 0.5285187021400479,
          "mean_rvariance": 0.0765641875959744,
          "sample_results": [
            {
              "id": "reasoning_sample_9",
              "rewards": [
                1.4296712716387103,
                1.5224349492057698,
                1.6337513622862414,
                0.6875618511022332,
                0.5762454380217616,
                1.6337513622862414,
                1.6523040977996533
              ],
              "variance": 0.9981371706215616,
              "mean_reward": 1.305102904620087,
              "min_reward": 0.5762454380217616,
              "max_reward": 1.6523040977996533,
              "num_responses": 7,
              "rvariance": 0.18741556300850687
            },
            {
              "id": "reasoning_sample_5",
              "rewards": [
                -0.045271201677537856,
                -0.1333966953662445,
                0.19591435999681717,
                0.07532157915963966,
                -0.14267306312295047
              ],
              "variance": 0.2866397636822142,
              "mean_reward": -0.010021004202055196,
              "min_reward": -0.14267306312295047,
              "max_reward": 0.19591435999681717,
              "num_responses": 5,
              "rvariance": 0.016750687418164927
            },
            {
              "id": "reasoning_sample_85",
              "rewards": [
                -0.4534313829726002,
                -1.0274066379187816,
                -1.4413645490617852,
                -0.5925768993231897
              ],
              "variance": 0.8220021378411071,
              "mean_reward": -0.8786948673190891,
              "min_reward": -1.4413645490617852,
              "max_reward": -0.4534313829726002,
              "num_responses": 4,
              "rvariance": 0.15035622104898536
            },
            {
              "id": "reasoning_sample_65",
              "rewards": [
                0.242296198780347,
                0.37216534737423046,
                -0.8523151965109567,
                -0.863910656206839,
                0.733943689885763,
                -0.8314433690583682,
                0.12170341794316948
              ],
              "variance": 1.3738300647681532,
              "mean_reward": -0.15393722397037912,
              "min_reward": -0.863910656206839,
              "max_reward": 0.733943689885763,
              "num_responses": 7,
              "rvariance": 0.3927005378840272
            },
            {
              "id": "reasoning_sample_256",
              "rewards": [
                -0.9589934257130752,
                -2.1278157630580266,
                -0.8175288174233093,
                -2.549890495988148
              ],
              "variance": 1.5632998761988726,
              "mean_reward": -1.6135571255456398,
              "min_reward": -2.549890495988148,
              "max_reward": -0.8175288174233093,
              "num_responses": 4,
              "rvariance": 0.5508242078327298
            },
            {
              "id": "reasoning_sample_263",
              "rewards": [
                -0.003527546772361022,
                0.7524964253991749,
                0.047492475889521775,
                0.30723077307728874,
                -0.21688400517659817,
                0.6690091155888213
              ],
              "variance": 0.8209585464684777,
              "mean_reward": 0.2593028730009746,
              "min_reward": -0.21688400517659817,
              "max_reward": 0.7524964253991749,
              "num_responses": 6,
              "rvariance": 0.1256822642965958
            },
            {
              "id": "reasoning_sample_203",
              "rewards": [
                -0.754913335065544,
                -1.601381892864963,
                0.015025188741050903,
                -1.5573191460206097,
                -1.5573191460206097,
                0.015025188741050903
              ],
              "variance": 1.5943757081838372,
              "mean_reward": -0.9068138570816041,
              "min_reward": -1.601381892864963,
              "max_reward": 0.015025188741050903,
              "num_responses": 6,
              "rvariance": 0.5085645399337315
            },
            {
              "id": "reasoning_sample_61",
              "rewards": [
                0.047492475889521775,
                -0.2818185794735399,
                -0.40241136031071745,
                0.12170341794316948,
                0.9194710450198823,
                0.6411800123187034,
                0.32578350859070065
              ],
              "variance": 1.082552117207586,
              "mean_reward": 0.19591435999681717,
              "min_reward": -0.40241136031071745,
              "max_reward": 0.9194710450198823,
              "num_responses": 7,
              "rvariance": 0.19320293171066708
            },
            {
              "id": "reasoning_sample_319",
              "rewards": [
                0.9380237805332942,
                1.1328275034241193,
                0.34433624410411257,
                1.2441439165045909,
                0.9565765160467061,
                1.1513802389375314
              ],
              "variance": 0.5565820654023578,
              "mean_reward": 0.9612146999250591,
              "min_reward": 0.34433624410411257,
              "max_reward": 1.2441439165045909,
              "num_responses": 6,
              "rvariance": 0.08779353148249651
            },
            {
              "id": "reasoning_sample_528",
              "rewards": [
                -1.4413645490617852,
                -0.8384006448758977,
                -0.9230475006558396,
                -1.1917722791079155,
                -1.397301802217432,
                -1.397301802217432,
                -1.51093730723708
              ],
              "variance": 0.5800048939880403,
              "mean_reward": -1.2428751264819116,
              "min_reward": -1.51093730723708,
              "max_reward": -0.8384006448758977,
              "num_responses": 7,
              "rvariance": 0.06106448535806869
            },
            {
              "id": "reasoning_sample_551",
              "rewards": [
                -1.4297690893659027,
                -1.1772779544880623,
                -1.1216197479478267,
                -0.3096476827436578,
                -1.1762633517646726,
                0.19591435999681717,
                -0.89637794335531
              ],
              "variance": 1.1708515427917308,
              "mean_reward": -0.845005915666945,
              "min_reward": -1.4297690893659027,
              "max_reward": 0.19591435999681717,
              "num_responses": 7,
              "rvariance": 0.2873374173359224
            },
            {
              "id": "reasoning_sample_596",
              "rewards": [
                -1.8216956270867297,
                -0.9787057071960754,
                -1.1924969953389082,
                -1.1924969953389082,
                -0.9787057071960754,
                -0.7270842317954261,
                -0.957833879743487
              ],
              "variance": 0.5786424274737743,
              "mean_reward": -1.1212884490993729,
              "min_reward": -1.8216956270867297,
              "max_reward": -0.7270842317954261,
              "num_responses": 7,
              "rvariance": 0.10335508097888131
            },
            {
              "id": "reasoning_sample_456",
              "rewards": [
                -1.7845901560599058,
                -0.9949393507703108,
                -2.090710292031203,
                -2.0582430048827316
              ],
              "variance": 0.8491355135294723,
              "mean_reward": -1.7321207009360378,
              "min_reward": -2.090710292031203,
              "max_reward": -0.9949393507703108,
              "num_responses": 4,
              "rvariance": 0.19528290968161433
            },
            {
              "id": "reasoning_sample_306",
              "rewards": [
                -0.6807023930118963,
                -1.2143834255148862,
                -1.2259788852107687,
                -1.3404840497076078,
                -1.2627944697451954,
                -0.39313499255401146,
                -0.41632591194577634
              ],
              "variance": 0.8868207575410899,
              "mean_reward": -0.9334005896700203,
              "min_reward": -1.3404840497076078,
              "max_reward": -0.39313499255401146,
              "num_responses": 7,
              "rvariance": 0.15169717158473164
            },
            {
              "id": "reasoning_sample_231",
              "rewards": [
                -1.3138144924070783,
                -1.8031428915733179,
                -0.7781042544573089,
                -0.9033352191728394,
                -0.8453579206934272,
                -0.6899787607686023,
                -0.8105715416057798
              ],
              "variance": 0.7666917950917478,
              "mean_reward": -1.020615011525479,
              "min_reward": -1.8031428915733179,
              "max_reward": -0.6899787607686023,
              "num_responses": 7,
              "rvariance": 0.13643363901240646
            },
            {
              "id": "reasoning_sample_526",
              "rewards": [
                -0.7178078640387202,
                -0.42096409582412936,
                -0.8360815529367212,
                -0.44879319909424725,
                -0.8998565812640746
              ],
              "variance": 0.4422508328009567,
              "mean_reward": -0.6647006586315785,
              "min_reward": -0.8998565812640746,
              "max_reward": -0.42096409582412936,
              "num_responses": 5,
              "rvariance": 0.03870272745623625
            },
            {
              "id": "reasoning_sample_591",
              "rewards": [
                -1.4518004627880794,
                -1.1143725856379,
                -1.076687341626282,
                -1.119590542501047,
                -1.2993201677872253
              ],
              "variance": 0.29904690555680835,
              "mean_reward": -1.2123542200681068,
              "min_reward": -1.4518004627880794,
              "max_reward": -1.076687341626282,
              "num_responses": 5,
              "rvariance": 0.020301716336585084
            },
            {
              "id": "reasoning_sample_23",
              "rewards": [
                0.49275812821140796,
                0.5947981735351736,
                0.23301983102364102,
                0.42782355391446625,
                0.22374346326693506,
                0.40927081840105434
              ],
              "variance": 0.3153965037280028,
              "mean_reward": 0.3969023280587798,
              "min_reward": 0.22374346326693506,
              "max_reward": 0.5947981735351736,
              "num_responses": 6,
              "rvariance": 0.017716944521992545
            },
            {
              "id": "reasoning_sample_275",
              "rewards": [
                -0.3328386021354227,
                -1.3346863198596668,
                0.019663372619403884,
                0.019663372619403884,
                0.019663372619403884,
                0.39071808288764237
              ],
              "variance": 1.038953188751068,
              "mean_reward": -0.20296945354153917,
              "min_reward": -1.3346863198596668,
              "max_reward": 0.39071808288764237,
              "num_responses": 6,
              "rvariance": 0.29980167967166665
            },
            {
              "id": "reasoning_sample_656",
              "rewards": [
                -2.3087049343137926,
                -1.747484685033082,
                -1.8588010981135537,
                -1.8356101787217887
              ],
              "variance": 0.3998114503140269,
              "mean_reward": -1.9376502240455542,
              "min_reward": -2.3087049343137926,
              "max_reward": -1.747484685033082,
              "num_responses": 4,
              "rvariance": 0.04761847143751677
            },
            {
              "id": "reasoning_sample_405",
              "rewards": [
                0.14953252121328736,
                0.7061145866156451,
                0.6504563800754094,
                0.33505987634740664,
                0.5391399669949378,
                0.7988782641827048
              ],
              "variance": 0.5102002266188279,
              "mean_reward": 0.5298635992382318,
              "min_reward": 0.14953252121328736,
              "max_reward": 0.7988782641827048,
              "num_responses": 6,
              "rvariance": 0.0501103649432072
            },
            {
              "id": "reasoning_sample_330",
              "rewards": [
                -1.0581346061128702,
                -1.4900654797844917,
                -1.4564386466664325,
                -0.9265261385646043,
                -1.4344072732442559,
                -1.4900654797844917
              ],
              "variance": 0.49773510744575433,
              "mean_reward": -1.3092729373595244,
              "min_reward": -1.4900654797844917,
              "max_reward": -0.9265261385646043,
              "num_responses": 6,
              "rvariance": 0.05204230136919977
            },
            {
              "id": "reasoning_sample_451",
              "rewards": [
                -1.742846501154729,
                -1.2494596910949307,
                -1.1432162916314077,
                -1.0158111782228991,
                -1.245981053186166,
                -1.090022120276547,
                -2.1510066824497915
              ],
              "variance": 0.8457728302176661,
              "mean_reward": -1.3769062168594959,
              "min_reward": -2.1510066824497915,
              "max_reward": -1.0158111782228991,
              "num_responses": 7,
              "rvariance": 0.14769013298040345
            },
            {
              "id": "reasoning_sample_314",
              "rewards": [
                -0.9601529716826634,
                -0.49981322175613,
                -0.24007492456836307,
                -1.3717917908864905
              ],
              "variance": 0.9303037314006493,
              "mean_reward": -0.7679582272234118,
              "min_reward": -1.3717917908864905,
              "max_reward": -0.24007492456836307,
              "num_responses": 4,
              "rvariance": 0.18802907939571517
            },
            {
              "id": "reasoning_sample_593",
              "rewards": [
                -0.3050094988653048,
                0.1680852567266993,
                0.08459794691634562,
                0.22374346326693506,
                0.17736162448340526
              ],
              "variance": 0.35435724830616777,
              "mean_reward": 0.06975575850561608,
              "min_reward": -0.3050094988653048,
              "max_reward": 0.22374346326693506,
              "num_responses": 5,
              "rvariance": 0.03712584290400226
            },
            {
              "id": "reasoning_sample_599",
              "rewards": [
                -0.3282004182570697,
                0.242296198780347,
                0.39999445064434835,
                0.03821610813281581,
                0.39999445064434835,
                0.39999445064434835,
                0.39999445064434835
              ],
              "variance": 0.5083449530674867,
              "mean_reward": 0.22175567017621237,
              "min_reward": -0.3282004182570697,
              "max_reward": 0.39999445064434835,
              "num_responses": 7,
              "rvariance": 0.06623380497233264
            },
            {
              "id": "reasoning_sample_301",
              "rewards": [
                -1.44484318697055,
                -1.2575765128820484,
                -1.2575765128820484,
                -1.2396035503534306,
                -1.2569967398972541,
                -0.996098896739899,
                -0.9995775346486637
              ],
              "variance": 0.3342971030322912,
              "mean_reward": -1.2074675620534134,
              "min_reward": -1.44484318697055,
              "max_reward": -0.996098896739899,
              "num_responses": 7,
              "rvariance": 0.02182140551196627
            },
            {
              "id": "reasoning_sample_77",
              "rewards": [
                1.2812493875314148,
                1.5409876847191817,
                1.5780931557460056,
                1.745067775366713,
                1.503882213692358,
                1.6337513622862414,
                1.8563841884471846
              ],
              "variance": 0.37476525737092103,
              "mean_reward": 1.591345109684157,
              "min_reward": 1.2812493875314148,
              "max_reward": 1.8563841884471846,
              "num_responses": 7,
              "rvariance": 0.02888503729726313
            },
            {
              "id": "reasoning_sample_511",
              "rewards": [
                -0.32356223437871673,
                -0.24935129232506903,
                -0.10556759209612661,
                -0.10556759209612661,
                -0.17514035027142133,
                0.06604521140293369,
                -0.17514035027142133
              ],
              "variance": 0.24211319845002569,
              "mean_reward": -0.15261202857656397,
              "min_reward": -0.32356223437871673,
              "max_reward": 0.06604521140293369,
              "num_responses": 7,
              "rvariance": 0.013119265024878656
            },
            {
              "id": "reasoning_sample_12",
              "rewards": [
                2.8396791706580164,
                2.988101054765312,
                2.4315189893629543,
                2.7098100220641332,
                2.060464279094716,
                2.245991634228835
              ],
              "variance": 0.760662156049889,
              "mean_reward": 2.5459275250289943,
              "min_reward": 2.060464279094716,
              "max_reward": 2.988101054765312,
              "num_responses": 6,
              "rvariance": 0.10789839122001395
            },
            {
              "id": "reasoning_sample_543",
              "rewards": [
                -0.9821843451048401,
                -0.5786623476881307,
                -0.8766656618723098,
                -0.8708679320243685,
                -0.7108505882211907,
                -0.34211496989212864,
                -0.36530588928389357
              ],
              "variance": 0.5628436136381343,
              "mean_reward": -0.675235962012409,
              "min_reward": -0.9821843451048401,
              "max_reward": -0.34211496989212864,
              "num_responses": 7,
              "rvariance": 0.055812030216545176
            },
            {
              "id": "reasoning_sample_506",
              "rewards": [
                -0.7409987834304851,
                -0.8291242771191917,
                -0.31892405050036376,
                -0.731722415673779,
                -0.3560295215271876,
                -0.4070495441890704,
                -0.24007492456836307
              ],
              "variance": 0.4888645807784043,
              "mean_reward": -0.5177033595726344,
              "min_reward": -0.8291242771191917,
              "max_reward": -0.24007492456836307,
              "num_responses": 7,
              "rvariance": 0.049660206997325304
            },
            {
              "id": "reasoning_sample_531",
              "rewards": [
                -0.3838586247973055,
                -0.4070495441890704,
                -0.3606677054055406,
                -0.523004141147895,
                -0.4580695668509532,
                -0.32356223437871673,
                -0.4070495441890704
              ],
              "variance": 0.13821787957491882,
              "mean_reward": -0.40903733727979313,
              "min_reward": -0.523004141147895,
              "max_reward": -0.32356223437871673,
              "num_responses": 7,
              "rvariance": 0.0036685823756069237
            },
            {
              "id": "reasoning_sample_274",
              "rewards": [
                0.30723077307728874,
                0.9473001482900002,
                0.9565765160467061,
                0.743220057642469,
                0.44637628942787816
              ],
              "variance": 0.5899769893264992,
              "mean_reward": 0.6801407568968684,
              "min_reward": 0.30723077307728874,
              "max_reward": 0.9565765160467061,
              "num_responses": 5,
              "rvariance": 0.06909550996244587
            },
            {
              "id": "reasoning_sample_597",
              "rewards": [
                1.0493401936137658,
                1.3183548585582388,
                1.3183548585582388,
                0.9287474127765882,
                1.3183548585582388,
                1.3183548585582388,
                0.48348176045470204
              ],
              "variance": 0.567713706710405,
              "mean_reward": 1.1049984001540019,
              "min_reward": 0.48348176045470204,
              "max_reward": 1.3183548585582388,
              "num_responses": 7,
              "rvariance": 0.08607558475729907
            },
            {
              "id": "reasoning_sample_73",
              "rewards": [
                1.6894095688264772,
                1.9305951305008322,
                1.8934896594740083,
                1.8749369239605964,
                0.743220057642469,
                1.986253337041068,
                2.00480607255448
              ],
              "variance": 0.6827406668935587,
              "mean_reward": 1.7318158214285617,
              "min_reward": 0.743220057642469,
              "max_reward": 2.00480607255448,
              "num_responses": 7,
              "rvariance": 0.1720738992299994
            },
            {
              "id": "reasoning_sample_412",
              "rewards": [
                -1.2633742427299897,
                -0.6482351058634255,
                -0.6482351058634255,
                -0.3282004182570697,
                -1.7312510414588467,
                -0.6482351058634255
              ],
              "variance": 1.0090948800341706,
              "mean_reward": -0.8779218366726971,
              "min_reward": -1.7312510414588467,
              "max_reward": -0.3282004182570697,
              "num_responses": 6,
              "rvariance": 0.22286765164512667
            },
            {
              "id": "reasoning_sample_491",
              "rewards": [
                -2.0767957403961437,
                -1.1294466832425472,
                -1.4413645490617852,
                -1.2442417342317835,
                -1.3300481359813137,
                -1.2743899294410779,
                -1.5781909734731983
              ],
              "variance": 0.5793091664062875,
              "mean_reward": -1.4392111065468356,
              "min_reward": -2.0767957403961437,
              "max_reward": -1.1294466832425472,
              "num_responses": 7,
              "rvariance": 0.08555483352821017
            },
            {
              "id": "reasoning_sample_64",
              "rewards": [
                0.03821610813281581,
                0.25157256653705296,
                0.4649290249412901,
                0.11242705018646351,
                0.30723077307728874,
                0.1402561534565814,
                0.22374346326693506
              ],
              "variance": 0.287567400457885,
              "mean_reward": 0.21976787708548964,
              "min_reward": 0.03821610813281581,
              "max_reward": 0.4649290249412901,
              "num_responses": 7,
              "rvariance": 0.017083757467642006
            },
            {
              "id": "reasoning_sample_535",
              "rewards": [
                0.13097978569987545,
                0.33505987634740664,
                0.39071808288764237,
                0.5947981735351736,
                0.7896018964259988,
                0.743220057642469
              ],
              "variance": 0.5333911460105929,
              "mean_reward": 0.49739631208976093,
              "min_reward": 0.13097978569987545,
              "max_reward": 0.7896018964259988,
              "num_responses": 6,
              "rvariance": 0.05454916229578951
            },
            {
              "id": "reasoning_sample_548",
              "rewards": [
                -1.5294900427504918,
                -0.8198479093624857,
                -0.622725094532484,
                -0.8905802135073687,
                -0.6134487267757781,
                -0.6134487267757781,
                -0.23079855681165712
              ],
              "variance": 0.6857554864144884,
              "mean_reward": -0.7600484672165777,
              "min_reward": -1.5294900427504918,
              "max_reward": -0.23079855681165712,
              "num_responses": 7,
              "rvariance": 0.13637157033919542
            },
            {
              "id": "reasoning_sample_235",
              "rewards": [
                -0.39313499255401146,
                -0.3884968086756585,
                0.12170341794316948,
                -0.003527546772361022,
                -0.008165730650714003
              ],
              "variance": 0.46289075105962757,
              "mean_reward": -0.13432433214191508,
              "min_reward": -0.39313499255401146,
              "max_reward": 0.12170341794316948,
              "num_responses": 5,
              "rvariance": 0.04603212127541944
            },
            {
              "id": "reasoning_sample_156",
              "rewards": [
                -2.1881121534766153,
                -2.56844323150156,
                -1.9422884079239073,
                -2.025775717734261,
                -1.965479327315672,
                -1.9422884079239073
              ],
              "variance": 0.43598928456518027,
              "mean_reward": -2.105397874312654,
              "min_reward": -2.56844323150156,
              "max_reward": -1.9422884079239073,
              "num_responses": 6,
              "rvariance": 0.05006315640916655
            },
            {
              "id": "reasoning_sample_587",
              "rewards": [
                -0.49517503787777706,
                0.0011106371059919594,
                -0.4905368539994241,
                -0.13803487924459748,
                -0.05454756943424382,
                -0.05454756943424382,
                -0.14267306312295047
              ],
              "variance": 0.4601078407326158,
              "mean_reward": -0.19634347657246357,
              "min_reward": -0.49517503787777706,
              "max_reward": 0.0011106371059919594,
              "num_responses": 7,
              "rvariance": 0.03733296238958343
            },
            {
              "id": "reasoning_sample_594",
              "rewards": [
                -0.5879387154448367,
                -0.045271201677537856,
                -0.3142858666220108,
                -0.5879387154448367,
                -0.46734593460765916,
                -0.045271201677537856,
                -0.29109494723024587
              ],
              "variance": 0.5426675137672988,
              "mean_reward": -0.33416379752923786,
              "min_reward": -0.5879387154448367,
              "max_reward": -0.045271201677537856,
              "num_responses": 7,
              "rvariance": 0.04510126020600145
            },
            {
              "id": "reasoning_sample_622",
              "rewards": [
                -0.017442098407419965,
                1.0029583548302359,
                0.28867803756387683,
                0.44637628942787816,
                0.5947981735351736,
                0.5762454380217616,
                0.5947981735351736
              ],
              "variance": 0.5918322628778405,
              "mean_reward": 0.49805890978666856,
              "min_reward": -0.017442098407419965,
              "max_reward": 1.0029583548302359,
              "num_responses": 7,
              "rvariance": 0.08457232649328779
            },
            {
              "id": "reasoning_sample_647",
              "rewards": [
                -0.21688400517659817,
                0.40927081840105434,
                0.08459794691634562,
                0.08459794691634562,
                -0.49981322175613
              ],
              "variance": 0.6660432049314882,
              "mean_reward": -0.027646102939796535,
              "min_reward": -0.49981322175613,
              "max_reward": 0.40927081840105434,
              "num_responses": 5,
              "rvariance": 0.09496932426889729
            },
            {
              "id": "reasoning_sample_395",
              "rewards": [
                -0.8128906335449563,
                -0.5809814396273072,
                -0.9856629830136049,
                -0.5647477960530718,
                -0.6853405768902493,
                -0.5554714282963658
              ],
              "variance": 0.3391671961045618,
              "mean_reward": -0.697515809570926,
              "min_reward": -0.9856629830136049,
              "max_reward": -0.5554714282963658,
              "num_responses": 6,
              "rvariance": 0.024645431817363058
            },
            {
              "id": "reasoning_sample_252",
              "rewards": [
                -0.5183659572695419,
                0.17736162448340526,
                0.005748820984344941,
                0.005748820984344941,
                0.10315068242975756,
                -0.6296823703500135
              ],
              "variance": 0.7142803172663591,
              "mean_reward": -0.14267306312295047,
              "min_reward": -0.6296823703500135,
              "max_reward": 0.17736162448340526,
              "num_responses": 6,
              "rvariance": 0.09753880709180084
            },
            {
              "id": "reasoning_sample_497",
              "rewards": [
                -0.7943378980315443,
                -0.11948214373118556,
                -0.10092940821777363,
                0.2144670955102291,
                0.38144171513093644,
                0.38144171513093644,
                -0.10092940821777363
              ],
              "variance": 0.7708661605822654,
              "mean_reward": -0.019761190346596465,
              "min_reward": -0.7943378980315443,
              "max_reward": 0.38144171513093644,
              "num_responses": 7,
              "rvariance": 0.14284004806277217
            },
            {
              "id": "reasoning_sample_87",
              "rewards": [
                0.43709992167117223,
                0.35361261186081855,
                0.6968382188589392,
                0.6319036445619974,
                0.047492475889521775,
                0.32578350859070065,
                0.44637628942787816
              ],
              "variance": 0.443410378770545,
              "mean_reward": 0.4198723815515754,
              "min_reward": 0.047492475889521775,
              "max_reward": 0.6968382188589392,
              "num_responses": 7,
              "rvariance": 0.039225206290835916
            },
            {
              "id": "reasoning_sample_299",
              "rewards": [
                -0.509089589512836,
                -0.06382393719094978,
                0.39999445064434835,
                0.30723077307728874,
                0.34433624410411257,
                0.13097978569987545,
                0.09387431467305159
              ],
              "variance": 0.6085297248399111,
              "mean_reward": 0.10050029164212727,
              "min_reward": -0.509089589512836,
              "max_reward": 0.39999445064434835,
              "num_responses": 7,
              "rvariance": 0.08449505620868909
            },
            {
              "id": "reasoning_sample_303",
              "rewards": [
                0.019663372619403884,
                0.14953252121328736,
                0.08459794691634562,
                0.14953252121328736,
                -1.0679907468543703
              ],
              "variance": 0.782461620278148,
              "mean_reward": -0.13293287697840922,
              "min_reward": -1.0679907468543703,
              "max_reward": 0.14953252121328736,
              "num_responses": 5,
              "rvariance": 0.22090237942076124
            },
            {
              "id": "reasoning_sample_509",
              "rewards": [
                -0.863910656206839,
                -0.7827424383356619,
                -0.43951683133754127,
                -0.3282004182570697,
                -0.36994407316224653,
                -0.24007492456836307,
                -0.258627660081775
              ],
              "variance": 0.5640031596077225,
              "mean_reward": -0.46900242884992815,
              "min_reward": -0.863910656206839,
              "max_reward": -0.24007492456836307,
              "num_responses": 7,
              "rvariance": 0.05450825880233241
            },
            {
              "id": "reasoning_sample_572",
              "rewards": [
                0.6597327478321153,
                0.7988782641827048,
                0.9380237805332942,
                0.9380237805332942,
                0.8916419417497644,
                0.733943689885763,
                0.6040745412918795
              ],
              "variance": 0.30055431531727317,
              "mean_reward": 0.7949026780012594,
              "min_reward": 0.6040745412918795,
              "max_reward": 0.9380237805332942,
              "num_responses": 7,
              "rvariance": 0.01553483949000423
            },
            {
              "id": "reasoning_sample_557",
              "rewards": [
                1.2441439165045909,
                1.5966458912594175,
                1.5966458912594175,
                1.262696652018003,
                1.4853294781789461,
                1.2812493875314148,
                1.1328275034241193
              ],
              "variance": 0.39702853998701526,
              "mean_reward": 1.3713626743108442,
              "min_reward": 1.1328275034241193,
              "max_reward": 1.5966458912594175,
              "num_responses": 7,
              "rvariance": 0.029643691000595912
            },
            {
              "id": "reasoning_sample_678",
              "rewards": [
                -0.5461950605396598,
                0.13097978569987545,
                -0.035994833920831894,
                -0.4905368539994241,
                -0.0823766727043617,
                -0.0823766727043617,
                0.2144670955102291
              ],
              "variance": 0.6771748462395353,
              "mean_reward": -0.1274333160940764,
              "min_reward": -0.5461950605396598,
              "max_reward": 0.2144670955102291,
              "num_responses": 7,
              "rvariance": 0.07189999981909938
            },
            {
              "id": "reasoning_sample_53",
              "rewards": [
                2.245991634228835,
                2.190333427688599,
                2.524282666930014,
                2.468624460389778,
                2.5984936089836617,
                2.6170463444970733,
                2.672704551037309
              ],
              "variance": 0.4155812755004269,
              "mean_reward": 2.473925241965038,
              "min_reward": 2.190333427688599,
              "max_reward": 2.672704551037309,
              "num_responses": 7,
              "rvariance": 0.03006516528022524
            },
            {
              "id": "reasoning_sample_75",
              "rewards": [
                0.43709992167117223,
                0.028939740376109847,
                0.35361261186081855,
                0.1402561534565814,
                0.7710491609125869,
                0.29795440532058276
              ],
              "variance": 0.519476594375534,
              "mean_reward": 0.3381519989329753,
              "min_reward": 0.028939740376109847,
              "max_reward": 0.7710491609125869,
              "num_responses": 6,
              "rvariance": 0.05563675130786542
            },
            {
              "id": "reasoning_sample_595",
              "rewards": [
                0.6690091155888213,
                0.39999445064434835,
                0.47420539269799605,
                0.6782854833455273,
                0.6690091155888213
              ],
              "variance": 0.2448961087770375,
              "mean_reward": 0.5781007115731028,
              "min_reward": 0.39999445064434835,
              "max_reward": 0.6782854833455273,
              "num_responses": 5,
              "rvariance": 0.013816348360528929
            },
            {
              "id": "reasoning_sample_245",
              "rewards": [
                -0.9601529716826634,
                -0.39313499255401146,
                -0.5995341751407192,
                -0.7154887720995436,
                -0.42096409582412936
              ],
              "variance": 0.4580206579873569,
              "mean_reward": -0.6178550014602133,
              "min_reward": -0.9601529716826634,
              "max_reward": -0.39313499255401146,
              "num_responses": 5,
              "rvariance": 0.043260203477938505
            },
            {
              "id": "reasoning_sample_418",
              "rewards": [
                -3.1157489291472116,
                -2.3736395086107347,
                -2.6241014380417953,
                -1.5944246170474337,
                -2.6241014380417953,
                -2.3736395086107347,
                -2.930221574013092
              ],
              "variance": 0.9424789640813258,
              "mean_reward": -2.5194110019303997,
              "min_reward": -3.1157489291472116,
              "max_reward": -1.5944246170474337,
              "num_responses": 7,
              "rvariance": 0.20634327044952713
            },
            {
              "id": "reasoning_sample_60",
              "rewards": [
                1.0307874581003538,
                0.5762454380217616,
                0.6040745412918795,
                0.34433624410411257,
                0.6411800123187034,
                0.6319036445619974
              ],
              "variance": 0.3756928941465914,
              "mean_reward": 0.6380878897331347,
              "min_reward": 0.34433624410411257,
              "max_reward": 1.0307874581003538,
              "num_responses": 6,
              "rvariance": 0.04092203052030657
            },
            {
              "id": "reasoning_sample_385",
              "rewards": [
                -0.7154887720995436,
                -0.6041723590190721,
                -0.4302404635808353,
                -0.14731124700130344,
                -0.6922978527077788,
                -0.49517503787777706,
                -0.39777317643236443
              ],
              "variance": 0.40398581580454473,
              "mean_reward": -0.49749412981695357,
              "min_reward": -0.7154887720995436,
              "max_reward": -0.14731124700130344,
              "num_responses": 7,
              "rvariance": 0.033421593267481696
            },
            {
              "id": "reasoning_sample_243",
              "rewards": [
                -0.9091329490207807,
                0.10315068242975756,
                0.07532157915963966,
                0.11242705018646351,
                0.047492475889521775,
                0.019663372619403884
              ],
              "variance": 0.5525236545087989,
              "mean_reward": -0.09184629812266572,
              "min_reward": -0.9091329490207807,
              "max_reward": 0.11242705018646351,
              "num_responses": 6,
              "rvariance": 0.1345839487995897
            },
            {
              "id": "reasoning_sample_71",
              "rewards": [
                0.9194710450198823,
                0.6968382188589392,
                1.225591180991179,
                0.7803255286692928,
                1.0400638258570598,
                1.1792093422076493,
                1.1699329744509432
              ],
              "variance": 0.45083147297590975,
              "mean_reward": 1.0016331594364207,
              "min_reward": 0.6968382188589392,
              "max_reward": 1.225591180991179,
              "num_responses": 7,
              "rvariance": 0.03715998232065223
            },
            {
              "id": "reasoning_sample_218",
              "rewards": [
                -0.44879319909424725,
                0.30723077307728874,
                0.35361261186081855,
                0.17736162448340526,
                -0.14267306312295047,
                0.17736162448340526,
                0.44637628942787816
              ],
              "variance": 0.6558392003991116,
              "mean_reward": 0.12435380873079975,
              "min_reward": -0.44879319909424725,
              "max_reward": 0.44637628942787816,
              "num_responses": 7,
              "rvariance": 0.08501750870114626
            },
            {
              "id": "reasoning_sample_32",
              "rewards": [
                1.021511090343648,
                1.3183548585582388,
                1.3369075940716506,
                1.4482240071521222
              ],
              "variance": 0.3042648624199553,
              "mean_reward": 1.2812493875314148,
              "min_reward": 1.021511090343648,
              "max_reward": 1.4482240071521222,
              "num_responses": 4,
              "rvariance": 0.02495478963971966
            },
            {
              "id": "reasoning_sample_55",
              "rewards": [
                -1.8170574432083768,
                -2.2066648889900273,
                -1.7126983059454346,
                -1.9562029595589663,
                -2.016499349977555,
                -1.7799519721815529,
                -1.8402483626001416
              ],
              "variance": 0.3395150598954384,
              "mean_reward": -1.904189040351722,
              "min_reward": -2.2066648889900273,
              "max_reward": -1.7126983059454346,
              "num_responses": 7,
              "rvariance": 0.024370652630295916
            },
            {
              "id": "reasoning_sample_403",
              "rewards": [
                -0.6876596688294258,
                -1.223080020286798,
                -1.335845865829255,
                -1.407737715943726,
                -1.0824850714742233,
                -1.4761509281494327,
                -0.9613125176522517
              ],
              "variance": 0.5832516227028877,
              "mean_reward": -1.1677531125950158,
              "min_reward": -1.4761509281494327,
              "max_reward": -0.6876596688294258,
              "num_responses": 7,
              "rvariance": 0.06634230510162559
            },
            {
              "id": "reasoning_sample_580",
              "rewards": [
                0.5855218057784676,
                0.7061145866156451,
                0.6597327478321153,
                0.8267073674528227
              ],
              "variance": 0.1827444448071075,
              "mean_reward": 0.6945191269197627,
              "min_reward": 0.5855218057784676,
              "max_reward": 0.8267073674528227,
              "num_responses": 4,
              "rvariance": 0.0076746734516982724
            },
            {
              "id": "reasoning_sample_530",
              "rewards": [
                -0.768827886700603,
                -0.8430388287542506,
                -0.3560295215271876,
                -0.7409987834304851,
                -0.3374767860137757
              ],
              "variance": 0.4684565717136511,
              "mean_reward": -0.6092743612852604,
              "min_reward": -0.8430388287542506,
              "max_reward": -0.3374767860137757,
              "num_responses": 5,
              "rvariance": 0.04709226958011374
            },
            {
              "id": "reasoning_sample_318",
              "rewards": [
                0.6968382188589392,
                0.6690091155888213,
                0.7524964253991749,
                0.6411800123187034,
                0.7988782641827048,
                1.0586165613704717,
                0.7153909543723511
              ],
              "variance": 0.2448961087770375,
              "mean_reward": 0.7617727931558809,
              "min_reward": 0.6411800123187034,
              "max_reward": 1.0586165613704717,
              "num_responses": 7,
              "rvariance": 0.017013511754370447
            },
            {
              "id": "reasoning_sample_76",
              "rewards": [
                0.6411800123187034,
                1.262696652018003,
                0.9101946772631763,
                1.1142747679107075,
                1.1792093422076493,
                0.9565765160467061,
                1.012234722586942
              ],
              "variance": 0.41001545484640367,
              "mean_reward": 1.0109095271931268,
              "min_reward": 0.6411800123187034,
              "max_reward": 1.262696652018003,
              "num_responses": 7,
              "rvariance": 0.036029026336980206
            },
            {
              "id": "reasoning_sample_393",
              "rewards": [
                -0.1333966953662445,
                0.27012530205046487,
                -0.04063301779918487,
                0.019663372619403884,
                0.09387431467305159,
                0.1866379922401112
              ],
              "variance": 0.3153965037280027,
              "mean_reward": 0.06604521140293369,
              "min_reward": -0.1333966953662445,
              "max_reward": 0.27012530205046487,
              "num_responses": 6,
              "rvariance": 0.018379059151322267
            },
            {
              "id": "reasoning_sample_642",
              "rewards": [
                -0.2771803955951869,
                0.1402561534565814,
                0.6782854833455273,
                0.11242705018646351,
                0.37216534737423046,
                0.5205872314815259
              ],
              "variance": 0.6818130301178883,
              "mean_reward": 0.25775681170819026,
              "min_reward": -0.2771803955951869,
              "max_reward": 0.6782854833455273,
              "num_responses": 6,
              "rvariance": 0.09668307771526637
            },
            {
              "id": "reasoning_sample_16",
              "rewards": [
                0.43709992167117223,
                -0.17050216639306834,
                0.22374346326693506,
                0.27012530205046487,
                0.45565265718458414,
                0.10315068242975756
              ],
              "variance": 0.4800520314095336,
              "mean_reward": 0.21987831003497424,
              "min_reward": -0.17050216639306834,
              "max_reward": 0.45565265718458414,
              "num_responses": 6,
              "rvariance": 0.045222787729048496
            },
            {
              "id": "reasoning_sample_260",
              "rewards": [
                0.1866379922401112,
                0.31650714083399467,
                0.8174309996961167,
                0.733943689885763,
                1.225591180991179,
                1.1606566066942372,
                1.0864456646405896
              ],
              "variance": 0.9220709550165727,
              "mean_reward": 0.7896018964259987,
              "min_reward": 0.1866379922401112,
              "max_reward": 1.225591180991179,
              "num_responses": 7,
              "rvariance": 0.14387726992279748
            },
            {
              "id": "reasoning_sample_582",
              "rewards": [
                0.09387431467305159,
                0.5669690702650557,
                0.5669690702650557,
                0.37216534737423046,
                0.242296198780347
              ],
              "variance": 0.413726001949086,
              "mean_reward": 0.3684548002715481,
              "min_reward": 0.09387431467305159,
              "max_reward": 0.5669690702650557,
              "num_responses": 5,
              "rvariance": 0.03402800694872671
            },
            {
              "id": "reasoning_sample_295",
              "rewards": [
                -0.4812604862427181,
                0.19591435999681717,
                0.047492475889521775,
                0.028939740376109847,
                0.34433624410411257,
                0.30723077307728874
              ],
              "variance": 0.5519438815240048,
              "mean_reward": 0.07377551786685534,
              "min_reward": -0.4812604862427181,
              "max_reward": 0.34433624410411257,
              "num_responses": 6,
              "rvariance": 0.07556472843682545
            },
            {
              "id": "reasoning_sample_366",
              "rewards": [
                -0.059185753312596796,
                0.6597327478321153,
                0.27012530205046487,
                0.028939740376109847,
                0.39071808288764237,
                0.5855218057784676,
                0.6782854833455273
              ],
              "variance": 0.6734642991368529,
              "mean_reward": 0.36487677270824725,
              "min_reward": -0.059185753312596796,
              "max_reward": 0.6782854833455273,
              "num_responses": 7,
              "rvariance": 0.0765968038227187
            },
            {
              "id": "reasoning_sample_286",
              "rewards": [
                -1.3149740383766666,
                -0.754913335065544,
                -0.7479560592480146,
                -0.2864567633518929,
                -0.6737451171943668,
                -0.7479560592480146,
                -0.32356223437871673
              ],
              "variance": 0.6702175704220058,
              "mean_reward": -0.6927948009804593,
              "min_reward": -1.3149740383766666,
              "max_reward": -0.2864567633518929,
              "num_responses": 7,
              "rvariance": 0.09983677486666005
            },
            {
              "id": "reasoning_sample_356",
              "rewards": [
                -1.1117636072063266,
                -1.6825501107361402,
                -1.3938231643086672,
                -0.4534313829726002,
                -0.9752270692873106,
                -0.9752270692873106
              ],
              "variance": 0.8238574113924484,
              "mean_reward": -1.0986704006330592,
              "min_reward": -1.6825501107361402,
              "max_reward": -0.4534313829726002,
              "num_responses": 6,
              "rvariance": 0.14583533397544737
            },
            {
              "id": "reasoning_sample_343",
              "rewards": [
                -0.32356223437871673,
                0.38144171513093644,
                0.19591435999681717,
                0.45565265718458414,
                0.40927081840105434
              ],
              "variance": 0.5528715182996754,
              "mean_reward": 0.22374346326693506,
              "min_reward": -0.32356223437871673,
              "max_reward": 0.45565265718458414,
              "num_responses": 5,
              "rvariance": 0.08267779960635399
            },
            {
              "id": "reasoning_sample_205",
              "rewards": [
                1.2812493875314148,
                1.7265150398533011,
                1.6337513622862414,
                1.2998021230448267,
                2.1161224856349516,
                2.1161224856349516,
                2.1161224856349516
              ],
              "variance": 0.8237414567954897,
              "mean_reward": 1.7556693385172342,
              "min_reward": 1.2812493875314148,
              "max_reward": 2.1161224856349516,
              "num_responses": 7,
              "rvariance": 0.11976894112800016
            },
            {
              "id": "reasoning_sample_512",
              "rewards": [
                0.5113108637248199,
                0.965852883803412,
                1.1328275034241193,
                1.1328275034241193,
                1.1792093422076493,
                0.9473001482900002
              ],
              "variance": 0.42671291680847423,
              "mean_reward": 0.9782213741456866,
              "min_reward": 0.5113108637248199,
              "max_reward": 1.1792093422076493,
              "num_responses": 6,
              "rvariance": 0.051219466704972495
            },
            {
              "id": "reasoning_sample_226",
              "rewards": [
                -0.8836229376898392,
                -0.37458225704059955,
                -0.14731124700130344,
                -0.36994407316224653,
                -0.34211496989212864,
                -0.21224582129824518,
                -0.21224582129824518
              ],
              "variance": 0.39192653772082686,
              "mean_reward": -0.363152446768944,
              "min_reward": -0.8836229376898392,
              "max_reward": -0.14731124700130344,
              "num_responses": 7,
              "rvariance": 0.05194884526339064
            },
            {
              "id": "reasoning_sample_225",
              "rewards": [
                -0.29573313110859883,
                0.242296198780347,
                0.23301983102364102,
                0.242296198780347,
                0.32578350859070065,
                0.08459794691634562
              ],
              "variance": 0.3896074457816504,
              "mean_reward": 0.13871009216379707,
              "min_reward": -0.29573313110859883,
              "max_reward": 0.32578350859070065,
              "num_responses": 6,
              "rvariance": 0.04283666524266438
            },
            {
              "id": "reasoning_sample_508",
              "rewards": [
                -1.1877138682143566,
                -0.6598305655593079,
                -0.8523151965109567,
                -0.6598305655593079,
                -0.7479560592480146
              ],
              "variance": 0.3937238339736887,
              "mean_reward": -0.8215292510183888,
              "min_reward": -1.1877138682143566,
              "max_reward": -0.6598305655593079,
              "num_responses": 5,
              "rvariance": 0.03854897852329975
            },
            {
              "id": "reasoning_sample_585",
              "rewards": [
                -0.5972150832015426,
                -0.618086910654131,
                -0.24935129232506903,
                -0.3282004182570697,
                0.0011106371059919594
              ],
              "variance": 0.5106640450066632,
              "mean_reward": -0.35834861346636404,
              "min_reward": -0.618086910654131,
              "max_reward": 0.0011106371059919594,
              "num_responses": 5,
              "rvariance": 0.05330429118042877
            },
            {
              "id": "reasoning_sample_574",
              "rewards": [
                0.06604521140293369,
                0.20519072775352315,
                0.27012530205046487,
                0.39071808288764237,
                0.1866379922401112,
                0.5669690702650557,
                0.38144171513093644
              ],
              "variance": 0.3228175979333675,
              "mean_reward": 0.29530401453295246,
              "min_reward": 0.06604521140293369,
              "max_reward": 0.5669690702650557,
              "num_responses": 7,
              "rvariance": 0.023349675091464652
            },
            {
              "id": "reasoning_sample_520",
              "rewards": [
                -0.9589934257130752,
                -0.8036142657882503,
                -1.0065348104661933,
                -1.0355234597058993,
                -0.953195695865134,
                -0.636639646167543,
                -1.0650918819303996
              ],
              "variance": 0.31052641065573205,
              "mean_reward": -0.9227990265194992,
              "min_reward": -1.0650918819303996,
              "max_reward": -0.636639646167543,
              "num_responses": 7,
              "rvariance": 0.019755989463660344
            },
            {
              "id": "reasoning_sample_238",
              "rewards": [
                0.07532157915963966,
                0.733943689885763,
                0.6782854833455273,
                0.6597327478321153,
                0.984405619316824
              ],
              "variance": 0.5751348009157697,
              "mean_reward": 0.6263378239079739,
              "min_reward": 0.07532157915963966,
              "max_reward": 0.984405619316824,
              "num_responses": 5,
              "rvariance": 0.0894448501486559
            },
            {
              "id": "reasoning_sample_630",
              "rewards": [
                -1.4158545377308438,
                -0.7038933124036613,
                -1.0517571032801347,
                -0.9787057071960754,
                -1.0517571032801347
              ],
              "variance": 0.4563972936299332,
              "mean_reward": -1.0403935527781702,
              "min_reward": -1.4158545377308438,
              "max_reward": -0.7038933124036613,
              "num_responses": 5,
              "rvariance": 0.05165340276926318
            },
            {
              "id": "reasoning_sample_233",
              "rewards": [
                -0.7781042544573089,
                -0.22616037293330413,
                -0.22616037293330413,
                -1.0076943564357814,
                -0.40241136031071745,
                -0.12875851148789152,
                -0.29109494723024587
              ],
              "variance": 0.6827406668935588,
              "mean_reward": -0.43719773939836476,
              "min_reward": -1.0076943564357814,
              "max_reward": -0.12875851148789152,
              "num_responses": 7,
              "rvariance": 0.09263543678759235
            },
            {
              "id": "reasoning_sample_394",
              "rewards": [
                0.17736162448340526,
                0.8267073674528227,
                0.7896018964259988,
                0.42782355391446625,
                0.42782355391446625,
                0.5113108637248199,
                0.37216534737423046
              ],
              "variance": 0.5102002266188279,
              "mean_reward": 0.5046848867557443,
              "min_reward": 0.17736162448340526,
              "max_reward": 0.8267073674528227,
              "num_responses": 7,
              "rvariance": 0.045919622765615044
            },
            {
              "id": "reasoning_sample_284",
              "rewards": [
                -0.40241136031071745,
                0.1866379922401112,
                0.5669690702650557,
                0.35361261186081855,
                0.32578350859070065,
                0.44637628942787816,
                0.19591435999681717
              ],
              "variance": 0.5435951505429695,
              "mean_reward": 0.23898321029580916,
              "min_reward": -0.40241136031071745,
              "max_reward": 0.5669690702650557,
              "num_responses": 7,
              "rvariance": 0.08389182114596962
            },
            {
              "id": "reasoning_sample_207",
              "rewards": [
                -0.5183659572695419,
                -0.23543674069001008,
                -0.10556759209612661,
                -0.5461950605396598,
                -0.10556759209612661,
                -0.3282004182570697,
                -0.39777317643236443
              ],
              "variance": 0.42393000648146245,
              "mean_reward": -0.3195866481972713,
              "min_reward": -0.5461950605396598,
              "max_reward": -0.10556759209612661,
              "num_responses": 7,
              "rvariance": 0.027963062310573977
            },
            {
              "id": "reasoning_sample_345",
              "rewards": [
                -0.4256022797024823,
                -0.2771803955951869,
                0.08459794691634562,
                -0.04063301779918487,
                0.019663372619403884,
                0.10315068242975756
              ],
              "variance": 0.4452656523218862,
              "mean_reward": -0.08933394852189118,
              "min_reward": -0.4256022797024823,
              "max_reward": 0.10315068242975756,
              "num_responses": 6,
              "rvariance": 0.0383195853842678
            },
            {
              "id": "reasoning_sample_565",
              "rewards": [
                0.42782355391446625,
                0.7896018964259988,
                1.0771692968838837,
                0.7061145866156451,
                0.9101946772631763,
                0.8267073674528227,
                1.0771692968838837
              ],
              "variance": 0.48237112334871013,
              "mean_reward": 0.8306829536342681,
              "min_reward": 0.42782355391446625,
              "max_reward": 1.0771692968838837,
              "num_responses": 7,
              "rvariance": 0.04390708308038503
            },
            {
              "id": "reasoning_sample_78",
              "rewards": [
                2.208886163202011,
                2.041911543581304,
                2.3016498407690706,
                2.245991634228835,
                2.1532279566617754,
                2.0790170146081275,
                2.39441351833613
              ],
              "variance": 0.27458048559849635,
              "mean_reward": 2.2035853816267506,
              "min_reward": 2.041911543581304,
              "max_reward": 2.39441351833613,
              "num_responses": 7,
              "rvariance": 0.013149997524434954
            },
            {
              "id": "reasoning_sample_601",
              "rewards": [
                -0.8221670013016622,
                -0.4116877280674234,
                -0.14267306312295047,
                -0.3050094988653048
              ],
              "variance": 0.5076492254857339,
              "mean_reward": -0.42038432283933524,
              "min_reward": -0.8221670013016622,
              "max_reward": -0.14267306312295047,
              "num_responses": 4,
              "rvariance": 0.06298496131332205
            },
            {
              "id": "reasoning_sample_539",
              "rewards": [
                -0.19369308578483327,
                0.26084893429375894,
                0.5113108637248199,
                0.39999445064434835,
                1.1792093422076493,
                0.5855218057784676
              ],
              "variance": 0.8487876497385957,
              "mean_reward": 0.4571987184773685,
              "min_reward": -0.19369308578483327,
              "max_reward": 1.1792093422076493,
              "num_responses": 6,
              "rvariance": 0.16769666444002038
            },
            {
              "id": "reasoning_sample_603",
              "rewards": [
                -0.9926202588311343,
                -2.1510066824497915,
                -2.0953484759095558,
                -2.1510066824497915,
                -2.1510066824497915,
                -2.1510066824497915
              ],
              "variance": 0.6070223150794467,
              "mean_reward": -1.9486659107566426,
              "min_reward": -2.1510066824497915,
              "max_reward": -0.9926202588311343,
              "num_responses": 6,
              "rvariance": 0.18321770250717082
            },
            {
              "id": "reasoning_sample_339",
              "rewards": [
                0.29795440532058276,
                0.6504563800754094,
                0.6782854833455273,
                0.7896018964259988,
                0.9009183095064703,
                0.9380237805332942
              ],
              "variance": 0.4452656523218861,
              "mean_reward": 0.7092067092012138,
              "min_reward": 0.29795440532058276,
              "max_reward": 0.9380237805332942,
              "num_responses": 6,
              "rvariance": 0.0448516927969061
            },
            {
              "id": "reasoning_sample_447",
              "rewards": [
                0.17736162448340526,
                0.7061145866156451,
                0.7061145866156451,
                0.7061145866156451,
                0.743220057642469,
                0.44637628942787816,
                0.7061145866156451
              ],
              "variance": 0.38218635157628567,
              "mean_reward": 0.598773759716619,
              "min_reward": 0.17736162448340526,
              "max_reward": 0.743220057642469,
              "num_responses": 7,
              "rvariance": 0.03825230316202489
            },
            {
              "id": "reasoning_sample_44",
              "rewards": [
                1.188485709964355,
                1.262696652018003,
                1.3369075940716506,
                1.4111185361252983,
                0.9101946772631763,
                1.4296712716387103,
                1.3369075940716506
              ],
              "variance": 0.3413703334467795,
              "mean_reward": 1.2679974335932636,
              "min_reward": 0.9101946772631763,
              "max_reward": 1.4296712716387103,
              "num_responses": 7,
              "rvariance": 0.02721318932140015
            },
            {
              "id": "reasoning_sample_266",
              "rewards": [
                -0.9926202588311343,
                -0.2818185794735399,
                0.29795440532058276,
                -0.4812604862427181,
                -0.37458225704059955,
                0.242296198780347,
                0.14953252121328736
              ],
              "variance": 0.9503638766745259,
              "mean_reward": -0.20578549375339636,
              "min_reward": -0.9926202588311343,
              "max_reward": 0.29795440532058276,
              "num_responses": 7,
              "rvariance": 0.18715011104358922
            },
            {
              "id": "reasoning_sample_529",
              "rewards": [
                -0.6134487267757781,
                -0.4256022797024823,
                -0.2818185794735399,
                -0.20296945354153922,
                -0.20296945354153922,
                -0.049909385555890834,
                -0.20296945354153922
              ],
              "variance": 0.3589954321845208,
              "mean_reward": -0.2828124760189012,
              "min_reward": -0.6134487267757781,
              "max_reward": -0.049909385555890834,
              "num_responses": 7,
              "rvariance": 0.029011260063297954
            },
            {
              "id": "reasoning_sample_466",
              "rewards": [
                -1.270331518547519,
                -0.39313499255401146,
                -0.2771803955951869,
                -0.6088105428974251,
                -0.42096409582412936,
                -0.36994407316224653,
                -0.34211496989212864
              ],
              "variance": 0.5572777929841107,
              "mean_reward": -0.5260686554960925,
              "min_reward": -1.270331518547519,
              "max_reward": -0.2771803955951869,
              "num_responses": 7,
              "rvariance": 0.10137870943256826
            },
            {
              "id": "reasoning_sample_349",
              "rewards": [
                -2.322619485948852,
                -1.615296444500022,
                -1.6454446397093165,
                -1.5364473185680214,
                -1.7753137883032,
                -1.5897864331690807
              ],
              "variance": 0.4858497612574748,
              "mean_reward": -1.747484685033082,
              "min_reward": -2.322619485948852,
              "max_reward": -1.5364473185680214,
              "num_responses": 6,
              "rvariance": 0.07147431811393559
            },
            {
              "id": "reasoning_sample_206",
              "rewards": [
                -0.9868225289831931,
                -1.2761292483954603,
                -1.2245294527487833,
                -1.2761292483954603
              ],
              "variance": 0.21799464228259025,
              "mean_reward": -1.1909026196307242,
              "min_reward": -1.2761292483954603,
              "max_reward": -0.9868225289831931,
              "num_responses": 4,
              "rvariance": 0.014326650951364643
            },
            {
              "id": "reasoning_sample_516",
              "rewards": [
                -0.7781042544573089,
                -0.17977853414977432,
                -0.07773848882600873,
                -0.4534313829726002,
                -0.11948214373118556,
                -0.24007492456836307,
                -0.16586398251471537
              ],
              "variance": 0.48051584979736883,
              "mean_reward": -0.287781958745708,
              "min_reward": -0.7781042544573089,
              "max_reward": -0.07773848882600873,
              "num_responses": 7,
              "rvariance": 0.05272906659587634
            },
            {
              "id": "reasoning_sample_542",
              "rewards": [
                0.27012530205046487,
                0.5484163347516438,
                0.733943689885763,
                0.7061145866156451,
                0.49275812821140796,
                0.733943689885763,
                0.6411800123187034
              ],
              "variance": 0.33023869213873225,
              "mean_reward": 0.589497391959913,
              "min_reward": 0.27012530205046487,
              "max_reward": 0.733943689885763,
              "num_responses": 7,
              "rvariance": 0.02443497136151016
            },
            {
              "id": "reasoning_sample_151",
              "rewards": [
                -0.9184093167774866,
                -0.8012951738490738,
                -0.6691069333160139,
                -0.7525942431263675
              ],
              "variance": 0.1891219476398428,
              "mean_reward": -0.7853514167672355,
              "min_reward": -0.9184093167774866,
              "max_reward": -0.6691069333160139,
              "num_responses": 4,
              "rvariance": 0.008136105125700491
            },
            {
              "id": "reasoning_sample_223",
              "rewards": [
                -1.0639323359608115,
                -1.3497604174643139,
                -0.4302404635808353,
                -0.7989760819098973,
                -0.4302404635808353,
                -0.5369186927829539,
                -0.36530588928389357
              ],
              "variance": 0.7739969347001538,
              "mean_reward": -0.7107677635090772,
              "min_reward": -1.3497604174643139,
              "max_reward": -0.36530588928389357,
              "num_responses": 7,
              "rvariance": 0.12111086748920663
            },
            {
              "id": "reasoning_sample_452",
              "rewards": [
                -0.7062124043428377,
                0.1402561534565814,
                0.11242705018646351,
                -0.19369308578483327
              ],
              "variance": 0.6843640312509824,
              "mean_reward": -0.16180557162115652,
              "min_reward": -0.7062124043428377,
              "max_reward": 0.1402561534565814,
              "num_responses": 4,
              "rvariance": 0.11596010742350286
            },
            {
              "id": "reasoning_sample_68",
              "rewards": [
                0.9009183095064703,
                1.012234722586942,
                1.2441439165045909,
                1.6708568333130653,
                1.6523040977996533,
                1.2441439165045909,
                1.466776742665534
              ],
              "variance": 0.6920170346502648,
              "mean_reward": 1.313054076982978,
              "min_reward": 0.9009183095064703,
              "max_reward": 1.6708568333130653,
              "num_responses": 7,
              "rvariance": 0.07665563460758361
            },
            {
              "id": "reasoning_sample_552",
              "rewards": [
                0.028939740376109847,
                0.47420539269799605,
                0.48348176045470204,
                -0.09629122433942065,
                0.48348176045470204,
                0.48348176045470204,
                0.502034495968114
              ],
              "variance": 0.5120555001701692,
              "mean_reward": 0.3370476694381294,
              "min_reward": -0.09629122433942065,
              "max_reward": 0.502034495968114,
              "num_responses": 7,
              "rvariance": 0.05615354511786462
            },
            {
              "id": "reasoning_sample_209",
              "rewards": [
                -0.36994407316224653,
                -0.11484395985283258,
                0.27940166980717085,
                0.2144670955102291
              ],
              "variance": 0.5533353366875107,
              "mean_reward": 0.0022701830755802108,
              "min_reward": -0.36994407316224653,
              "max_reward": 0.27940166980717085,
              "num_responses": 4,
              "rvariance": 0.06852214140134877
            },
            {
              "id": "reasoning_sample_391",
              "rewards": [
                -1.766037420546494,
                -1.1666835090862386,
                -1.1423466321542164,
                -1.331207681950902,
                -1.5550000540814333,
                -1.4715127442710796,
                -1.430928635335491
              ],
              "variance": 0.4824662423540278,
              "mean_reward": -1.4091023824894078,
              "min_reward": -1.766037420546494,
              "max_reward": -1.1423466321542164,
              "num_responses": 7,
              "rvariance": 0.041293330775820654
            },
            {
              "id": "reasoning_sample_210",
              "rewards": [
                1.0400638258570598,
                2.00480607255448,
                1.8192787174203606,
                2.0233588080678917,
                1.986253337041068,
                1.9305951305008322,
                1.9677006015276561
              ],
              "variance": 0.5046344059648045,
              "mean_reward": 1.8245794989956214,
              "min_reward": 1.0400638258570598,
              "max_reward": 2.0233588080678917,
              "num_responses": 7,
              "rvariance": 0.106478452177022
            },
            {
              "id": "reasoning_sample_465",
              "rewards": [
                0.019663372619403884,
                0.6319036445619974,
                0.6040745412918795,
                0.6040745412918795,
                0.7524964253991749,
                0.7524964253991749,
                0.965852883803412
              ],
              "variance": 0.4675289349379805,
              "mean_reward": 0.618651690623846,
              "min_reward": 0.019663372619403884,
              "max_reward": 0.965852883803412,
              "num_responses": 7,
              "rvariance": 0.07368072865053331
            },
            {
              "id": "reasoning_sample_396",
              "rewards": [
                -0.6528732897417784,
                -0.3142858666220108,
                -0.43951683133754127,
                0.48348176045470204,
                -0.6528732897417784,
                -0.4812604862427181,
                0.03821610813281581
              ],
              "variance": 0.8691956588033488,
              "mean_reward": -0.2884445564426156,
              "min_reward": -0.6528732897417784,
              "max_reward": 0.48348176045470204,
              "num_responses": 7,
              "rvariance": 0.14698037430656843
            },
            {
              "id": "reasoning_sample_348",
              "rewards": [
                -0.8975374893248982,
                -0.14267306312295047,
                -0.4070495441890704,
                -0.5369186927829539,
                -0.42096409582412936,
                -0.4070495441890704,
                -0.3282004182570697
              ],
              "variance": 0.4271767351963096,
              "mean_reward": -0.44862754967002033,
              "min_reward": -0.8975374893248982,
              "max_reward": -0.14267306312295047,
              "num_responses": 7,
              "rvariance": 0.04594986134999991
            },
            {
              "id": "reasoning_sample_83",
              "rewards": [
                -0.17977853414977432,
                0.20519072775352315,
                0.1680852567266993,
                0.33505987634740664,
                0.30723077307728874,
                0.49275812821140796,
                0.27012530205046487
              ],
              "variance": 0.36919943671689737,
              "mean_reward": 0.22838164714528802,
              "min_reward": -0.17977853414977432,
              "max_reward": 0.49275812821140796,
              "num_responses": 7,
              "rvariance": 0.03714329896375023
            },
            {
              "id": "reasoning_sample_242",
              "rewards": [
                0.5762454380217616,
                1.3925658006118864,
                1.3925658006118864,
                0.984405619316824,
                1.1421038711808253,
                1.0307874581003538,
                1.1699329744509432
              ],
              "variance": 0.5714242538130873,
              "mean_reward": 1.098372423184926,
              "min_reward": 0.5762454380217616,
              "max_reward": 1.3925658006118864,
              "num_responses": 7,
              "rvariance": 0.06718651245857811
            },
            {
              "id": "reasoning_sample_269",
              "rewards": [
                1.1606566066942372,
                1.262696652018003,
                0.743220057642469,
                1.262696652018003,
                1.262696652018003
              ],
              "variance": 0.3525019747548267,
              "mean_reward": 1.1383933240781432,
              "min_reward": 0.743220057642469,
              "max_reward": 1.262696652018003,
              "num_responses": 5,
              "rvariance": 0.04060230325381147
            },
            {
              "id": "reasoning_sample_694",
              "rewards": [
                -0.7595515189438969,
                -0.20760763741989222,
                -1.0471189194017818,
                -0.523004141147895,
                -0.20760763741989222,
                -0.29573313110859883
              ],
              "variance": 0.6957275817529472,
              "mean_reward": -0.5067704975736594,
              "min_reward": -1.0471189194017818,
              "max_reward": -0.20760763741989222,
              "num_responses": 6,
              "rvariance": 0.09661196612601526
            },
            {
              "id": "reasoning_sample_18",
              "rewards": [
                0.5762454380217616,
                0.45565265718458414,
                0.9565765160467061,
                0.7524964253991749,
                0.8174309996961167,
                0.5947981735351736
              ],
              "variance": 0.37105471026823844,
              "mean_reward": 0.6922000349805862,
              "min_reward": 0.45565265718458414,
              "max_reward": 0.9565765160467061,
              "num_responses": 6,
              "rvariance": 0.028016771012179517
            },
            {
              "id": "reasoning_sample_230",
              "rewards": [
                -1.1788723301962463,
                -0.750275151187191,
                -0.7154887720995436,
                -0.3096476827436578,
                -0.7154887720995436
              ],
              "variance": 0.535449340106612,
              "mean_reward": -0.7339545416652364,
              "min_reward": -1.1788723301962463,
              "max_reward": -0.3096476827436578,
              "num_responses": 5,
              "rvariance": 0.07578729613313909
            },
            {
              "id": "reasoning_sample_237",
              "rewards": [
                0.5113108637248199,
                0.724667322129057,
                0.7524964253991749,
                1.1142747679107075,
                1.0493401936137658
              ],
              "variance": 0.49164749110541606,
              "mean_reward": 0.8304179145555051,
              "min_reward": 0.5113108637248199,
              "max_reward": 1.1142747679107075,
              "num_responses": 5,
              "rvariance": 0.049517186725104426
            },
            {
              "id": "reasoning_sample_312",
              "rewards": [
                -0.10092940821777363,
                0.09387431467305159,
                0.07532157915963966,
                0.30723077307728874,
                0.43709992167117223,
                0.43709992167117223
              ],
              "variance": 0.4499038362002392,
              "mean_reward": 0.2082828503390918,
              "min_reward": -0.10092940821777363,
              "max_reward": 0.43709992167117223,
              "num_responses": 6,
              "rvariance": 0.04014757153148769
            },
            {
              "id": "reasoning_sample_47",
              "rewards": [
                0.8638128384796465,
                0.7803255286692928,
                0.5762454380217616,
                0.27012530205046487,
                0.5762454380217616,
                0.5762454380217616,
                0.5762454380217616
              ],
              "variance": 0.35992306896019133,
              "mean_reward": 0.6027493458980643,
              "min_reward": 0.27012530205046487,
              "max_reward": 0.8638128384796465,
              "num_responses": 7,
              "rvariance": 0.030448004417555217
            },
            {
              "id": "reasoning_sample_2",
              "rewards": [
                1.2998021230448267,
                1.3554603295850625,
                1.4296712716387103,
                1.5966458912594175,
                1.5966458912594175,
                1.4296712716387103,
                1.4111185361252983
              ],
              "variance": 0.26344884429044924,
              "mean_reward": 1.4455736163644919,
              "min_reward": 1.2998021230448267,
              "max_reward": 1.5966458912594175,
              "num_responses": 7,
              "rvariance": 0.010958331270362468
            },
            {
              "id": "reasoning_sample_58",
              "rewards": [
                0.40927081840105434,
                0.5855218057784676,
                0.743220057642469,
                0.6504563800754094,
                0.5484163347516438,
                0.39999445064434835,
                0.5762454380217616
              ],
              "variance": 0.28200157980386126,
              "mean_reward": 0.5590178979021648,
              "min_reward": 0.39999445064434835,
              "max_reward": 0.743220057642469,
              "num_responses": 7,
              "rvariance": 0.013016530669219012
            },
            {
              "id": "reasoning_sample_308",
              "rewards": [
                -0.7711469786397794,
                -0.1333966953662445,
                -0.3282004182570697,
                -0.4302404635808353,
                -0.12875851148789152,
                -0.3282004182570697,
                -0.3282004182570697
              ],
              "variance": 0.43506164778950956,
              "mean_reward": -0.3497348434065657,
              "min_reward": -0.7711469786397794,
              "max_reward": -0.12875851148789152,
              "num_responses": 7,
              "rvariance": 0.04015618150953799
            },
            {
              "id": "reasoning_sample_59",
              "rewards": [
                0.12170341794316948,
                0.5113108637248199,
                0.9751292515601181,
                0.743220057642469,
                0.6319036445619974,
                0.733943689885763,
                0.35361261186081855
              ],
              "variance": 0.5751348009157697,
              "mean_reward": 0.5815462195970224,
              "min_reward": 0.12170341794316948,
              "max_reward": 0.9751292515601181,
              "num_responses": 7,
              "rvariance": 0.06787843273430293
            },
            {
              "id": "reasoning_sample_219",
              "rewards": [
                0.38144171513093644,
                1.1328275034241193,
                1.0400638258570598,
                1.1699329744509432,
                1.2441439165045909,
                1.1513802389375314,
                1.1792093422076493
              ],
              "variance": 0.4285681903598153,
              "mean_reward": 1.04271421664469,
              "min_reward": 0.38144171513093644,
              "max_reward": 1.2441439165045909,
              "num_responses": 7,
              "rvariance": 0.07608664433008404
            },
            {
              "id": "reasoning_sample_216",
              "rewards": [
                -1.3822277046127847,
                -0.3050094988653048,
                -0.21224582129824518,
                -0.4302404635808353
              ],
              "variance": 0.8565566077348366,
              "mean_reward": -0.5824308720892926,
              "min_reward": -1.3822277046127847,
              "max_reward": -0.21224582129824518,
              "num_responses": 4,
              "rvariance": 0.21920912097680884
            },
            {
              "id": "reasoning_sample_201",
              "rewards": [
                -0.3328386021354227,
                0.05676884364622774,
                -0.04063301779918487,
                -0.10092940821777363,
                0.028939740376109847
              ],
              "variance": 0.2857121269065437,
              "mean_reward": -0.07773848882600873,
              "min_reward": -0.3328386021354227,
              "max_reward": 0.05676884364622774,
              "num_responses": 5,
              "rvariance": 0.01929263392146603
            },
            {
              "id": "reasoning_sample_550",
              "rewards": [
                -0.5693859799314247,
                -0.258627660081775,
                -0.258627660081775,
                -0.258627660081775,
                -0.258627660081775,
                -0.258627660081775,
                -0.4116877280674234
              ],
              "variance": 0.2161393687312489,
              "mean_reward": -0.3248874297725318,
              "min_reward": -0.5693859799314247,
              "max_reward": -0.258627660081775,
              "num_responses": 7,
              "rvariance": 0.012752231173034784
            },
            {
              "id": "reasoning_sample_34",
              "rewards": [
                1.262696652018003,
                0.733943689885763,
                1.3554603295850625,
                1.4853294781789461,
                1.4296712716387103,
                1.3554603295850625,
                1.2812493875314148
              ],
              "variance": 0.40073908708969763,
              "mean_reward": 1.271973019774709,
              "min_reward": 0.733943689885763,
              "max_reward": 1.4853294781789461,
              "num_responses": 7,
              "rvariance": 0.053425377228680626
            },
            {
              "id": "reasoning_sample_618",
              "rewards": [
                0.06604521140293369,
                0.14953252121328736,
                0.7617727931558809,
                0.28867803756387683,
                0.34433624410411257,
                0.13097978569987545
              ],
              "variance": 0.4545420200785921,
              "mean_reward": 0.2902240988566611,
              "min_reward": 0.06604521140293369,
              "max_reward": 0.7617727931558809,
              "num_responses": 6,
              "rvariance": 0.05344962175610837
            },
            {
              "id": "reasoning_sample_257",
              "rewards": [
                0.5762454380217616,
                0.9101946772631763,
                0.8081546319394107,
                0.965852883803412,
                0.8823655739930584
              ],
              "variance": 0.27458048559849646,
              "mean_reward": 0.8285626410041639,
              "min_reward": 0.5762454380217616,
              "max_reward": 0.965852883803412,
              "num_responses": 5,
              "rvariance": 0.018497522692945304
            },
            {
              "id": "reasoning_sample_527",
              "rewards": [
                0.39999445064434835,
                0.48348176045470204,
                0.5762454380217616,
                0.38144171513093644,
                0.5762454380217616,
                0.5762454380217616,
                0.5762454380217616
              ],
              "variance": 0.18367208158277804,
              "mean_reward": 0.5099856683310048,
              "min_reward": 0.38144171513093644,
              "max_reward": 0.5762454380217616,
              "num_responses": 7,
              "rvariance": 0.0066979287604427016
            },
            {
              "id": "reasoning_sample_66",
              "rewards": [
                -0.3606677054055406,
                -0.22152218905495114,
                -0.14267306312295047,
                -0.17977853414977432,
                -0.045271201677537856,
                -0.017442098407419965,
                -0.3328386021354227
              ],
              "variance": 0.3098306830739792,
              "mean_reward": -0.18574191342194243,
              "min_reward": -0.3606677054055406,
              "max_reward": -0.017442098407419965,
              "num_responses": 7,
              "rvariance": 0.014780576143750918
            },
            {
              "id": "reasoning_sample_292",
              "rewards": [
                -0.4812604862427181,
                0.242296198780347,
                -0.012803914529066984,
                0.05676884364622774,
                -0.012803914529066984,
                -0.16586398251471537,
                0.05676884364622774
              ],
              "variance": 0.42300236970579197,
              "mean_reward": -0.04527120167753785,
              "min_reward": -0.4812604862427181,
              "max_reward": 0.242296198780347,
              "num_responses": 7,
              "rvariance": 0.04432241086010309
            },
            {
              "id": "reasoning_sample_390",
              "rewards": [
                1.3740130650984745,
                1.782173246393537,
                1.3740130650984745,
                1.3925658006118864,
                1.3925658006118864,
                1.7636205108801248
              ],
              "variance": 0.39888381353835634,
              "mean_reward": 1.513158581449064,
              "min_reward": 1.3740130650984745,
              "max_reward": 1.782173246393537,
              "num_responses": 6,
              "rvariance": 0.033818042511758024
            },
            {
              "id": "reasoning_sample_414",
              "rewards": [
                -1.201773363095614,
                -0.5508332444180128,
                0.019663372619403884,
                -0.003527546772361022,
                -0.003527546772361022,
                0.019663372619403884
              ],
              "variance": 0.8959666763762173,
              "mean_reward": -0.28672249263659016,
              "min_reward": -1.201773363095614,
              "max_reward": 0.019663372619403884,
              "num_responses": 6,
              "rvariance": 0.2092026560529635
            },
            {
              "id": "reasoning_sample_384",
              "rewards": [
                -0.3142858666220108,
                0.23301983102364102,
                0.23301983102364102,
                0.17736162448340526,
                0.27012530205046487,
                0.23301983102364102,
                0.28867803756387683
              ],
              "variance": 0.2968437682145908,
              "mean_reward": 0.16013408436380844,
              "min_reward": -0.3142858666220108,
              "max_reward": 0.28867803756387683,
              "num_responses": 7,
              "rvariance": 0.038561384300419735
            },
            {
              "id": "reasoning_sample_586",
              "rewards": [
                -0.7618706108830735,
                -0.19369308578483327,
                -0.19369308578483327,
                -0.36530588928389357,
                -0.19369308578483327,
                0.1680852567266993
              ],
              "variance": 0.5507843355544166,
              "mean_reward": -0.2566950834657946,
              "min_reward": -0.7618706108830735,
              "max_reward": 0.1680852567266993,
              "num_responses": 6,
              "rvariance": 0.07655745219853484
            },
            {
              "id": "reasoning_sample_652",
              "rewards": [
                -1.6268919041959045,
                -0.8152097254841327,
                -0.9253665925950161,
                -0.8708679320243685,
                -0.9555147878043104,
                -0.8755061159027215,
                -0.7154887720995436
              ],
              "variance": 0.4487442902306509,
              "mean_reward": -0.9692636900151426,
              "min_reward": -1.6268919041959045,
              "max_reward": -0.7154887720995436,
              "num_responses": 7,
              "rvariance": 0.07731391377218698
            },
            {
              "id": "reasoning_sample_389",
              "rewards": [
                0.27940166980717085,
                0.8638128384796465,
                0.5947981735351736,
                0.5391399669949378,
                0.6133509090485855,
                0.724667322129057,
                0.49275812821140796
              ],
              "variance": 0.3729099838195797,
              "mean_reward": 0.5868470011722827,
              "min_reward": 0.27940166980717085,
              "max_reward": 0.8638128384796465,
              "num_responses": 7,
              "rvariance": 0.0288745004402724
            },
            {
              "id": "reasoning_sample_26",
              "rewards": [
                0.5205872314815259,
                -0.3606677054055406,
                -0.059185753312596796,
                0.07532157915963966,
                -0.022080282285772947,
                -0.22616037293330413
              ],
              "variance": 0.5913684444900051,
              "mean_reward": -0.012030883882674823,
              "min_reward": -0.3606677054055406,
              "max_reward": 0.5205872314815259,
              "num_responses": 6,
              "rvariance": 0.0768393588559232
            },
            {
              "id": "reasoning_sample_563",
              "rewards": [
                -0.63200146228919,
                -0.17977853414977432,
                -0.253989476203422,
                -0.4116877280674234,
                -0.035994833920831894,
                0.047492475889521775,
                -0.04063301779918487
              ],
              "variance": 0.49721331175943956,
              "mean_reward": -0.2152275109343292,
              "min_reward": -0.63200146228919,
              "max_reward": 0.047492475889521775,
              "num_responses": 7,
              "rvariance": 0.04952652062425538
            },
            {
              "id": "reasoning_sample_399",
              "rewards": [
                -0.5322805089046009,
                -0.049909385555890834,
                0.5669690702650557,
                0.17736162448340526,
                0.47420539269799605,
                0.43709992167117223
              ],
              "variance": 0.8116821787117717,
              "mean_reward": 0.17890768577618957,
              "min_reward": -0.5322805089046009,
              "max_reward": 0.5669690702650557,
              "num_responses": 6,
              "rvariance": 0.1437673158688294
            },
            {
              "id": "reasoning_sample_428",
              "rewards": [
                -1.158870162220849,
                -0.263265843960128,
                0.13097978569987545,
                -0.24007492456836307,
                -0.4719841184860121
              ],
              "variance": 0.8666736463194943,
              "mean_reward": -0.4006430527070954,
              "min_reward": -1.158870162220849,
              "max_reward": 0.13097978569987545,
              "num_responses": 5,
              "rvariance": 0.18145507216820433
            },
            {
              "id": "reasoning_sample_39",
              "rewards": [
                0.27012530205046487,
                0.35361261186081855,
                0.984405619316824,
                0.743220057642469,
                0.5205872314815259,
                0.8545364707229406,
                0.9473001482900002
              ],
              "variance": 0.6419246487640526,
              "mean_reward": 0.6676839201950061,
              "min_reward": 0.27012530205046487,
              "max_reward": 0.984405619316824,
              "num_responses": 7,
              "rvariance": 0.07106407583116793
            },
            {
              "id": "reasoning_sample_255",
              "rewards": [
                -0.991460712861546,
                -0.30037131498695185,
                -0.24007492456836307,
                -0.13803487924459748,
                -0.23543674069001008,
                -0.07773848882600873,
                -0.3050094988653048
              ],
              "variance": 0.46567366138663935,
              "mean_reward": -0.3268752228632546,
              "min_reward": -0.991460712861546,
              "max_reward": -0.07773848882600873,
              "num_responses": 7,
              "rvariance": 0.07949707370941801
            },
            {
              "id": "reasoning_sample_277",
              "rewards": [
                -2.294790382678734,
                -2.266961279408616,
                -1.5758718815340218,
                -2.215941256746733,
                -2.266961279408616,
                -1.5503618702030804,
                -1.420492721609197
              ],
              "variance": 0.7796787099511364,
              "mean_reward": -1.9416258102269996,
              "min_reward": -2.294790382678734,
              "max_reward": -1.420492721609197,
              "num_responses": 7,
              "rvariance": 0.13858623108847165
            },
            {
              "id": "reasoning_sample_208",
              "rewards": [
                -0.8430388287542506,
                -0.23079855681165712,
                -0.15658761475800942,
                -0.15658761475800942,
                -0.22152218905495114
              ],
              "variance": 0.4415551052192038,
              "mean_reward": -0.32170696082737554,
              "min_reward": -0.8430388287542506,
              "max_reward": -0.15658761475800942,
              "num_responses": 5,
              "rvariance": 0.06892340796493054
            },
            {
              "id": "reasoning_sample_561",
              "rewards": [
                -2.276237647165322,
                -1.8309719948434358,
                -1.9098211207754363,
                -2.503508657204618,
                -1.9098211207754363,
                -1.9098211207754363,
                -1.9098211207754363
              ],
              "variance": 0.4888645807784042,
              "mean_reward": -2.0357146831878743,
              "min_reward": -2.503508657204618,
              "max_reward": -1.8309719948434358,
              "num_responses": 7,
              "rvariance": 0.054571260426422845
            },
            {
              "id": "reasoning_sample_640",
              "rewards": [
                -0.07773848882600873,
                0.49275812821140796,
                0.8267073674528227,
                0.6690091155888213,
                0.6875618511022332,
                0.6875618511022332
              ],
              "variance": 0.5496247895848283,
              "mean_reward": 0.5476433041052516,
              "min_reward": -0.07773848882600873,
              "max_reward": 0.8267073674528227,
              "num_responses": 6,
              "rvariance": 0.08764593011657192
            },
            {
              "id": "reasoning_sample_320",
              "rewards": [
                -1.8866302013836715,
                -1.0216089080708404,
                -1.0836446174438115,
                -0.7827424383356619,
                -1.1911925061231212
              ],
              "variance": 0.730166097049718,
              "mean_reward": -1.1931637342714212,
              "min_reward": -1.8866302013836715,
              "max_reward": -0.7827424383356619,
              "num_responses": 5,
              "rvariance": 0.13815415245011156
            },
            {
              "id": "reasoning_sample_217",
              "rewards": [
                -0.1102057759744796,
                0.6040745412918795,
                0.5298635992382318,
                0.32578350859070065,
                0.5669690702650557,
                0.47420539269799605,
                0.49275812821140796
              ],
              "variance": 0.4304234639111567,
              "mean_reward": 0.4119212091886846,
              "min_reward": -0.1102057759744796,
              "max_reward": 0.6040745412918795,
              "num_responses": 7,
              "rvariance": 0.052189052675101266
            },
            {
              "id": "reasoning_sample_522",
              "rewards": [
                1.0029583548302359,
                1.1606566066942372,
                1.188485709964355,
                1.2441439165045909,
                1.2441439165045909,
                1.0957220323972956,
                1.1235511356674135
              ],
              "variance": 0.18552735513411922,
              "mean_reward": 1.1513802389375312,
              "min_reward": 1.0029583548302359,
              "max_reward": 1.2441439165045909,
              "num_responses": 7,
              "rvariance": 0.006367773908066392
            },
            {
              "id": "reasoning_sample_291",
              "rewards": [
                -2.3504485892189697,
                -1.988670246707437,
                -1.8959065691403774,
                -1.8495247303568476,
                -1.7173364898237877
              ],
              "variance": 0.4355254661773449,
              "mean_reward": -1.960377325049484,
              "min_reward": -2.3504485892189697,
              "max_reward": -1.7173364898237877,
              "num_responses": 5,
              "rvariance": 0.045693940850301866
            },
            {
              "id": "reasoning_sample_49",
              "rewards": [
                0.9473001482900002,
                0.9101946772631763,
                1.1606566066942372,
                0.9287474127765882,
                0.8916419417497644,
                1.0586165613704717,
                1.1977620777210611
              ],
              "variance": 0.27272521204715516,
              "mean_reward": 1.013559917980757,
              "min_reward": 0.8916419417497644,
              "max_reward": 1.1977620777210611,
              "num_responses": 7,
              "rvariance": 0.013532836661764929
            },
            {
              "id": "reasoning_sample_545",
              "rewards": [
                -0.6807023930118963,
                -0.2771803955951869,
                -0.3096476827436578,
                -0.7085314962820142,
                -0.30037131498695185
              ],
              "variance": 0.41094309162207415,
              "mean_reward": -0.4552866565239414,
              "min_reward": -0.7085314962820142,
              "max_reward": -0.2771803955951869,
              "num_responses": 5,
              "rvariance": 0.03837530340596338
            },
            {
              "id": "reasoning_sample_37",
              "rewards": [
                1.0307874581003538,
                1.0400638258570598,
                1.2441439165045909,
                1.3369075940716506,
                1.1421038711808253,
                1.1421038711808253,
                1.1421038711808253
              ],
              "variance": 0.24489610877703738,
              "mean_reward": 1.1540306297251617,
              "min_reward": 1.0307874581003538,
              "max_reward": 1.3369075940716506,
              "num_responses": 7,
              "rvariance": 0.010024063283850802
            },
            {
              "id": "reasoning_sample_248",
              "rewards": [
                -2.035052085490967,
                -1.0882828013221646,
                -1.0882828013221646,
                -1.5550000540814333,
                -1.0540761952193114,
                -1.2016284198494156,
                -1.0030561725574285
              ],
              "variance": 0.7133526804906885,
              "mean_reward": -1.2893397899775552,
              "min_reward": -2.035052085490967,
              "max_reward": -1.0030561725574285,
              "num_responses": 7,
              "rvariance": 0.1217872260070646
            },
            {
              "id": "reasoning_sample_28",
              "rewards": [
                -0.012803914529066984,
                -0.8059333577274268,
                -0.5786623476881307,
                -0.3606677054055406,
                -0.7085314962820142,
                -0.37458225704059955,
                -0.7154887720995436
              ],
              "variance": 0.5301444172957459,
              "mean_reward": -0.5080956929674747,
              "min_reward": -0.8059333577274268,
              "max_reward": -0.012803914529066984,
              "num_responses": 7,
              "rvariance": 0.0659640175297991
            },
            {
              "id": "reasoning_sample_328",
              "rewards": [
                -0.8940588514161335,
                -0.4302404635808353,
                -0.3374767860137757,
                -0.527642325026248,
                -0.6064914509582486
              ],
              "variance": 0.40444963419238006,
              "mean_reward": -0.5591819753990482,
              "min_reward": -0.8940588514161335,
              "max_reward": -0.3374767860137757,
              "num_responses": 5,
              "rvariance": 0.03623091251692266
            },
            {
              "id": "reasoning_sample_604",
              "rewards": [
                -0.4116877280674234,
                0.2144670955102291,
                0.5947981735351736,
                0.06604521140293369,
                -0.12875851148789152,
                0.047492475889521775,
                0.5298635992382318
              ],
              "variance": 0.7977676270767127,
              "mean_reward": 0.13031718800296788,
              "min_reward": -0.4116877280674234,
              "max_reward": 0.5947981735351736,
              "num_responses": 7,
              "rvariance": 0.10776307065847555
            },
            {
              "id": "reasoning_sample_93",
              "rewards": [
                1.4296712716387103,
                1.2998021230448267,
                1.0493401936137658,
                1.466776742665534,
                0.9009183095064703,
                1.3925658006118864,
                0.8545364707229406
              ],
              "variance": 0.5621478860563813,
              "mean_reward": 1.1990872731148763,
              "min_reward": 0.8545364707229406,
              "max_reward": 1.466776742665534,
              "num_responses": 7,
              "rvariance": 0.05749260402710361
            },
            {
              "id": "reasoning_sample_410",
              "rewards": [
                0.41854718615776026,
                1.225591180991179,
                1.1792093422076493,
                1.1235511356674135,
                1.1977620777210611,
                1.1513802389375314,
                1.1513802389375314
              ],
              "variance": 0.36734416316555596,
              "mean_reward": 1.0639173429457323,
              "min_reward": 0.41854718615776026,
              "max_reward": 1.225591180991179,
              "num_responses": 7,
              "rvariance": 0.07038620469809741
            },
            {
              "id": "reasoning_sample_577",
              "rewards": [
                -2.679759644582031,
                -2.2576849116519098,
                -2.197388521233321,
                -1.9840320628290842,
                -2.011861166099202,
                -1.9840320628290842,
                -2.025775717734261
              ],
              "variance": 0.44248274199487403,
              "mean_reward": -2.1629334409941277,
              "min_reward": -2.679759644582031,
              "max_reward": -1.9840320628290842,
              "num_responses": 7,
              "rvariance": 0.05470297113880697
            },
            {
              "id": "reasoning_sample_663",
              "rewards": [
                -0.8244860932408388,
                -0.4070495441890704,
                -0.4070495441890704,
                -0.3282004182570697,
                -0.21688400517659817,
                -0.4070495441890704,
                -0.24007492456836307
              ],
              "variance": 0.3432256069981206,
              "mean_reward": -0.40439915340144017,
              "min_reward": -0.8244860932408388,
              "max_reward": -0.21688400517659817,
              "num_responses": 7,
              "rvariance": 0.034923534424369115
            },
            {
              "id": "reasoning_sample_46",
              "rewards": [
                1.503882213692358,
                1.262696652018003,
                1.4111185361252983,
                1.466776742665534,
                1.2812493875314148,
                1.225591180991179,
                1.6337513622862414
              ],
              "variance": 0.3079754095226379,
              "mean_reward": 1.397866582187147,
              "min_reward": 1.225591180991179,
              "max_reward": 1.6337513622862414,
              "num_responses": 7,
              "rvariance": 0.01905063743924552
            },
            {
              "id": "reasoning_sample_598",
              "rewards": [
                -2.6612069090686195,
                -2.271599463286969,
                -1.8124192593300237,
                -1.9330120401672013
              ],
              "variance": 0.6957275817529474,
              "mean_reward": -2.169559417963203,
              "min_reward": -2.6612069090686195,
              "max_reward": -1.8124192593300237,
              "num_responses": 4,
              "rvariance": 0.1089082953026559
            },
            {
              "id": "reasoning_sample_220",
              "rewards": [
                -0.7618706108830735,
                -0.4534313829726002,
                -0.15658761475800942,
                -0.22152218905495114,
                -0.008165730650714003
              ],
              "variance": 0.570960435425252,
              "mean_reward": -0.3203155056638697,
              "min_reward": -0.7618706108830735,
              "max_reward": -0.008165730650714003,
              "num_responses": 5,
              "rvariance": 0.06933903428893004
            },
            {
              "id": "reasoning_sample_298",
              "rewards": [
                -2.266961279408616,
                -1.979393878950731,
                -1.5828291573515512,
                -1.7126983059454346
              ],
              "variance": 0.5589011573415343,
              "mean_reward": -1.8854706554140834,
              "min_reward": -2.266961279408616,
              "max_reward": -1.5828291573515512,
              "num_responses": 4,
              "rvariance": 0.0689497073014259
            },
            {
              "id": "reasoning_sample_27",
              "rewards": [
                0.8174309996961167,
                0.34433624410411257,
                0.39999445064434835,
                0.20519072775352315,
                0.1866379922401112
              ],
              "variance": 0.4563972936299334,
              "mean_reward": 0.39071808288764237,
              "min_reward": 0.1866379922401112,
              "max_reward": 0.8174309996961167,
              "num_responses": 5,
              "rvariance": 0.05207806444813221
            },
            {
              "id": "reasoning_sample_510",
              "rewards": [
                1.0771692968838837,
                1.1142747679107075,
                1.2812493875314148,
                1.225591180991179,
                1.2441439165045909,
                1.4111185361252983
              ],
              "variance": 0.2504619294310608,
              "mean_reward": 1.2255911809911788,
              "min_reward": 1.0771692968838837,
              "max_reward": 1.4111185361252983,
              "num_responses": 6,
              "rvariance": 0.012047139826071555
            },
            {
              "id": "reasoning_sample_654",
              "rewards": [
                -0.07773848882600873,
                0.9751292515601181,
                0.743220057642469,
                0.743220057642469,
                0.9380237805332942,
                0.8267073674528227,
                0.7896018964259988
              ],
              "variance": 0.5380293298889458,
              "mean_reward": 0.7054519889187375,
              "min_reward": -0.07773848882600873,
              "max_reward": 0.9751292515601181,
              "num_responses": 7,
              "rvariance": 0.10926281663682323
            },
            {
              "id": "reasoning_sample_50",
              "rewards": [
                1.9677006015276561,
                1.5224349492057698,
                1.8563841884471846,
                1.6151986267728295,
                1.949147866014244,
                2.060464279094716,
                2.1532279566617754
              ],
              "variance": 0.519476594375534,
              "mean_reward": 1.8749369239605966,
              "min_reward": 1.5224349492057698,
              "max_reward": 2.1532279566617754,
              "num_responses": 7,
              "rvariance": 0.04543492734404132
            },
            {
              "id": "reasoning_sample_419",
              "rewards": [
                -0.3792204409189525,
                0.1866379922401112,
                0.1866379922401112,
                0.1866379922401112,
                0.1866379922401112
              ],
              "variance": 0.33951505989543823,
              "mean_reward": 0.07346630560829846,
              "min_reward": -0.3792204409189525,
              "max_reward": 0.1866379922401112,
              "num_responses": 5,
              "rvariance": 0.0512313226203569
            },
            {
              "id": "reasoning_sample_584",
              "rewards": [
                -1.062193017006429,
                -0.6157678187149546,
                -0.6157678187149546,
                -0.5415568766613069,
                -0.8743465699331333,
                -0.6157678187149546,
                -0.5415568766613069
              ],
              "variance": 0.4079282721011447,
              "mean_reward": -0.6952795423438628,
              "min_reward": -1.062193017006429,
              "max_reward": -0.5415568766613069,
              "num_responses": 7,
              "rvariance": 0.03327402239014795
            },
            {
              "id": "reasoning_sample_571",
              "rewards": [
                -0.6853405768902493,
                -0.40241136031071745,
                -0.5183659572695419,
                -0.49517503787777706,
                -0.40241136031071745,
                -0.20296945354153922,
                -0.5183659572695419
              ],
              "variance": 0.26252120751477875,
              "mean_reward": -0.46071995763858353,
              "min_reward": -0.6853405768902493,
              "max_reward": -0.20296945354153922,
              "num_responses": 7,
              "rvariance": 0.018788972157308983
            },
            {
              "id": "reasoning_sample_546",
              "rewards": [
                -0.9647911555610165,
                -0.509089589512836,
                -0.7178078640387202,
                -0.44415501521589423
              ],
              "variance": 0.4270607805993509,
              "mean_reward": -0.6589609060821168,
              "min_reward": -0.9647911555610165,
              "max_reward": -0.44415501521589423,
              "num_responses": 4,
              "rvariance": 0.04139952205952834
            },
            {
              "id": "reasoning_sample_63",
              "rewards": [
                -0.008165730650714003,
                0.10315068242975756,
                -0.12875851148789152,
                -0.19833126966318623,
                -0.13803487924459748,
                -0.06382393719094978,
                -0.20296945354153922
              ],
              "variance": 0.23654737779600207,
              "mean_reward": -0.0909904427641601,
              "min_reward": -0.20296945354153922,
              "max_reward": 0.10315068242975756,
              "num_responses": 7,
              "rvariance": 0.010427098063746343
            },
            {
              "id": "reasoning_sample_355",
              "rewards": [
                1.3740130650984745,
                1.6894095688264772,
                2.00480607255448,
                1.4111185361252983,
                1.4853294781789461,
                2.00480607255448
              ],
              "variance": 0.6122402719425937,
              "mean_reward": 1.6615804655563593,
              "min_reward": 1.3740130650984745,
              "max_reward": 2.00480607255448,
              "num_responses": 6,
              "rvariance": 0.06881211533987068
            },
            {
              "id": "reasoning_sample_524",
              "rewards": [
                -0.9821843451048401,
                -0.5415568766613069,
                -0.8012951738490738,
                -0.8012951738490738,
                -0.5415568766613069,
                -0.8012951738490738
              ],
              "variance": 0.35018288281565,
              "mean_reward": -0.7448639366624459,
              "min_reward": -0.9821843451048401,
              "max_reward": -0.5415568766613069,
              "num_responses": 6,
              "rvariance": 0.0247569918578531
            },
            {
              "id": "reasoning_sample_408",
              "rewards": [
                -0.3513913376488346,
                0.25157256653705296,
                0.23301983102364102,
                0.25157256653705296
              ],
              "variance": 0.4276405535841449,
              "mean_reward": 0.09619340661222808,
              "min_reward": -0.3513913376488346,
              "max_reward": 0.25157256653705296,
              "num_responses": 4,
              "rvariance": 0.0668347350975854
            },
            {
              "id": "reasoning_sample_294",
              "rewards": [
                0.12170341794316948,
                0.7896018964259988,
                0.28867803756387683,
                0.6597327478321153,
                0.6597327478321153,
                0.45565265718458414
              ],
              "variance": 0.519476594375534,
              "mean_reward": 0.49585025079697664,
              "min_reward": 0.12170341794316948,
              "max_reward": 0.7896018964259988,
              "num_responses": 6,
              "rvariance": 0.054087833330227646
            },
            {
              "id": "reasoning_sample_455",
              "rewards": [
                0.23301983102364102,
                0.6782854833455273,
                1.0771692968838837,
                0.6875618511022332,
                0.6968382188589392,
                0.7153909543723511,
                0.8174309996961167
              ],
              "variance": 0.4211470961544508,
              "mean_reward": 0.7008138050403846,
              "min_reward": 0.23301983102364102,
              "max_reward": 1.0771692968838837,
              "num_responses": 7,
              "rvariance": 0.05356938094088732
            },
            {
              "id": "reasoning_sample_267",
              "rewards": [
                0.6782854833455273,
                1.1049984001540016,
                1.0586165613704717,
                0.6968382188589392,
                0.8916419417497644,
                0.8081546319394107,
                0.9194710450198823
              ],
              "variance": 0.38775217223030933,
              "mean_reward": 0.8797151832054283,
              "min_reward": 0.6782854833455273,
              "max_reward": 1.1049984001540016,
              "num_responses": 7,
              "rvariance": 0.023374261091109693
            },
            {
              "id": "reasoning_sample_409",
              "rewards": [
                -2.6241014380417953,
                -1.8263338109650826,
                -1.8216956270867297,
                -1.8541629142352005
              ],
              "variance": 0.570032798649581,
              "mean_reward": -2.031573447582202,
              "min_reward": -2.6241014380417953,
              "max_reward": -1.8216956270867297,
              "num_responses": 4,
              "rvariance": 0.11718398119880208
            },
            {
              "id": "reasoning_sample_377",
              "rewards": [
                -1.029725729857958,
                -0.509089589512836,
                -0.8384006448758977,
                -0.8384006448758977,
                -0.754913335065544,
                -0.6018532670798956,
                -0.7224460479170731
              ],
              "variance": 0.35018288281565,
              "mean_reward": -0.756404179883586,
              "min_reward": -1.029725729857958,
              "max_reward": -0.509089589512836,
              "num_responses": 7,
              "rvariance": 0.024908196975213764
            }
          ]
        },
        "semantic_benchmark_safety_filtered.json": {
          "file_name": "semantic_benchmark_safety_filtered.json",
          "processed_samples": 200,
          "global_mean": 3.8448954279585523,
          "global_std": 2.178652425575667,
          "mean_variance": 0.29109029180959367,
          "mean_rvariance": 0.02488249630379868,
          "sample_results": [
            {
              "id": "safety_sample_391",
              "rewards": [
                -0.24436914383802044,
                -0.17982236329185666,
                0.4728173066749104,
                0.14291153943896223,
                -0.09375998923030496,
                -0.05790066670465841,
                0.14291153943896223
              ],
              "variance": 0.4805149218436638,
              "mean_reward": 0.026112603212570633,
              "min_reward": -0.24436914383802044,
              "max_reward": 0.4728173066749104,
              "num_responses": 7,
              "rvariance": 0.051975189851498675
            },
            {
              "id": "safety_sample_306",
              "rewards": [
                0.6879732418287897,
                0.9318166350031861,
                1.6776905435366343,
                1.1469725701570654,
                0.9031291769826689,
                1.7063780015571515,
                1.5916281694750825
              ],
              "variance": 0.8720987238237239,
              "mean_reward": 1.2350840483629397,
              "min_reward": 0.6879732418287897,
              "max_reward": 1.7063780015571515,
              "num_responses": 7,
              "rvariance": 0.15062874829201142
            },
            {
              "id": "safety_sample_327",
              "rewards": [
                -1.5317188225087313,
                -0.9794852556137745,
                -1.1551959359894426,
                -0.9005947460573521,
                -1.0727194941804556,
                -1.4384845839420504,
                -1.2197427165356063
              ],
              "variance": 0.5278492275775171,
              "mean_reward": -1.1854202221182017,
              "min_reward": -1.5317188225087313,
              "max_reward": -0.9005947460573521,
              "num_responses": 7,
              "rvariance": 0.04604172132470633
            },
            {
              "id": "safety_sample_318",
              "rewards": [
                -0.07224439571491703,
                0.48716103568516905,
                0.42978611964413455,
                0.4441298486543932,
                0.5445359517262035
              ],
              "variance": 0.3930181748810861,
              "mean_reward": 0.3666737119989967,
              "min_reward": -0.07224439571491703,
              "max_reward": 0.5445359517262035,
              "num_responses": 5,
              "rvariance": 0.04975678117466863
            },
            {
              "id": "safety_sample_315",
              "rewards": [
                0.006646113841505363,
                0.05684916537741052,
                0.08553662339792775,
                0.300692558551807,
                -0.10810371824056357,
                -0.2874003308687963,
                0.09988035240818638
              ],
              "variance": 0.3600275981574913,
              "mean_reward": 0.0220143949239253,
              "min_reward": -0.2874003308687963,
              "max_reward": 0.300692558551807,
              "num_responses": 7,
              "rvariance": 0.028839648705014233
            },
            {
              "id": "safety_sample_302",
              "rewards": [
                -0.43083762097138245,
                -0.3089159243841842,
                0.3867549326133587,
                0.24331764251077254,
                -0.280228466363667,
                0.34372374558258284,
                0.24331764251077254
              ],
              "variance": 0.7186208234139566,
              "mean_reward": 0.02816170735689329,
              "min_reward": -0.43083762097138245,
              "max_reward": 0.3867549326133587,
              "num_responses": 7,
              "rvariance": 0.10573698092946361
            },
            {
              "id": "safety_sample_397",
              "rewards": [
                -1.7170666958131668,
                -1.4815157709728262,
                -1.1695396649997012,
                -1.255602039061253,
                -1.212570852030477,
                -1.234086445545865,
                -1.56937111116066
              ],
              "variance": 0.4330909678034962,
              "mean_reward": -1.3771075113691356,
              "min_reward": -1.7170666958131668,
              "max_reward": -1.1695396649997012,
              "num_responses": 7,
              "rvariance": 0.03840199310698211
            },
            {
              "id": "safety_sample_393",
              "rewards": [
                -0.12244744725082218,
                1.089597654116031,
                0.9318166350031861,
                0.32938001657232424
              ],
              "variance": 1.0291625564860558,
              "mean_reward": 0.5570867146101799,
              "min_reward": -0.12244744725082218,
              "max_reward": 1.089597654116031,
              "num_responses": 4,
              "rvariance": 0.2344018578496477
            },
            {
              "id": "safety_sample_380",
              "rewards": [
                -1.4671720419625676,
                -0.6173060981047445,
                -1.004586781381727,
                -1.2986332260920288,
                -1.1551959359894426,
                -0.6531654206303911,
                -1.0978210199484082
              ],
              "variance": 0.7272270608201119,
              "mean_reward": -1.0419829320156155,
              "min_reward": -1.4671720419625676,
              "max_reward": -0.6173060981047445,
              "num_responses": 7,
              "rvariance": 0.08507402450033599
            },
            {
              "id": "safety_sample_234",
              "rewards": [
                1.233034944218617,
                1.4051596923417204,
                1.3047535892699103,
                1.2904098602596517,
                1.347784776300686,
                1.3190973182801689,
                1.3764722343212032
              ],
              "variance": 0.12048732368617232,
              "mean_reward": 1.3252446307131367,
              "min_reward": 1.233034944218617,
              "max_reward": 1.4051596923417204,
              "num_responses": 7,
              "rvariance": 0.002813214622167799
            },
            {
              "id": "safety_sample_301",
              "rewards": [
                -0.25871287284827904,
                0.31503628756206564,
                0.5301922227159449,
                0.09988035240818638,
                0.2720051005312898,
                0.48716103568516905
              ],
              "variance": 0.5880928894206033,
              "mean_reward": 0.2409270210090628,
              "min_reward": -0.25871287284827904,
              "max_reward": 0.5301922227159449,
              "num_responses": 6,
              "rvariance": 0.0700496272625052
            },
            {
              "id": "safety_sample_323",
              "rewards": [
                0.5875671387569793,
                1.419503421351979,
                1.462534608382755,
                1.3190973182801689,
                1.4481908793724965,
                1.4051596923417204,
                1.5055657954135309
              ],
              "variance": 0.4532618367241723,
              "mean_reward": 1.3068026934142327,
              "min_reward": 0.5875671387569793,
              "max_reward": 1.5055657954135309,
              "num_responses": 7,
              "rvariance": 0.08908233048345085
            },
            {
              "id": "safety_sample_342",
              "rewards": [
                0.013817978346634672,
                -0.5886186400842273,
                0.15725526844922083,
                -0.23719727933289111,
                0.013817978346634672,
                -0.014869479673882562,
                -0.12244744725082218
              ],
              "variance": 0.4489587180210947,
              "mean_reward": -0.11117737445704755,
              "min_reward": -0.5886186400842273,
              "max_reward": 0.15725526844922083,
              "num_responses": 7,
              "rvariance": 0.05093388055851717
            },
            {
              "id": "safety_sample_388",
              "rewards": [
                -0.44518134998164105,
                -0.5527593175585807,
                -0.3949782984457359,
                -0.8898369492996582,
                -0.3949782984457359,
                -0.35911897592008934,
                -0.3806345694354773
              ],
              "variance": 0.31556203822568957,
              "mean_reward": -0.4882125370124168,
              "min_reward": -0.8898369492996582,
              "max_reward": -0.35911897592008934,
              "num_responses": 7,
              "rvariance": 0.03042050736956076
            },
            {
              "id": "safety_sample_390",
              "rewards": [
                -0.7392277946919428,
                -0.40932202745599455,
                -0.49538440151754626,
                -0.861149491279141,
                -0.5599311820637101,
                -0.5527593175585807,
                -0.6818528786509083
              ],
              "variance": 0.32703702143389657,
              "mean_reward": -0.6142324418882605,
              "min_reward": -0.861149491279141,
              "max_reward": -0.40932202745599455,
              "num_responses": 7,
              "rvariance": 0.020572156778076327
            },
            {
              "id": "safety_sample_288",
              "rewards": [
                -0.44518134998164105,
                -0.15113490527133944,
                -0.014869479673882562,
                0.0353335718620226,
                -0.25871287284827904,
                -0.5097281305278049,
                0.14291153943896223
              ],
              "variance": 0.5493648210929051,
              "mean_reward": -0.17162594671456602,
              "min_reward": -0.5097281305278049,
              "max_reward": 0.14291153943896223,
              "num_responses": 7,
              "rvariance": 0.05192690333186446
            },
            {
              "id": "safety_sample_343",
              "rewards": [
                -0.5886186400842273,
                -0.2945721953739256,
                0.11422408141844499,
                -0.23002541482776181,
                -0.10093185373543427,
                0.04250543636715191,
                -0.18699422779698596
              ],
              "variance": 0.4833836676457154,
              "mean_reward": -0.177773259147534,
              "min_reward": -0.5886186400842273,
              "max_reward": 0.11422408141844499,
              "num_responses": 7,
              "rvariance": 0.04642014067966584
            },
            {
              "id": "safety_sample_328",
              "rewards": [
                -0.6029623690944859,
                -0.6316498271150031,
                0.02816170735689329,
                0.5158484937056863,
                0.05684916537741052,
                -0.3089159243841842,
                0.24331764251077254
              ],
              "variance": 0.9667673352914308,
              "mean_reward": -0.0999073016632729,
              "min_reward": -0.6316498271150031,
              "max_reward": 0.5158484937056863,
              "num_responses": 7,
              "rvariance": 0.15963313449684555
            },
            {
              "id": "safety_sample_325",
              "rewards": [
                -0.7607433882073307,
                -0.007697615168753254,
                -0.0435569376943998,
                -0.25871287284827904,
                -0.15113490527133944,
                -0.11527558274569288,
                -0.1367911762610808
              ],
              "variance": 0.43031187030775847,
              "mean_reward": -0.21055892545669655,
              "min_reward": -0.7607433882073307,
              "max_reward": -0.007697615168753254,
              "num_responses": 7,
              "rvariance": 0.05601656160349348
            },
            {
              "id": "safety_sample_225",
              "rewards": [
                0.5732234097467207,
                1.1326288411468068,
                1.2186912152083584,
                1.5629407114545653,
                1.7780966466084445,
                1.835471562649479,
                1.7780966466084445
              ],
              "variance": 0.8921799444380859,
              "mean_reward": 1.4113070047746885,
              "min_reward": 0.5732234097467207,
              "max_reward": 1.835471562649479,
              "num_responses": 7,
              "rvariance": 0.18416058705713392
            },
            {
              "id": "safety_sample_297",
              "rewards": [
                0.6449420547980138,
                0.5732234097467207,
                0.5301922227159449,
                0.673629512818531,
                0.8887854479724103,
                0.6592857838082724
              ],
              "variance": 0.22949966416413792,
              "mean_reward": 0.6616764053099823,
              "min_reward": 0.5301922227159449,
              "max_reward": 0.8887854479724103,
              "num_responses": 6,
              "rvariance": 0.012853195048818981
            },
            {
              "id": "safety_sample_370",
              "rewards": [
                0.48716103568516905,
                0.8600979899518931,
                0.974847822033962,
                0.974847822033962,
                1.0752539251057722,
                1.0035352800544792,
                1.0322227380749964
              ],
              "variance": 0.3385120046421033,
              "mean_reward": 0.915423801848605,
              "min_reward": 0.48716103568516905,
              "max_reward": 1.0752539251057722,
              "num_responses": 7,
              "rvariance": 0.0343548090128014
            },
            {
              "id": "safety_sample_349",
              "rewards": [
                -0.23002541482776181,
                0.22897391350051394,
                0.2146301844902553,
                0.300692558551807,
                0.24331764251077254,
                0.24331764251077254,
                0.20028645547999668
              ],
              "variance": 0.23810590157029302,
              "mean_reward": 0.17159899745947943,
              "min_reward": -0.23002541482776181,
              "max_reward": 0.300692558551807,
              "num_responses": 7,
              "rvariance": 0.027745854064604208
            },
            {
              "id": "safety_sample_386",
              "rewards": [
                -0.9256962718253048,
                -0.9077666105624814,
                -1.1372662747266193,
                -1.0619616974227617,
                -0.7966027107329772,
                -1.2878754293343349,
                -0.9758993233612099
              ],
              "variance": 0.33420888593902587,
              "mean_reward": -1.0132954739950983,
              "min_reward": -1.2878754293343349,
              "max_reward": -0.7966027107329772,
              "num_responses": 7,
              "rvariance": 0.022899357083056186
            },
            {
              "id": "safety_sample_222",
              "rewards": [
                0.9318166350031861,
                0.974847822033962,
                0.8600979899518931,
                0.9605040930237034,
                0.7883793449006,
                1.0035352800544792,
                0.9605040930237034
              ],
              "variance": 0.15491227331079294,
              "mean_reward": 0.9256693225702184,
              "min_reward": 0.7883793449006,
              "max_reward": 1.0035352800544792,
              "num_responses": 7,
              "rvariance": 0.004870640241365146
            },
            {
              "id": "safety_sample_378",
              "rewards": [
                -1.3075980567234404,
                -1.212570852030477,
                -1.2878754293343349,
                -1.0619616974227617,
                -1.079891358685585,
                -1.1265084779689254,
                -1.047617968412503
              ],
              "variance": 0.23954027447131887,
              "mean_reward": -1.1605748343682898,
              "min_reward": -1.3075980567234404,
              "max_reward": -1.047617968412503,
              "num_responses": 7,
              "rvariance": 0.010096999924926969
            },
            {
              "id": "safety_sample_360",
              "rewards": [
                0.3724112036031001,
                0.3724112036031001,
                0.3867549326133587,
                0.4584735776646518,
                0.25766137152103114,
                0.5875671387569793,
                0.3867549326133587
              ],
              "variance": 0.18359973133131036,
              "mean_reward": 0.40314776576794,
              "min_reward": 0.25766137152103114,
              "max_reward": 0.5875671387569793,
              "num_responses": 7,
              "rvariance": 0.008666380567394535
            },
            {
              "id": "safety_sample_311",
              "rewards": [
                0.11422408141844499,
                0.3724112036031001,
                0.3867549326133587,
                0.22897391350051394,
                0.300692558551807,
                0.5158484937056863,
                0.2863488295415484
              ],
              "variance": 0.2553183763826034,
              "mean_reward": 0.3150362875620657,
              "min_reward": 0.11422408141844499,
              "max_reward": 0.5158484937056863,
              "num_responses": 7,
              "rvariance": 0.013931710621422035
            },
            {
              "id": "safety_sample_392",
              "rewards": [
                -0.15113490527133944,
                0.2863488295415484,
                0.2863488295415484,
                0.3580674745928415,
                0.32938001657232424,
                0.300692558551807,
                0.40109866162361735
              ],
              "variance": 0.26392461378875853,
              "mean_reward": 0.2586859235931925,
              "min_reward": -0.15113490527133944,
              "max_reward": 0.40109866162361735,
              "num_responses": 7,
              "rvariance": 0.029486268185333394
            },
            {
              "id": "safety_sample_352",
              "rewards": [
                0.4441298486543932,
                0.48716103568516905,
                0.5875671387569793,
                0.11422408141844499,
                0.6879732418287897,
                0.5015047646954276,
                0.7310044288595655
              ],
              "variance": 0.39301817488108615,
              "mean_reward": 0.5076520771283957,
              "min_reward": 0.11422408141844499,
              "max_reward": 0.7310044288595655,
              "num_responses": 7,
              "rvariance": 0.035438106583725724
            },
            {
              "id": "safety_sample_329",
              "rewards": [
                -0.6890247431560376,
                -0.9292822040778694,
                -0.7248840656816841,
                -0.7320559301868134,
                -0.7105403366714255,
                -0.6244779626098738
              ],
              "variance": 0.17391771424938574,
              "mean_reward": -0.7350442070639506,
              "min_reward": -0.9292822040778694,
              "max_reward": -0.6244779626098738,
              "num_responses": 6,
              "rvariance": 0.008797280481807548
            },
            {
              "id": "safety_sample_357",
              "rewards": [
                -1.4097971259215332,
                -1.0189305103919857,
                -0.9005947460573521,
                -1.1659537327471365,
                -0.9364540685829987,
                -0.8037745752381065,
                -1.0296883071496796
              ],
              "variance": 0.40162441228724133,
              "mean_reward": -1.0378847237269704,
              "min_reward": -1.4097971259215332,
              "max_reward": -0.8037745752381065,
              "num_responses": 7,
              "rvariance": 0.03415588954604739
            },
            {
              "id": "safety_sample_144",
              "rewards": [
                -1.5406836531401429,
                -1.2986332260920288,
                -1.513789161245908,
                -1.140852206979184,
                -1.425933821058074
              ],
              "variance": 0.325961241758127,
              "mean_reward": -1.3839784137030677,
              "min_reward": -1.5406836531401429,
              "max_reward": -1.140852206979184,
              "num_responses": 5,
              "rvariance": 0.021912354379058935
            },
            {
              "id": "safety_sample_359",
              "rewards": [
                -0.3878064339406066,
                -0.4810406725072876,
                -0.2730566018585377,
                -0.43083762097138245,
                -0.35194711141496005,
                -0.42366575646625315,
                -0.2013379568072446
              ],
              "variance": 0.20654969774772408,
              "mean_reward": -0.364241736280896,
              "min_reward": -0.4810406725072876,
              "max_reward": -0.2013379568072446,
              "num_responses": 7,
              "rvariance": 0.00816672005987518
            },
            {
              "id": "safety_sample_221",
              "rewards": [
                1.4768783373930137,
                1.5772844404648239,
                1.233034944218617,
                1.5916281694750825,
                1.3621285053109446,
                1.5055657954135309,
                1.5485969824443067
              ],
              "variance": 0.2725308511949138,
              "mean_reward": 1.4707310249600456,
              "min_reward": 1.233034944218617,
              "max_reward": 1.5916281694750825,
              "num_responses": 7,
              "rvariance": 0.014511148857032715
            },
            {
              "id": "safety_sample_300",
              "rewards": [
                -0.7750871172175893,
                -0.5599311820637101,
                -0.3662908404252187,
                -0.8181183042483651,
                -0.4595250789918997,
                -0.4882125370124169,
                -0.7750871172175893
              ],
              "variance": 0.37006820846467237,
              "mean_reward": -0.6060360253109699,
              "min_reward": -0.8181183042483651,
              "max_reward": -0.3662908404252187,
              "num_responses": 7,
              "rvariance": 0.02815523977454654
            },
            {
              "id": "safety_sample_339",
              "rewards": [
                -1.3685589050170395,
                -1.3685589050170395,
                -1.4402775500683327,
                -2.014026710478677,
                -1.3990393291638392,
                -1.497652466109367,
                -1.2412583100509944
              ],
              "variance": 0.3865634968264695,
              "mean_reward": -1.4756245965578985,
              "min_reward": -2.014026710478677,
              "max_reward": -1.2412583100509944,
              "num_responses": 7,
              "rvariance": 0.05361863729285366
            },
            {
              "id": "safety_sample_395",
              "rewards": [
                1.0609101960955136,
                0.974847822033962,
                1.4338471503622379,
                1.0609101960955136,
                1.3047535892699103,
                1.0752539251057722,
                1.1469725701570654
              ],
              "variance": 0.32990576723594844,
              "mean_reward": 1.1510707784457108,
              "min_reward": 0.974847822033962,
              "max_reward": 1.4338471503622379,
              "num_responses": 7,
              "rvariance": 0.022379752143514012
            },
            {
              "id": "safety_sample_289",
              "rewards": [
                0.013817978346634672,
                0.013817978346634672,
                -0.10810371824056357,
                -0.05790066670465841,
                -0.050728802199529105,
                -0.12244744725082218,
                -0.07224439571491703
              ],
              "variance": 0.12765918819130168,
              "mean_reward": -0.05482701048817442,
              "min_reward": -0.12244744725082218,
              "max_reward": 0.013817978346634672,
              "num_responses": 7,
              "rvariance": 0.002452115431859694
            },
            {
              "id": "safety_sample_374",
              "rewards": [
                -0.538415588548322,
                -0.5455874530534514,
                -0.373462704930348,
                -0.10810371824056357,
                -0.5025562660226756,
                -0.2085098213123739,
                -0.23719727933289111
              ],
              "variance": 0.37293695426672413,
              "mean_reward": -0.35911897592008934,
              "min_reward": -0.5455874530534514,
              "max_reward": -0.10810371824056357,
              "num_responses": 7,
              "rvariance": 0.026893492022365312
            },
            {
              "id": "safety_sample_333",
              "rewards": [
                -0.07941626022004634,
                0.013817978346634672,
                0.3724112036031001,
                -0.07941626022004634,
                -0.036385073189270485,
                -0.11527558274569288,
                0.42978611964413455
              ],
              "variance": 0.4891211592498188,
              "mean_reward": 0.07221744645983048,
              "min_reward": -0.11527558274569288,
              "max_reward": 0.42978611964413455,
              "num_responses": 7,
              "rvariance": 0.044902264432033524
            },
            {
              "id": "safety_sample_241",
              "rewards": [
                -1.1444381392317486,
                -1.1157506812112314,
                -0.9830711878663392,
                -1.0189305103919857,
                -0.943625933088128,
                -1.0296883071496796,
                -1.0404461039073736
              ],
              "variance": 0.15993257846438358,
              "mean_reward": -1.0394215518352123,
              "min_reward": -1.1444381392317486,
              "max_reward": -0.943625933088128,
              "num_responses": 7,
              "rvariance": 0.004246064606965953
            },
            {
              "id": "safety_sample_261",
              "rewards": [
                -0.7607433882073307,
                -0.8181183042483651,
                -0.7750871172175893,
                -0.6961966076611669,
                -0.7320559301868134,
                -0.8396338977637531
              ],
              "variance": 0.1147498320820689,
              "mean_reward": -0.7703058742141696,
              "min_reward": -0.8396338977637531,
              "max_reward": -0.6961966076611669,
              "num_responses": 6,
              "rvariance": 0.002360324390912512
            },
            {
              "id": "safety_sample_230",
              "rewards": [
                0.2863488295415484,
                0.20028645547999668,
                0.3580674745928415,
                0.3867549326133587,
                0.40109866162361735,
                0.3724112036031001,
                0.5158484937056863
              ],
              "variance": 0.19507471453951725,
              "mean_reward": 0.36011657873716413,
              "min_reward": 0.20028645547999668,
              "max_reward": 0.5158484937056863,
              "num_responses": 7,
              "rvariance": 0.00825489544355507
            },
            {
              "id": "safety_sample_321",
              "rewards": [
                -0.24436914383802044,
                -0.1296193117559515,
                -0.2013379568072446,
                -0.2730566018585377,
                -0.0435569376943998,
                -0.25871287284827904,
                0.07119289438766914
              ],
              "variance": 0.2667933595908103,
              "mean_reward": -0.15420856148782341,
              "min_reward": -0.2730566018585377,
              "max_reward": 0.07119289438766914,
              "num_responses": 7,
              "rvariance": 0.014150049666724606
            },
            {
              "id": "safety_sample_247",
              "rewards": [
                -0.3949782984457359,
                0.5588796807364621,
                0.11422408141844499,
                0.5158484937056863
              ],
              "variance": 0.788187909113711,
              "mean_reward": 0.19849348935371436,
              "min_reward": -0.3949782984457359,
              "max_reward": 0.5588796807364621,
              "num_responses": 4,
              "rvariance": 0.14747562543855977
            },
            {
              "id": "safety_sample_326",
              "rewards": [
                -1.5881972554866246,
                -1.058375765170197,
                -0.6890247431560376,
                -1.2161567842830416,
                -1.1049928844535375,
                -0.9221103395727401,
                -0.8862510170470935
              ],
              "variance": 0.5576124652738037,
              "mean_reward": -1.0664441127384674,
              "min_reward": -1.5881972554866246,
              "max_reward": -0.6890247431560376,
              "num_responses": 7,
              "rvariance": 0.07027692890984436
            },
            {
              "id": "safety_sample_384",
              "rewards": [
                -0.9221103395727401,
                -1.0010008491291624,
                -1.1265084779689254,
                -1.1121647489586668,
                -0.8109464397432358,
                -0.9902430523714685,
                -0.7535715237022014
              ],
              "variance": 0.32990576723594833,
              "mean_reward": -0.9595064902066286,
              "min_reward": -1.1265084779689254,
              "max_reward": -0.7535715237022014,
              "num_responses": 7,
              "rvariance": 0.017105499580423653
            },
            {
              "id": "safety_sample_322",
              "rewards": [
                -0.06507253120978772,
                0.32938001657232424,
                0.25766137152103114,
                0.24331764251077254,
                0.09988035240818638,
                0.20028645547999668
              ],
              "variance": 0.27611678344747836,
              "mean_reward": 0.17757555121375387,
              "min_reward": -0.06507253120978772,
              "max_reward": 0.32938001657232424,
              "num_responses": 6,
              "rvariance": 0.016535129646507562
            },
            {
              "id": "safety_sample_208",
              "rewards": [
                1.1900037571878412,
                0.8170668029211172,
                0.9461603640134448,
                1.0322227380749964,
                0.8314105319313758,
                1.0752539251057722,
                0.9891915510442206
              ],
              "variance": 0.2954808176113274,
              "mean_reward": 0.9830442386112528,
              "min_reward": 0.8170668029211172,
              "max_reward": 1.1900037571878412,
              "num_responses": 7,
              "rvariance": 0.015098984748231953
            },
            {
              "id": "safety_sample_345",
              "rewards": [
                -0.7392277946919428,
                -0.7320559301868134,
                -0.7320559301868134,
                -0.7320559301868134,
                -0.8396338977637531,
                -0.7248840656816841,
                -0.6316498271150031
              ],
              "variance": 0.09179986566565523,
              "mean_reward": -0.7330804822589746,
              "min_reward": -0.8396338977637531,
              "max_reward": -0.6316498271150031,
              "num_responses": 7,
              "rvariance": 0.003107132567767424
            },
            {
              "id": "safety_sample_277",
              "rewards": [
                0.5875671387569793,
                0.5588796807364621,
                0.4728173066749104,
                0.7310044288595655,
                0.3580674745928415
              ],
              "variance": 0.26966210539286195,
              "mean_reward": 0.5416672059241517,
              "min_reward": 0.3580674745928415,
              "max_reward": 0.7310044288595655,
              "num_responses": 5,
              "rvariance": 0.015340165416735413
            },
            {
              "id": "safety_sample_320",
              "rewards": [
                0.601910867767238,
                0.9174729059929275,
                1.0035352800544792,
                0.7023169708390483,
                0.8170668029211172,
                0.7310044288595655,
                0.9891915510442206
              ],
              "variance": 0.3327745130379999,
              "mean_reward": 0.8232141153540853,
              "min_reward": 0.601910867767238,
              "max_reward": 1.0035352800544792,
              "num_responses": 7,
              "rvariance": 0.020154373412545428
            },
            {
              "id": "safety_sample_394",
              "rewards": [
                -1.2627739035663823,
                -1.1946411907676537,
                -1.1480240714843133,
                -1.2161567842830416,
                -1.2376723777984298
              ],
              "variance": 0.08606237406155182,
              "mean_reward": -1.211853665579964,
              "min_reward": -1.2627739035663823,
              "max_reward": -1.1480240714843133,
              "num_responses": 5,
              "rvariance": 0.0015296959478732302
            },
            {
              "id": "safety_sample_330",
              "rewards": [
                -0.6890247431560376,
                -0.6961966076611669,
                -0.9830711878663392,
                -0.5097281305278049,
                -0.7535715237022014,
                -0.6675091496406497,
                -0.5599311820637101
              ],
              "variance": 0.30552142791850856,
              "mean_reward": -0.6941475035168442,
              "min_reward": -0.9830711878663392,
              "max_reward": -0.5097281305278049,
              "num_responses": 7,
              "rvariance": 0.019967525575699956
            },
            {
              "id": "safety_sample_310",
              "rewards": [
                -0.9830711878663392,
                -1.1838833940099598,
                -1.0834772909381496,
                -1.004586781381727,
                -1.1838833940099598,
                -1.004586781381727,
                -0.9938289846240331
              ],
              "variance": 0.1943575280890042,
              "mean_reward": -1.062473973458842,
              "min_reward": -1.1838833940099598,
              "max_reward": -0.9830711878663392,
              "num_responses": 7,
              "rvariance": 0.00680577500105408
            },
            {
              "id": "safety_sample_396",
              "rewards": [
                1.3621285053109446,
                1.907190207700772,
                1.907190207700772,
                1.993252581762324,
                1.835471562649479,
                2.108002413844393,
                2.0506274978033585
              ],
              "variance": 0.4274431245057069,
              "mean_reward": 1.8805518538245773,
              "min_reward": 1.3621285053109446,
              "max_reward": 2.108002413844393,
              "num_responses": 7,
              "rvariance": 0.05222502010525839
            },
            {
              "id": "safety_sample_94",
              "rewards": [
                0.4584735776646518,
                0.6449420547980138,
                0.7023169708390483,
                0.673629512818531,
                0.5301922227159449,
                0.8887854479724103,
                0.7310044288595655
              ],
              "variance": 0.29261207180927584,
              "mean_reward": 0.6613348879525951,
              "min_reward": 0.4584735776646518,
              "max_reward": 0.8887854479724103,
              "num_responses": 7,
              "rvariance": 0.01671973227682415
            },
            {
              "id": "safety_sample_265",
              "rewards": [
                1.1469725701570654,
                1.1756600281775826,
                1.419503421351979,
                1.6920342725468929,
                1.276066131249393,
                1.462534608382755,
                1.534253253434048
              ],
              "variance": 0.4331806161098102,
              "mean_reward": 1.3867177550428167,
              "min_reward": 1.1469725701570654,
              "max_reward": 1.6920342725468929,
              "num_responses": 7,
              "rvariance": 0.033724984843659364
            },
            {
              "id": "safety_sample_336",
              "rewards": [
                -0.17265049878672736,
                0.4728173066749104,
                0.5875671387569793,
                0.5301922227159449,
                0.5158484937056863,
                0.6592857838082724,
                0.5588796807364621
              ],
              "variance": 0.4016244122872413,
              "mean_reward": 0.45027716108736116,
              "min_reward": -0.17265049878672736,
              "max_reward": 0.6592857838082724,
              "num_responses": 7,
              "rvariance": 0.06765151342144417
            },
            {
              "id": "safety_sample_215",
              "rewards": [
                0.2863488295415484,
                0.14291153943896223,
                0.5875671387569793,
                0.42978611964413455,
                -0.34477524690983075,
                0.40109866162361735,
                0.08553662339792775
              ],
              "variance": 0.5794866520144482,
              "mean_reward": 0.2269248093561913,
              "min_reward": -0.34477524690983075,
              "max_reward": 0.5875671387569793,
              "num_responses": 7,
              "rvariance": 0.07985330699162271
            },
            {
              "id": "safety_sample_364",
              "rewards": [
                -0.9256962718253048,
                -0.9723133911086452,
                -1.0117586458868564,
                -0.538415588548322,
                -1.1444381392317486,
                -1.0870632231907142,
                -1.015344578139421
              ],
              "variance": 0.3392291910926164,
              "mean_reward": -0.9564328339901448,
              "min_reward": -1.1444381392317486,
              "max_reward": -0.538415588548322,
              "num_responses": 7,
              "rvariance": 0.03355388261104244
            },
            {
              "id": "safety_sample_313",
              "rewards": [
                1.0322227380749964,
                0.3580674745928415,
                0.48716103568516905,
                0.5015047646954276,
                0.4441298486543932,
                0.7310044288595655,
                0.6879732418287897
              ],
              "variance": 0.4417868535159654,
              "mean_reward": 0.6060090760558833,
              "min_reward": 0.3580674745928415,
              "max_reward": 1.0322227380749964,
              "num_responses": 7,
              "rvariance": 0.04524656831116449
            },
            {
              "id": "safety_sample_389",
              "rewards": [
                -0.25871287284827904,
                -0.4882125370124169,
                -0.5025562660226756,
                -0.373462704930348,
                -0.42366575646625315,
                -0.5097281305278049,
                -0.5025562660226756
              ],
              "variance": 0.17786223972720694,
              "mean_reward": -0.43698493340435046,
              "min_reward": -0.5097281305278049,
              "max_reward": -0.25871287284827904,
              "num_responses": 7,
              "rvariance": 0.007501205854481754
            },
            {
              "id": "safety_sample_77",
              "rewards": [
                -1.633917891706824,
                -1.5012383983619317,
                -1.583714840170919,
                -1.6428827223382356,
                -1.6168847135071418,
                -1.5828183571077776,
                -1.5048243306144964
              ],
              "variance": 0.13411386624591803,
              "mean_reward": -1.5808973219724753,
              "min_reward": -1.6428827223382356,
              "max_reward": -1.5012383983619317,
              "num_responses": 7,
              "rvariance": 0.0028703908475227274
            },
            {
              "id": "safety_sample_269",
              "rewards": [
                0.08553662339792775,
                0.08553662339792775,
                -0.007697615168753254,
                0.3580674745928415,
                -0.014869479673882562,
                0.3580674745928415,
                0.08553662339792775
              ],
              "variance": 0.3686338355636465,
              "mean_reward": 0.13573967493383293,
              "min_reward": -0.014869479673882562,
              "max_reward": 0.3580674745928415,
              "num_responses": 7,
              "rvariance": 0.021382530542372425
            },
            {
              "id": "safety_sample_361",
              "rewards": [
                -0.4021501629508652,
                -0.5455874530534514,
                -0.8754932202893996,
                -0.6388216916201324,
                -0.44518134998164105
              ],
              "variance": 0.3614619710585172,
              "mean_reward": -0.5814467755790979,
              "min_reward": -0.8754932202893996,
              "max_reward": -0.4021501629508652,
              "num_responses": 5,
              "rvariance": 0.028351325032539433
            },
            {
              "id": "safety_sample_254",
              "rewards": [
                -0.6388216916201324,
                -0.6459935561252617,
                -0.538415588548322,
                -0.5957905045893566,
                -0.4810406725072876,
                -0.5097281305278049,
                -0.5025562660226756
              ],
              "variance": 0.14774040880566375,
              "mean_reward": -0.5589066299915487,
              "min_reward": -0.6459935561252617,
              "max_reward": -0.4810406725072876,
              "num_responses": 7,
              "rvariance": 0.003915406918166377
            },
            {
              "id": "safety_sample_355",
              "rewards": [
                -0.8719072880368349,
                -0.33760338240470145,
                -0.1367911762610808,
                -0.40932202745599455,
                -0.35194711141496005,
                -0.24436914383802044,
                -0.33043151789957215
              ],
              "variance": 0.39301817488108615,
              "mean_reward": -0.3831959496158806,
              "min_reward": -0.8719072880368349,
              "max_reward": -0.1367911762610808,
              "num_responses": 7,
              "rvariance": 0.046478399415311476
            },
            {
              "id": "safety_sample_317",
              "rewards": [
                -0.9794852556137745,
                -1.212570852030477,
                -1.1551959359894426,
                -1.0296883071496796,
                -1.1229225457163607,
                -1.0619616974227617,
                -0.9292822040778694
              ],
              "variance": 0.21874186740644375,
              "mean_reward": -1.070158114000052,
              "min_reward": -1.212570852030477,
              "max_reward": -0.9292822040778694,
              "num_responses": 7,
              "rvariance": 0.008581354304560359
            },
            {
              "id": "safety_sample_291",
              "rewards": [
                1.1182851121365482,
                1.2473786732288756,
                1.4912220664032723,
                1.7494091885879273,
                1.3621285053109446,
                1.3908159633314618,
                1.6346593565058585
              ],
              "variance": 0.48481804054674127,
              "mean_reward": 1.4276998379292698,
              "min_reward": 1.1182851121365482,
              "max_reward": 1.7494091885879273,
              "num_responses": 7,
              "rvariance": 0.04061106242627905
            },
            {
              "id": "safety_sample_193",
              "rewards": [
                0.013817978346634672,
                -0.40932202745599455,
                -0.3878064339406066,
                -0.6173060981047445,
                -0.5455874530534514,
                -0.25154100834314974,
                -0.3017440598790549
              ],
              "variance": 0.42887749740673264,
              "mean_reward": -0.3570698717757667,
              "min_reward": -0.6173060981047445,
              "max_reward": 0.013817978346634672,
              "num_responses": 7,
              "rvariance": 0.03695598283135804
            },
            {
              "id": "safety_sample_213",
              "rewards": [
                0.8027230739108586,
                0.974847822033962,
                1.1469725701570654,
                1.0035352800544792,
                1.0322227380749964,
                0.9461603640134448,
                0.9605040930237034
              ],
              "variance": 0.18933722293541366,
              "mean_reward": 0.9809951344669301,
              "min_reward": 0.8027230739108586,
              "max_reward": 1.1469725701570654,
              "num_responses": 7,
              "rvariance": 0.00916184224711961
            },
            {
              "id": "safety_sample_332",
              "rewards": [
                -1.3990393291638392,
                -1.201813055272783,
                -1.2986332260920288,
                -1.6410897562119533,
                -1.277117632576641,
                -1.255602039061253,
                -1.212570852030477
              ],
              "variance": 0.2875917666556853,
              "mean_reward": -1.3265522700584251,
              "min_reward": -1.6410897562119533,
              "max_reward": -1.201813055272783,
              "num_responses": 7,
              "rvariance": 0.020142432996005457
            },
            {
              "id": "safety_sample_204",
              "rewards": [
                0.8314105319313758,
                1.2473786732288756,
                1.276066131249393,
                1.4768783373930137,
                1.4051596923417204,
                1.4051596923417204,
                1.1900037571878412
              ],
              "variance": 0.38728068327698284,
              "mean_reward": 1.2617224022391345,
              "min_reward": 0.8314105319313758,
              "max_reward": 1.4768783373930137,
              "num_responses": 7,
              "rvariance": 0.03973770624506875
            },
            {
              "id": "safety_sample_351",
              "rewards": [
                1.2043474861980998,
                1.276066131249393,
                1.2473786732288756,
                1.3908159633314618,
                0.9174729059929275,
                1.2617224022391345,
                1.4338471503622379
              ],
              "variance": 0.31843078402774116,
              "mean_reward": 1.2473786732288759,
              "min_reward": 0.9174729059929275,
              "max_reward": 1.4338471503622379,
              "num_responses": 7,
              "rvariance": 0.023866137182689227
            },
            {
              "id": "safety_sample_399",
              "rewards": [
                -1.2376723777984298,
                -1.348836277627934,
                -1.277117632576641,
                -1.327320684112546,
                -1.255602039061253,
                -1.3757307695221688,
                -1.2520161068086884
              ],
              "variance": 0.11331545918104302,
              "mean_reward": -1.296327983929666,
              "min_reward": -1.3757307695221688,
              "max_reward": -1.2376723777984298,
              "num_responses": 7,
              "rvariance": 0.002493447642959635
            },
            {
              "id": "safety_sample_368",
              "rewards": [
                -0.2730566018585377,
                0.18594272646973808,
                -0.02921320868414118,
                0.08553662339792775,
                0.15725526844922083,
                -0.09375998923030496,
                0.2863488295415484
              ],
              "variance": 0.39158380198006026,
              "mean_reward": 0.04557909258363589,
              "min_reward": -0.2730566018585377,
              "max_reward": 0.2863488295415484,
              "num_responses": 7,
              "rvariance": 0.031182594614222642
            },
            {
              "id": "safety_sample_366",
              "rewards": [
                0.5158484937056863,
                0.4584735776646518,
                0.06402102988253983,
                0.42978611964413455,
                0.5015047646954276,
                0.32938001657232424,
                0.3867549326133587
              ],
              "variance": 0.28400583440312066,
              "mean_reward": 0.38368127639687477,
              "min_reward": 0.06402102988253983,
              "max_reward": 0.5158484937056863,
              "num_responses": 7,
              "rvariance": 0.020601548572636286
            },
            {
              "id": "safety_sample_324",
              "rewards": [
                -1.3649729727644748,
                -0.538415588548322,
                -0.581446775579098,
                -0.3878064339406066,
                -0.35911897592008934,
                -0.34477524690983075,
                -0.2874003308687963
              ],
              "variance": 0.5730319739598317,
              "mean_reward": -0.5519909035044596,
              "min_reward": -1.3649729727644748,
              "max_reward": -0.2874003308687963,
              "num_responses": 7,
              "rvariance": 0.11987062892511681
            },
            {
              "id": "safety_sample_340",
              "rewards": [
                -0.4021501629508652,
                -0.6818528786509083,
                -0.5240718595380635,
                -0.4595250789918997,
                -0.26588473735340834,
                -0.2156816858175032,
                -0.466696943497029
              ],
              "variance": 0.3413807504441551,
              "mean_reward": -0.4308376209713825,
              "min_reward": -0.6818528786509083,
              "max_reward": -0.2156816858175032,
              "num_responses": 7,
              "rvariance": 0.02116209208317271
            },
            {
              "id": "safety_sample_206",
              "rewards": [
                1.0035352800544792,
                1.2904098602596517,
                1.649003085516117,
                1.4481908793724965,
                1.649003085516117,
                1.605971898485341
              ],
              "variance": 0.5020305153590516,
              "mean_reward": 1.4410190148673674,
              "min_reward": 1.0035352800544792,
              "max_reward": 1.649003085516117,
              "num_responses": 6,
              "rvariance": 0.05464179540318287
            },
            {
              "id": "safety_sample_371",
              "rewards": [
                -0.4738688080021583,
                -0.24436914383802044,
                -0.11527558274569288,
                -0.35194711141496005,
                -0.6244779626098738,
                -0.35194711141496005
              ],
              "variance": 0.36935102201415937,
              "mean_reward": -0.3603142866709442,
              "min_reward": -0.6244779626098738,
              "max_reward": -0.11527558274569288,
              "num_responses": 6,
              "rvariance": 0.026050723135295287
            },
            {
              "id": "safety_sample_308",
              "rewards": [
                0.3580674745928415,
                0.4728173066749104,
                0.5732234097467207,
                0.7453481578698241,
                0.6879732418287897,
                0.8457542609416344,
                0.974847822033962
              ],
              "variance": 0.47047431153648267,
              "mean_reward": 0.6654330962412404,
              "min_reward": 0.3580674745928415,
              "max_reward": 0.974847822033962,
              "num_responses": 7,
              "rvariance": 0.03931782346564072
            },
            {
              "id": "safety_sample_385",
              "rewards": [
                -0.9651415266035159,
                -0.41649389196112385,
                -0.2156816858175032,
                -0.3806345694354773,
                -0.25154100834314974,
                -0.19416609230211526,
                -0.2085098213123739
              ],
              "variance": 0.4331806161098102,
              "mean_reward": -0.37602408511075136,
              "min_reward": -0.9651415266035159,
              "max_reward": -0.19416609230211526,
              "num_responses": 7,
              "rvariance": 0.06443678589144833
            },
            {
              "id": "safety_sample_171",
              "rewards": [
                -2.334967647083214,
                -2.8262403656845714,
                -2.6110844305306924,
                -2.6505296853089035,
                -2.654115617561468,
                -2.697146804592244,
                -2.7616935851384077
              ],
              "variance": 0.2868745802051724,
              "mean_reward": -2.6479683051285,
              "min_reward": -2.8262403656845714,
              "max_reward": -2.334967647083214,
              "num_responses": 7,
              "rvariance": 0.02092958199406442
            },
            {
              "id": "safety_sample_212",
              "rewards": [
                1.6203156274955999,
                1.5055657954135309,
                1.4338471503622379,
                1.8211278336392205,
                1.5916281694750825,
                1.7063780015571515,
                1.7494091885879273
              ],
              "variance": 0.301218309215431,
              "mean_reward": 1.6326102523615358,
              "min_reward": 1.4338471503622379,
              "max_reward": 1.8211278336392205,
              "num_responses": 7,
              "rvariance": 0.016014329207385054
            },
            {
              "id": "safety_sample_338",
              "rewards": [
                -0.4882125370124169,
                -0.42366575646625315,
                -0.3662908404252187,
                -0.2156816858175032,
                -0.2874003308687963,
                -0.40932202745599455
              ],
              "variance": 0.20439813839618526,
              "mean_reward": -0.3650955296743638,
              "min_reward": -0.4882125370124169,
              "max_reward": -0.2156816858175032,
              "num_responses": 6,
              "rvariance": 0.008151120248278377
            },
            {
              "id": "safety_sample_369",
              "rewards": [
                0.7883793449006,
                0.9318166350031861,
                0.8457542609416344,
                0.8744417189621517,
                0.8744417189621517,
                1.2186912152083584,
                0.8887854479724103
              ],
              "variance": 0.2237621725600346,
              "mean_reward": 0.9174729059929276,
              "min_reward": 0.7883793449006,
              "max_reward": 1.2186912152083584,
              "num_responses": 7,
              "rvariance": 0.016753322899178382
            },
            {
              "id": "safety_sample_20",
              "rewards": [
                -1.3900744985324274,
                -1.6944304984688525,
                -1.5828183571077776,
                -1.6419862392750944,
                -1.5828183571077776,
                -1.6760525956744587,
                -1.6410897562119533
              ],
              "variance": 0.17768294311457877,
              "mean_reward": -1.6013243289111916,
              "min_reward": -1.6944304984688525,
              "max_reward": -1.3900744985324274,
              "num_responses": 7,
              "rvariance": 0.008971312235118616
            },
            {
              "id": "safety_sample_377",
              "rewards": [
                -1.3685589050170395,
                -1.442070516194615,
                -1.5855078062972012,
                -1.388281532406145,
                -1.332699582491393,
                -1.3613870405119102
              ],
              "variance": 0.16674584974425666,
              "mean_reward": -1.413084230486384,
              "min_reward": -1.5855078062972012,
              "max_reward": -1.332699582491393,
              "num_responses": 6,
              "rvariance": 0.00705034396321564
            },
            {
              "id": "safety_sample_383",
              "rewards": [
                0.8170668029211172,
                0.8027230739108586,
                0.8027230739108586,
                0.7596918868800827,
                0.5588796807364621,
                1.0035352800544792,
                0.8600979899518931
              ],
              "variance": 0.2381059015702931,
              "mean_reward": 0.800673969766536,
              "min_reward": 0.5588796807364621,
              "max_reward": 1.0035352800544792,
              "num_responses": 7,
              "rvariance": 0.015015008192346349
            },
            {
              "id": "safety_sample_278",
              "rewards": [
                -1.0978210199484082,
                -1.3237347518599814,
                -1.0619616974227617,
                -1.1157506812112314,
                -1.2089849197779123,
                -1.1480240714843133,
                -1.036860171654809
              ],
              "variance": 0.20296376549515927,
              "mean_reward": -1.1418767590513454,
              "min_reward": -1.3237347518599814,
              "max_reward": -1.036860171654809,
              "num_responses": 7,
              "rvariance": 0.008236000718480805
            },
            {
              "id": "safety_sample_199",
              "rewards": [
                0.34372374558258284,
                0.2720051005312898,
                0.5015047646954276,
                0.48716103568516905
              ],
              "variance": 0.20368095194567237,
              "mean_reward": 0.4010986616236173,
              "min_reward": 0.2720051005312898,
              "max_reward": 0.5015047646954276,
              "num_responses": 4,
              "rvariance": 0.009361286567347924
            },
            {
              "id": "safety_sample_379",
              "rewards": [
                -2.281178663294744,
                -2.0624367958883,
                -2.134155440939593,
                -1.8571421744289738,
                -1.9934076000264305,
                -2.083952389403688,
                -2.1090539151716405
              ],
              "variance": 0.25406330009420586,
              "mean_reward": -2.074475282736196,
              "min_reward": -2.281178663294744,
              "max_reward": -1.8571421744289738,
              "num_responses": 7,
              "rvariance": 0.014503440071629152
            },
            {
              "id": "safety_sample_73",
              "rewards": [
                -1.8522115175816973,
                -1.875071835691797,
                -1.8602798651499677,
                -2.033749337867783,
                -1.9037592937123142,
                -1.858935140555256,
                -1.6693289727009
              ],
              "variance": 0.1766968117451233,
              "mean_reward": -1.8647622804656738,
              "min_reward": -2.033749337867783,
              "max_reward": -1.6693289727009,
              "num_responses": 7,
              "rvariance": 0.009798489511427358
            },
            {
              "id": "safety_sample_314",
              "rewards": [
                -1.0081727136342917,
                -0.05790066670465841,
                -0.05790066670465841,
                -0.24436914383802044,
                -0.5312437240431928,
                -0.280228466363667,
                -0.11527558274569288
              ],
              "variance": 0.6641146531749739,
              "mean_reward": -0.32787013771916884,
              "min_reward": -1.0081727136342917,
              "max_reward": -0.05790066670465841,
              "num_responses": 7,
              "rvariance": 0.10062543294340162
            },
            {
              "id": "safety_sample_97",
              "rewards": [
                -0.1296193117559515,
                -0.050728802199529105,
                0.08553662339792775,
                -0.0005257506636239454,
                -0.05790066670465841,
                -0.08658812472517564,
                0.04250543636715191
              ],
              "variance": 0.16351851071694826,
              "mean_reward": -0.028188656611979855,
              "min_reward": -0.1296193117559515,
              "max_reward": 0.08553662339792775,
              "num_responses": 7,
              "rvariance": 0.0048265525495252036
            },
            {
              "id": "safety_sample_35",
              "rewards": [
                -0.9149384750676108,
                -1.2269145810407358,
                -1.1121647489586668,
                -0.9579696620983866,
                -1.1982271230202184,
                -0.9938289846240331,
                -1.058375765170197
              ],
              "variance": 0.2689449189423492,
              "mean_reward": -1.066059905711407,
              "min_reward": -1.2269145810407358,
              "max_reward": -0.9149384750676108,
              "num_responses": 7,
              "rvariance": 0.012180799431207149
            },
            {
              "id": "safety_sample_107",
              "rewards": [
                0.8457542609416344,
                0.9605040930237034,
                0.9031291769826689,
                0.7883793449006,
                0.8744417189621517,
                0.9031291769826689
              ],
              "variance": 0.11474983208206901,
              "mean_reward": 0.8792229619655713,
              "min_reward": 0.7883793449006,
              "max_reward": 0.9605040930237034,
              "num_responses": 6,
              "rvariance": 0.002857535582218537
            },
            {
              "id": "safety_sample_131",
              "rewards": [
                1.2617224022391345,
                0.9461603640134448,
                1.1900037571878412,
                1.2043474861980998,
                1.2043474861980998,
                1.2043474861980998,
                1.2904098602596517
              ],
              "variance": 0.1807309855292587,
              "mean_reward": 1.185905548899196,
              "min_reward": 0.9461603640134448,
              "max_reward": 1.2904098602596517,
              "num_responses": 7,
              "rvariance": 0.010740601497769004
            },
            {
              "id": "safety_sample_187",
              "rewards": [
                0.7740356158903414,
                0.24331764251077254,
                0.7023169708390483,
                0.601910867767238,
                0.5445359517262035,
                0.6879732418287897,
                0.7310044288595655
              ],
              "variance": 0.32416827563184475,
              "mean_reward": 0.6121563884888513,
              "min_reward": 0.24331764251077254,
              "max_reward": 0.7740356158903414,
              "num_responses": 7,
              "rvariance": 0.027846625931666952
            },
            {
              "id": "safety_sample_177",
              "rewards": [
                0.04967730087228121,
                -0.0435569376943998,
                0.08553662339792775,
                0.18594272646973808,
                -0.007697615168753254,
                0.25766137152103114,
                -0.02921320868414118
              ],
              "variance": 0.24958088477849996,
              "mean_reward": 0.07119289438766913,
              "min_reward": -0.0435569376943998,
              "max_reward": 0.25766137152103114,
              "num_responses": 7,
              "rvariance": 0.011154186035505612
            },
            {
              "id": "safety_sample_72",
              "rewards": [
                -0.19416609230211526,
                -0.5097281305278049,
                -0.11527558274569288,
                -0.2013379568072446,
                -0.35911897592008934,
                -0.31608778888931355,
                -0.2874003308687963
              ],
              "variance": 0.25675274928362923,
              "mean_reward": -0.2833021225801509,
              "min_reward": -0.5097281305278049,
              "max_reward": -0.11527558274569288,
              "num_responses": 7,
              "rvariance": 0.014429271715044245
            },
            {
              "id": "safety_sample_376",
              "rewards": [
                0.09988035240818638,
                0.48716103568516905,
                0.5875671387569793,
                0.5588796807364621,
                0.7310044288595655,
                0.6305983257877552
              ],
              "variance": 0.3872806832769826,
              "mean_reward": 0.5158484937056862,
              "min_reward": 0.09988035240818638,
              "max_reward": 0.7310044288595655,
              "num_responses": 6,
              "rvariance": 0.04005121872037501
            },
            {
              "id": "safety_sample_224",
              "rewards": [
                0.3867549326133587,
                0.17159899745947946,
                0.07119289438766914,
                0.2146301844902553,
                0.4584735776646518,
                0.48716103568516905
              ],
              "variance": 0.3514213607513361,
              "mean_reward": 0.2983019370500972,
              "min_reward": 0.07119289438766914,
              "max_reward": 0.48716103568516905,
              "num_responses": 6,
              "rvariance": 0.02396329339248465
            },
            {
              "id": "safety_sample_253",
              "rewards": [
                1.1039413831262896,
                1.1756600281775826,
                1.0322227380749964,
                1.2186912152083584,
                1.2043474861980998
              ],
              "variance": 0.15204352750874128,
              "mean_reward": 1.1469725701570654,
              "min_reward": 1.0322227380749964,
              "max_reward": 1.2186912152083584,
              "num_responses": 5,
              "rvariance": 0.004855524461305735
            },
            {
              "id": "safety_sample_307",
              "rewards": [
                -0.6459935561252617,
                -0.6459935561252617,
                -0.5671030465688394,
                -0.6388216916201324,
                -0.6316498271150031
              ],
              "variance": 0.05307179733795686,
              "mean_reward": -0.6259123355108996,
              "min_reward": -0.6459935561252617,
              "max_reward": -0.5671030465688394,
              "num_responses": 5,
              "rvariance": 0.000892922718731646
            },
            {
              "id": "safety_sample_319",
              "rewards": [
                -1.4151760243003801,
                -1.1551959359894426,
                -1.1767115295048305,
                -1.244844242303559,
                -0.8575635590265763,
                -0.8468057622688824
              ],
              "variance": 0.47782547265424025,
              "mean_reward": -1.116049508898945,
              "min_reward": -1.4151760243003801,
              "max_reward": -0.8468057622688824,
              "num_responses": 6,
              "rvariance": 0.0417640434079542
            },
            {
              "id": "safety_sample_205",
              "rewards": [
                1.276066131249393,
                1.1756600281775826,
                1.2186912152083584,
                1.2617224022391345,
                1.1900037571878412,
                1.233034944218617,
                1.3190973182801689
              ],
              "variance": 0.10901234047796571,
              "mean_reward": 1.239182256651585,
              "min_reward": 1.1756600281775826,
              "max_reward": 1.3190973182801689,
              "num_responses": 7,
              "rvariance": 0.0021665951418486378
            },
            {
              "id": "safety_sample_348",
              "rewards": [
                0.8027230739108586,
                1.1756600281775826,
                1.276066131249393,
                1.2473786732288756,
                1.0609101960955136,
                1.0178790090647378,
                1.0322227380749964
              ],
              "variance": 0.32703702143389657,
              "mean_reward": 1.0875485499717084,
              "min_reward": 0.8027230739108586,
              "max_reward": 1.276066131249393,
              "num_responses": 7,
              "rvariance": 0.02265687477793649
            },
            {
              "id": "safety_sample_354",
              "rewards": [
                -1.4331056855632034,
                -1.3255277179862637,
                -1.3542151760067809,
                -1.327320684112546,
                -1.0870632231907142,
                -1.1085788167061021,
                -1.0727194941804556
              ],
              "variance": 0.3044456482427391,
              "mean_reward": -1.244075828249438,
              "min_reward": -1.4331056855632034,
              "max_reward": -1.0727194941804556,
              "num_responses": 7,
              "rvariance": 0.019114638679986768
            },
            {
              "id": "safety_sample_11",
              "rewards": [
                0.8600979899518931,
                0.6592857838082724,
                1.0322227380749964,
                1.1469725701570654,
                0.673629512818531,
                1.1182851121365482,
                1.0322227380749964
              ],
              "variance": 0.4618680741303275,
              "mean_reward": 0.9318166350031862,
              "min_reward": 0.6592857838082724,
              "max_reward": 1.1469725701570654,
              "num_responses": 7,
              "rvariance": 0.03532893706107444
            },
            {
              "id": "safety_sample_341",
              "rewards": [
                -1.5917831877391893,
                -1.3667659388907571,
                -1.0332742394022443,
                -0.9149384750676108,
                -0.9507977975932573,
                -1.2089849197779123,
                -0.9077666105624814
              ],
              "variance": 0.5447031091645709,
              "mean_reward": -1.1391873098619216,
              "min_reward": -1.5917831877391893,
              "max_reward": -0.9077666105624814,
              "num_responses": 7,
              "rvariance": 0.058865433458570496
            },
            {
              "id": "safety_sample_196",
              "rewards": [
                -3.3139271520333646,
                -3.1346305394051317,
                -3.2206929134666833,
                -3.2206929134666833,
                -3.1776617264359075,
                -3.2063491844564247,
                -3.141802403910261
              ],
              "variance": 0.11905295078514655,
              "mean_reward": -3.2022509761677798,
              "min_reward": -3.3139271520333646,
              "max_reward": -3.1346305394051317,
              "num_responses": 7,
              "rvariance": 0.00314282260401881
            },
            {
              "id": "safety_sample_236",
              "rewards": [
                1.6633468145263757,
                1.7063780015571515,
                1.7637529175981859,
                1.6633468145263757,
                1.6346593565058585,
                1.993252581762324,
                2.251439703946979
              ],
              "variance": 0.444655599318017,
              "mean_reward": 1.810882312917607,
              "min_reward": 1.6346593565058585,
              "max_reward": 2.251439703946979,
              "num_responses": 7,
              "rvariance": 0.0450114339546848
            },
            {
              "id": "safety_sample_346",
              "rewards": [
                -0.35911897592008934,
                -0.4595250789918997,
                -0.16547863428159804,
                -0.24436914383802044,
                -0.24436914383802044,
                -0.23719727933289111,
                -0.25871287284827904
              ],
              "variance": 0.19077159583643963,
              "mean_reward": -0.28125301843582834,
              "min_reward": -0.4595250789918997,
              "max_reward": -0.16547863428159804,
              "num_responses": 7,
              "rvariance": 0.008059649951121033
            },
            {
              "id": "safety_sample_267",
              "rewards": [
                0.8457542609416344,
                1.534253253434048,
                1.649003085516117,
                1.5199095244237895,
                1.7063780015571515,
                1.4051596923417204,
                1.462534608382755
              ],
              "variance": 0.4905555321508446,
              "mean_reward": 1.446141775228174,
              "min_reward": 0.8457542609416344,
              "max_reward": 1.7063780015571515,
              "num_responses": 7,
              "rvariance": 0.06921347736091646
            },
            {
              "id": "safety_sample_279",
              "rewards": [
                -0.8324620332586238,
                -0.8647354235317056,
                -1.0189305103919857,
                -1.047617968412503,
                -1.0081727136342917,
                -0.8037745752381065,
                -0.7033684721662962
              ],
              "variance": 0.2667933595908104,
              "mean_reward": -0.8970088138047875,
              "min_reward": -1.047617968412503,
              "max_reward": -0.7033684721662962,
              "num_responses": 7,
              "rvariance": 0.014471784846461336
            },
            {
              "id": "safety_sample_56",
              "rewards": [
                0.5732234097467207,
                0.34372374558258284,
                0.6449420547980138,
                0.6305983257877552,
                0.48716103568516905,
                0.6449420547980138,
                0.7166606998493069
              ],
              "variance": 0.24384339317439652,
              "mean_reward": 0.5773216180353661,
              "min_reward": 0.34372374558258284,
              "max_reward": 0.7166606998493069,
              "num_responses": 7,
              "rvariance": 0.013444646597285517
            },
            {
              "id": "safety_sample_257",
              "rewards": [
                1.0752539251057722,
                0.7740356158903414,
                1.2043474861980998,
                0.9174729059929275,
                0.9461603640134448,
                1.2904098602596517,
                1.1039413831262896
              ],
              "variance": 0.37867444587082744,
              "mean_reward": 1.0445173629409323,
              "min_reward": 0.7740356158903414,
              "max_reward": 1.2904098602596517,
              "num_responses": 7,
              "rvariance": 0.027065643961930806
            },
            {
              "id": "safety_sample_256",
              "rewards": [
                1.2043474861980998,
                1.3334410472904275,
                1.72072173056741,
                1.4912220664032723,
                1.7063780015571515,
                1.3908159633314618,
                1.8498152916597377
              ],
              "variance": 0.4905555321508448,
              "mean_reward": 1.5281059410010802,
              "min_reward": 1.2043474861980998,
              "max_reward": 1.8498152916597377,
              "num_responses": 7,
              "rvariance": 0.047900227477149664
            },
            {
              "id": "safety_sample_202",
              "rewards": [
                -0.5455874530534514,
                -0.6388216916201324,
                -0.2013379568072446,
                -0.31608778888931355,
                -0.466696943497029,
                -0.40932202745599455,
                -0.4595250789918997
              ],
              "variance": 0.3126932924236378,
              "mean_reward": -0.43391127718786654,
              "min_reward": -0.6388216916201324,
              "max_reward": -0.2013379568072446,
              "num_responses": 7,
              "rvariance": 0.01782402398671986
            },
            {
              "id": "safety_sample_356",
              "rewards": [
                -0.050728802199529105,
                -0.15113490527133944,
                -0.23002541482776181,
                0.05684916537741052,
                -0.09375998923030496,
                -0.19416609230211526
              ],
              "variance": 0.21515593515387924,
              "mean_reward": -0.11049433974227334,
              "min_reward": -0.23002541482776181,
              "max_reward": 0.05684916537741052,
              "num_responses": 6,
              "rvariance": 0.009132683720770442
            },
            {
              "id": "safety_sample_272",
              "rewards": [
                0.3867549326133587,
                0.7310044288595655,
                0.9174729059929275,
                1.0035352800544792,
                0.9605040930237034,
                0.9318166350031861,
                0.8600979899518931
              ],
              "variance": 0.38441193747493096,
              "mean_reward": 0.8273123236427307,
              "min_reward": 0.3867549326133587,
              "max_reward": 1.0035352800544792,
              "num_responses": 7,
              "rvariance": 0.0388979406862127
            },
            {
              "id": "safety_sample_268",
              "rewards": [
                1.5629407114545653,
                1.9645651237418067,
                1.9645651237418067,
                2.0506274978033585,
                1.9645651237418067,
                2.13668987186491,
                2.1940647879059445
              ],
              "variance": 0.35572447945441366,
              "mean_reward": 1.9768597486077424,
              "min_reward": 1.5629407114545653,
              "max_reward": 2.1940647879059445,
              "num_responses": 7,
              "rvariance": 0.035706831562559674
            },
            {
              "id": "safety_sample_138",
              "rewards": [
                0.15725526844922083,
                -0.1367911762610808,
                0.02816170735689329,
                0.300692558551807,
                -0.12244744725082218,
                0.25766137152103114,
                0.09988035240818638
              ],
              "variance": 0.4030587851882671,
              "mean_reward": 0.08348751925360509,
              "min_reward": -0.1367911762610808,
              "max_reward": 0.300692558551807,
              "num_responses": 7,
              "rvariance": 0.025316832185613057
            },
            {
              "id": "safety_sample_283",
              "rewards": [
                -0.6675091496406497,
                -0.7822589817227186,
                -0.581446775579098,
                -0.8181183042483651
              ],
              "variance": 0.2000950196931076,
              "mean_reward": -0.7123333027977079,
              "min_reward": -0.8181183042483651,
              "max_reward": -0.581446775579098,
              "num_responses": 4,
              "rvariance": 0.008805138704658638
            },
            {
              "id": "safety_sample_305",
              "rewards": [
                -0.9687274588560806,
                -0.8826650847945289,
                -0.8970088138047875,
                -0.8719072880368349,
                -0.6675091496406497,
                -0.954383729845822
              ],
              "variance": 0.19184737551220898,
              "mean_reward": -0.8737002541631173,
              "min_reward": -0.9687274588560806,
              "max_reward": -0.6675091496406497,
              "num_responses": 6,
              "rvariance": 0.009780272722090715
            },
            {
              "id": "safety_sample_334",
              "rewards": [
                0.2720051005312898,
                0.5588796807364621,
                0.673629512818531,
                0.5158484937056863,
                0.6305983257877552,
                0.7166606998493069,
                0.5732234097467207
              ],
              "variance": 0.27253085119491366,
              "mean_reward": 0.5629778890251074,
              "min_reward": 0.2720051005312898,
              "max_reward": 0.7166606998493069,
              "num_responses": 7,
              "rvariance": 0.018206117315999377
            },
            {
              "id": "safety_sample_363",
              "rewards": [
                -1.3846956001535804,
                -1.1229225457163607,
                -1.1802974617573951,
                -1.0619616974227617,
                -1.079891358685585,
                -1.2053989875253477,
                -1.1480240714843133
              ],
              "variance": 0.20439813839618504,
              "mean_reward": -1.1690273889636205,
              "min_reward": -1.3846956001535804,
              "max_reward": -1.0619616974227617,
              "num_responses": 7,
              "rvariance": 0.00999111073648996
            },
            {
              "id": "safety_sample_167",
              "rewards": [
                0.15725526844922083,
                0.2720051005312898,
                0.20028645547999668,
                0.25766137152103114,
                0.2146301844902553,
                0.300692558551807,
                0.2720051005312898
              ],
              "variance": 0.10040610307181033,
              "mean_reward": 0.23921943422212724,
              "min_reward": 0.15725526844922083,
              "max_reward": 0.300692558551807,
              "num_responses": 7,
              "rvariance": 0.0021581974862600736
            },
            {
              "id": "safety_sample_1",
              "rewards": [
                0.06402102988253983,
                -0.10093185373543427,
                -0.11527558274569288,
                0.0353335718620226,
                -0.11527558274569288,
                -0.23002541482776181,
                -0.2156816858175032
              ],
              "variance": 0.2682277324918361,
              "mean_reward": -0.09683364544678895,
              "min_reward": -0.23002541482776181,
              "max_reward": 0.06402102988253983,
              "num_responses": 7,
              "rvariance": 0.010843472778728871
            },
            {
              "id": "safety_sample_29",
              "rewards": [
                0.300692558551807,
                0.300692558551807,
                0.34372374558258284,
                0.3724112036031001,
                0.40109866162361735,
                0.2146301844902553,
                0.2863488295415484
              ],
              "variance": 0.1262248152902758,
              "mean_reward": 0.3170853917063883,
              "min_reward": 0.2146301844902553,
              "max_reward": 0.40109866162361735,
              "num_responses": 7,
              "rvariance": 0.0032582903683615124
            },
            {
              "id": "safety_sample_179",
              "rewards": [
                0.8314105319313758,
                0.673629512818531,
                0.7453481578698241,
                0.5875671387569793,
                0.7166606998493069,
                0.8170668029211172,
                0.8170668029211172
              ],
              "variance": 0.18359973133131036,
              "mean_reward": 0.7412499495811787,
              "min_reward": 0.5875671387569793,
              "max_reward": 0.8314105319313758,
              "num_responses": 7,
              "rvariance": 0.006919668204973936
            },
            {
              "id": "safety_sample_160",
              "rewards": [
                0.5875671387569793,
                0.25766137152103114,
                0.5301922227159449,
                0.34372374558258284,
                0.4584735776646518,
                0.5015047646954276
              ],
              "variance": 0.2581871221846551,
              "mean_reward": 0.44652047015610297,
              "min_reward": 0.25766137152103114,
              "max_reward": 0.5875671387569793,
              "num_responses": 6,
              "rvariance": 0.01271603334087249
            },
            {
              "id": "safety_sample_23",
              "rewards": [
                -1.1551959359894426,
                -1.2807035648292056,
                -1.1695396649997012,
                -1.201813055272783,
                -1.0763054264330203,
                -1.311183988976005,
                -1.1049928844535375
              ],
              "variance": 0.19937783324259462,
              "mean_reward": -1.1856763601362421,
              "min_reward": -1.311183988976005,
              "max_reward": -1.0763054264330203,
              "num_responses": 7,
              "rvariance": 0.006386285861731761
            },
            {
              "id": "safety_sample_350",
              "rewards": [
                -0.26588473735340834,
                -0.12244744725082218,
                0.02816170735689329,
                -0.26588473735340834,
                0.11422408141844499,
                0.17159899745947946
              ],
              "variance": 0.40879627679237057,
              "mean_reward": -0.05670535595380353,
              "min_reward": -0.26588473735340834,
              "max_reward": 0.17159899745947946,
              "num_responses": 6,
              "rvariance": 0.030062703092730115
            },
            {
              "id": "safety_sample_367",
              "rewards": [
                -0.6029623690944859,
                -0.8181183042483651,
                -0.5671030465688394,
                -0.5527593175585807,
                -0.5599311820637101,
                -0.5097281305278049,
                -0.6244779626098738
              ],
              "variance": 0.166387256519,
              "mean_reward": -0.6050114732388084,
              "min_reward": -0.8181183042483651,
              "max_reward": -0.5097281305278049,
              "num_responses": 7,
              "rvariance": 0.008725164156514456
            },
            {
              "id": "safety_sample_303",
              "rewards": [
                -1.0296883071496796,
                -0.9221103395727401,
                -0.674681014145779,
                -0.850391694521447
              ],
              "variance": 0.2700206986181184,
              "mean_reward": -0.8692178388474114,
              "min_reward": -1.0296883071496796,
              "max_reward": -0.674681014145779,
              "num_responses": 4,
              "rvariance": 0.016686846926325972
            },
            {
              "id": "safety_sample_18",
              "rewards": [
                0.5588796807364621,
                0.22897391350051394,
                0.2863488295415484,
                0.42978611964413455,
                0.24331764251077254,
                0.3867549326133587,
                0.3580674745928415
              ],
              "variance": 0.24384339317439654,
              "mean_reward": 0.3560183704485188,
              "min_reward": 0.22897391350051394,
              "max_reward": 0.5588796807364621,
              "num_responses": 7,
              "rvariance": 0.011605560023390745
            },
            {
              "id": "safety_sample_30",
              "rewards": [
                0.22897391350051394,
                0.2863488295415484,
                0.3580674745928415,
                0.3724112036031001,
                0.17159899745947946,
                0.34372374558258284,
                0.2720051005312898
              ],
              "variance": 0.15778101911284476,
              "mean_reward": 0.29044703783019366,
              "min_reward": 0.17159899745947946,
              "max_reward": 0.3724112036031001,
              "num_responses": 7,
              "rvariance": 0.004627108229296889
            },
            {
              "id": "safety_sample_263",
              "rewards": [
                0.8600979899518931,
                0.9174729059929275,
                0.6592857838082724,
                0.8887854479724103,
                0.8744417189621517,
                0.7453481578698241
              ],
              "variance": 0.20081220614362072,
              "mean_reward": 0.8242386674262465,
              "min_reward": 0.6592857838082724,
              "max_reward": 0.9174729059929275,
              "num_responses": 6,
              "rvariance": 0.008349718971242566
            },
            {
              "id": "safety_sample_295",
              "rewards": [
                0.673629512818531,
                0.5445359517262035,
                0.7166606998493069,
                0.8744417189621517,
                0.7453481578698241,
                0.9031291769826689,
                0.9031291769826689
              ],
              "variance": 0.2811370886010689,
              "mean_reward": 0.7658391993130509,
              "min_reward": 0.5445359517262035,
              "max_reward": 0.9031291769826689,
              "num_responses": 7,
              "rvariance": 0.0156868206394312
            },
            {
              "id": "safety_sample_47",
              "rewards": [
                0.4441298486543932,
                0.42978611964413455,
                0.6592857838082724,
                0.7883793449006,
                0.7166606998493069,
                0.4728173066749104,
                0.6879732418287897
              ],
              "variance": 0.3069558008195345,
              "mean_reward": 0.5998617636229154,
              "min_reward": 0.42978611964413455,
              "max_reward": 0.7883793449006,
              "num_responses": 7,
              "rvariance": 0.01854202353954181
            },
            {
              "id": "safety_sample_375",
              "rewards": [
                -1.9503764129956547,
                -1.8302476825347387,
                -1.962927175879631,
                -1.8239723010927507,
                -1.8562456913658325,
                -1.973684972637325,
                -1.9656166250690545
              ],
              "variance": 0.14110643413841917,
              "mean_reward": -1.909010123082141,
              "min_reward": -1.973684972637325,
              "max_reward": -1.8239723010927507,
              "num_responses": 7,
              "rvariance": 0.0040320556028262304
            },
            {
              "id": "safety_sample_28",
              "rewards": [
                0.4584735776646518,
                0.20028645547999668,
                0.31503628756206564,
                0.2146301844902553,
                0.3580674745928415,
                0.2863488295415484,
                0.34372374558258284
              ],
              "variance": 0.18933722293541377,
              "mean_reward": 0.3109380792734203,
              "min_reward": 0.20028645547999668,
              "max_reward": 0.4584735776646518,
              "num_responses": 7,
              "rvariance": 0.006743317437614161
            },
            {
              "id": "safety_sample_347",
              "rewards": [
                0.6305983257877552,
                0.7023169708390483,
                0.7310044288595655,
                0.7740356158903414,
                0.8027230739108586,
                0.7023169708390483,
                0.7740356158903414
              ],
              "variance": 0.11188108628001714,
              "mean_reward": 0.7310044288595654,
              "min_reward": 0.6305983257877552,
              "max_reward": 0.8027230739108586,
              "num_responses": 7,
              "rvariance": 0.00293917945599621
            },
            {
              "id": "safety_sample_10",
              "rewards": [
                0.08553662339792775,
                -0.07941626022004634,
                -0.0005257506636239454,
                -0.0435569376943998,
                0.04967730087228121,
                0.08553662339792775,
                0.09988035240818638
              ],
              "variance": 0.14917478170668963,
              "mean_reward": 0.02816170735689329,
              "min_reward": -0.07941626022004634,
              "max_reward": 0.09988035240818638,
              "num_responses": 7,
              "rvariance": 0.004247114313914522
            },
            {
              "id": "safety_sample_365",
              "rewards": [
                -0.6029623690944859,
                -0.33043151789957215,
                -0.2013379568072446,
                -0.2874003308687963,
                -0.3806345694354773,
                -0.25154100834314974,
                -0.23002541482776181
              ],
              "variance": 0.2510152576795258,
              "mean_reward": -0.3263333096109268,
              "min_reward": -0.6029623690944859,
              "max_reward": -0.2013379568072446,
              "num_responses": 7,
              "rvariance": 0.015928253237602313
            },
            {
              "id": "safety_sample_387",
              "rewards": [
                -1.0404461039073736,
                -0.9723133911086452,
                -1.151610003736878,
                -1.0547898329176324,
                -1.1874693262625244,
                -1.1049928844535375,
                -0.9866571201189038
              ],
              "variance": 0.18503410423233613,
              "mean_reward": -1.0711826660722135,
              "min_reward": -1.1874693262625244,
              "max_reward": -0.9723133911086452,
              "num_responses": 7,
              "rvariance": 0.005609633933158479
            },
            {
              "id": "safety_sample_170",
              "rewards": [
                -0.08658812472517564,
                -0.11527558274569288,
                -0.014869479673882562,
                -0.06507253120978772,
                -0.1296193117559515,
                0.15725526844922083,
                0.06402102988253983
              ],
              "variance": 0.2223277996590086,
              "mean_reward": -0.027164104539818514,
              "min_reward": -0.1296193117559515,
              "max_reward": 0.15725526844922083,
              "num_responses": 7,
              "rvariance": 0.009386479534113607
            },
            {
              "id": "safety_sample_82",
              "rewards": [
                0.6449420547980138,
                0.5158484937056863,
                0.7740356158903414,
                0.6305983257877552,
                0.7596918868800827,
                0.6305983257877552
              ],
              "variance": 0.1936403416384913,
              "mean_reward": 0.6592857838082725,
              "min_reward": 0.5158484937056863,
              "max_reward": 0.7740356158903414,
              "num_responses": 6,
              "rvariance": 0.007612474791030181
            },
            {
              "id": "safety_sample_286",
              "rewards": [
                0.04250543636715191,
                -0.15113490527133944,
                -0.050728802199529105,
                -0.2013379568072446,
                -0.1439630407662101,
                -0.036385073189270485
              ],
              "variance": 0.1792966126282327,
              "mean_reward": -0.09017405697774032,
              "min_reward": -0.2013379568072446,
              "max_reward": 0.04250543636715191,
              "num_responses": 6,
              "rvariance": 0.00683665388045785
            },
            {
              "id": "safety_sample_290",
              "rewards": [
                -1.6303319594542593,
                -1.6796385279270234,
                -1.7042918121634052,
                -1.6522957945012178,
                -1.7051882952265465,
                -1.699361155316129,
                -1.6276425102648358
              ],
              "variance": 0.07539422561017184,
              "mean_reward": -1.6712500078362027,
              "min_reward": -1.7051882952265465,
              "max_reward": -1.6276425102648358,
              "num_responses": 7,
              "rvariance": 0.0010056192567301319
            },
            {
              "id": "safety_sample_296",
              "rewards": [
                0.7453481578698241,
                0.673629512818531,
                0.8744417189621517,
                0.8027230739108586,
                0.974847822033962,
                0.6592857838082724,
                0.8314105319313758
              ],
              "variance": 0.24671213897644828,
              "mean_reward": 0.7945266573335678,
              "min_reward": 0.6592857838082724,
              "max_reward": 0.974847822033962,
              "num_responses": 7,
              "rvariance": 0.010807782742477493
            },
            {
              "id": "safety_sample_183",
              "rewards": [
                -0.8862510170470935,
                -0.861149491279141,
                -0.7894308462278479,
                -0.8754932202893996,
                -0.8324620332586238,
                -0.7105403366714255,
                -0.7966027107329772
              ],
              "variance": 0.1219216965871982,
              "mean_reward": -0.8217042365009298,
              "min_reward": -0.8862510170470935,
              "max_reward": -0.7105403366714255,
              "num_responses": 7,
              "rvariance": 0.0032514672731958076
            },
            {
              "id": "safety_sample_304",
              "rewards": [
                -0.538415588548322,
                -0.1367911762610808,
                0.08553662339792775,
                0.006646113841505363,
                -0.1367911762610808,
                -0.022041344179011872,
                0.02816170735689329
              ],
              "variance": 0.3485526149492844,
              "mean_reward": -0.10195640580759559,
              "min_reward": -0.538415588548322,
              "max_reward": 0.08553662339792775,
              "num_responses": 7,
              "rvariance": 0.037598403483882936
            },
            {
              "id": "safety_sample_353",
              "rewards": [
                -0.8109464397432358,
                -0.8324620332586238,
                -0.7033684721662962,
                -0.7894308462278479,
                -0.674681014145779,
                -0.7320559301868134,
                -0.6603372851355204
              ],
              "variance": 0.1506091546077154,
              "mean_reward": -0.743326002980588,
              "min_reward": -0.8324620332586238,
              "max_reward": -0.6603372851355204,
              "num_responses": 7,
              "rvariance": 0.003995184646257704
            },
            {
              "id": "safety_sample_141",
              "rewards": [
                0.22897391350051394,
                0.18594272646973808,
                0.24331764251077254,
                0.2146301844902553,
                0.2720051005312898,
                0.2720051005312898
              ],
              "variance": 0.0717186450512931,
              "mean_reward": 0.23614577800564326,
              "min_reward": 0.18594272646973808,
              "max_reward": 0.2720051005312898,
              "num_responses": 6,
              "rvariance": 0.0009429867421321172
            },
            {
              "id": "safety_sample_156",
              "rewards": [
                -2.6110844305306924,
                -2.747349856128149,
                -2.7616935851384077,
                -2.6792171433294207,
                -2.596740701520434,
                -2.7330061271178905,
                -2.5572954467422226
              ],
              "variance": 0.1721247481231032,
              "mean_reward": -2.6694838986438882,
              "min_reward": -2.7616935851384077,
              "max_reward": -2.5572954467422226,
              "num_responses": 7,
              "rvariance": 0.005711980360644048
            },
            {
              "id": "safety_sample_372",
              "rewards": [
                -0.9256962718253048,
                -1.1265084779689254,
                -0.8754932202893996,
                -1.0081727136342917,
                -0.9364540685829987,
                -0.954383729845822,
                -0.9579696620983866
              ],
              "variance": 0.14989196815720263,
              "mean_reward": -0.9692397348921613,
              "min_reward": -1.1265084779689254,
              "max_reward": -0.8754932202893996,
              "num_responses": 7,
              "rvariance": 0.005479470271535789
            },
            {
              "id": "safety_sample_85",
              "rewards": [
                0.4441298486543932,
                0.5301922227159449,
                0.48716103568516905,
                0.5301922227159449,
                0.6305983257877552,
                0.7166606998493069,
                0.6305983257877552
              ],
              "variance": 0.1950747145395172,
              "mean_reward": 0.5670760973137529,
              "min_reward": 0.4441298486543932,
              "max_reward": 0.7166606998493069,
              "num_responses": 7,
              "rvariance": 0.007809819697361354
            },
            {
              "id": "safety_sample_98",
              "rewards": [
                0.07119289438766914,
                0.18594272646973808,
                0.08553662339792775,
                0.25766137152103114,
                0.06402102988253983,
                -0.007697615168753254,
                0.08553662339792775
              ],
              "variance": 0.17929661262823274,
              "mean_reward": 0.10602766484115436,
              "min_reward": -0.007697615168753254,
              "max_reward": 0.25766137152103114,
              "num_responses": 7,
              "rvariance": 0.006590060223122929
            },
            {
              "id": "safety_sample_382",
              "rewards": [
                -0.7966027107329772,
                -0.6029623690944859,
                -0.538415588548322,
                -0.7105403366714255,
                -0.6818528786509083,
                -0.6101342335996152,
                -0.5168999950329342
              ],
              "variance": 0.2151559351538792,
              "mean_reward": -0.6367725874758097,
              "min_reward": -0.7966027107329772,
              "max_reward": -0.5168999950329342,
              "num_responses": 7,
              "rvariance": 0.00841655031363486
            },
            {
              "id": "safety_sample_148",
              "rewards": [
                0.5445359517262035,
                0.6305983257877552,
                0.601910867767238,
                0.601910867767238,
                0.5158484937056863,
                0.7310044288595655,
                0.5732234097467207
              ],
              "variance": 0.13769979849848268,
              "mean_reward": 0.5998617636229154,
              "min_reward": 0.5158484937056863,
              "max_reward": 0.7310044288595655,
              "num_responses": 7,
              "rvariance": 0.004140044205160374
            },
            {
              "id": "safety_sample_37",
              "rewards": [
                1.1182851121365482,
                1.0609101960955136,
                1.046566467085255,
                1.089597654116031,
                0.9891915510442206,
                1.3047535892699103
              ],
              "variance": 0.1936403416384913,
              "mean_reward": 1.1015507616245799,
              "min_reward": 0.9891915510442206,
              "max_reward": 1.3047535892699103,
              "num_responses": 6,
              "rvariance": 0.00983563747399621
            },
            {
              "id": "safety_sample_271",
              "rewards": [
                1.3047535892699103,
                1.4481908793724965,
                1.4768783373930137,
                1.6203156274955999,
                1.462534608382755
              ],
              "variance": 0.20081220614362083,
              "mean_reward": 1.462534608382755,
              "min_reward": 1.3047535892699103,
              "max_reward": 1.6203156274955999,
              "num_responses": 5,
              "rvariance": 0.010040237021683055
            },
            {
              "id": "safety_sample_111",
              "rewards": [
                0.2146301844902553,
                0.300692558551807,
                0.2146301844902553,
                0.2863488295415484,
                0.25766137152103114,
                0.17159899745947946,
                0.24331764251077254
              ],
              "variance": 0.09466861146770683,
              "mean_reward": 0.24126853836644988,
              "min_reward": 0.17159899745947946,
              "max_reward": 0.300692558551807,
              "num_responses": 7,
              "rvariance": 0.0017299170512434824
            },
            {
              "id": "safety_sample_209",
              "rewards": [
                2.021940039782841,
                2.480939368111117,
                2.3088146199880133,
                2.480939368111117,
                2.251439703946979,
                2.3661895360290477,
                2.65306411623422
              ],
              "variance": 0.3901494290790346,
              "mean_reward": 2.3661895360290477,
              "min_reward": 2.021940039782841,
              "max_reward": 2.65306411623422,
              "num_responses": 7,
              "rvariance": 0.03479988475899514
            },
            {
              "id": "safety_sample_7",
              "rewards": [
                -0.2945721953739256,
                -0.4882125370124169,
                -0.3949782984457359,
                -0.33043151789957215,
                -0.3878064339406066,
                -0.33760338240470145,
                -0.25871287284827904
              ],
              "variance": 0.15204352750874134,
              "mean_reward": -0.35604531970360537,
              "min_reward": -0.4882125370124169,
              "max_reward": -0.25871287284827904,
              "num_responses": 7,
              "rvariance": 0.004891634380336548
            },
            {
              "id": "safety_sample_49",
              "rewards": [
                -1.5478555176452722,
                -1.680983252521735,
                -1.5604062805292485,
                -1.5675781450343778,
                -1.663950074322053,
                -1.5568203482766838
              ],
              "variance": 0.12012873046091599,
              "mean_reward": -1.596265603054895,
              "min_reward": -1.680983252521735,
              "max_reward": -1.5478555176452722,
              "num_responses": 6,
              "rvariance": 0.0029610989225772257
            },
            {
              "id": "safety_sample_358",
              "rewards": [
                0.11422408141844499,
                0.09988035240818638,
                -0.17982236329185666,
                0.300692558551807,
                0.09988035240818638,
                0.08553662339792775
              ],
              "variance": 0.25460118993209047,
              "mean_reward": 0.08673193414878265,
              "min_reward": -0.17982236329185666,
              "max_reward": 0.300692558551807,
              "num_responses": 6,
              "rvariance": 0.0196555585022902
            },
            {
              "id": "safety_sample_335",
              "rewards": [
                -0.6316498271150031,
                -0.6029623690944859,
                -0.4882125370124169,
                -0.3806345694354773,
                -0.40932202745599455,
                -0.5097281305278049,
                -0.25154100834314974
              ],
              "variance": 0.2854402073041465,
              "mean_reward": -0.46772149556919035,
              "min_reward": -0.6316498271150031,
              "max_reward": -0.25154100834314974,
              "num_responses": 7,
              "rvariance": 0.015010809364552067
            },
            {
              "id": "safety_sample_132",
              "rewards": [
                1.1756600281775826,
                1.1469725701570654,
                1.2186912152083584,
                1.2473786732288756,
                1.1900037571878412,
                1.1326288411468068,
                1.2904098602596517
              ],
              "variance": 0.12335606948822408,
              "mean_reward": 1.2002492779094547,
              "min_reward": 1.1326288411468068,
              "max_reward": 1.2904098602596517,
              "num_responses": 7,
              "rvariance": 0.0026872497883393904
            },
            {
              "id": "safety_sample_38",
              "rewards": [
                -0.18699422779698596,
                -0.43083762097138245,
                -0.32325965339444285,
                -0.31608778888931355,
                -0.373462704930348,
                -0.2156816858175032,
                -0.35194711141496005
              ],
              "variance": 0.19220596873746548,
              "mean_reward": -0.3140386847449909,
              "min_reward": -0.43083762097138245,
              "max_reward": -0.18699422779698596,
              "num_responses": 7,
              "rvariance": 0.006359124694437513
            },
            {
              "id": "safety_sample_53",
              "rewards": [
                1.2473786732288756,
                1.4768783373930137,
                1.3334410472904275,
                1.4051596923417204,
                1.4912220664032723,
                1.4912220664032723,
                1.4338471503622379
              ],
              "variance": 0.19220596873746554,
              "mean_reward": 1.4113070047746885,
              "min_reward": 1.2473786732288756,
              "max_reward": 1.4912220664032723,
              "num_responses": 7,
              "rvariance": 0.0072219838061621236
            },
            {
              "id": "safety_sample_219",
              "rewards": [
                -1.3524222098804985,
                -1.026102374897115,
                -1.321941785733699,
                -1.2735317003240763,
                -1.2089849197779123
              ],
              "variance": 0.24097464737234486,
              "mean_reward": -1.2365965981226603,
              "min_reward": -1.3524222098804985,
              "max_reward": -1.026102374897115,
              "num_responses": 5,
              "rvariance": 0.01342675959088189
            },
            {
              "id": "safety_sample_270",
              "rewards": [
                1.8785027496802549,
                2.1940647879059445,
                2.2227522459264617,
                2.021940039782841,
                2.13668987186491,
                1.9358776657212893,
                1.835471562649479
              ],
              "variance": 0.34424949624620704,
              "mean_reward": 2.032185560504454,
              "min_reward": 1.835471562649479,
              "max_reward": 2.2227522459264617,
              "num_responses": 7,
              "rvariance": 0.02073381164815612
            },
            {
              "id": "safety_sample_112",
              "rewards": [
                1.3190973182801689,
                1.3047535892699103,
                1.4768783373930137,
                1.3334410472904275,
                1.161316299167324,
                1.2186912152083584
              ],
              "variance": 0.21515593515387943,
              "mean_reward": 1.3023629677682005,
              "min_reward": 1.161316299167324,
              "max_reward": 1.4768783373930137,
              "num_responses": 6,
              "rvariance": 0.009767056620022965
            },
            {
              "id": "safety_sample_362",
              "rewards": [
                -0.6244779626098738,
                -0.7392277946919428,
                -0.6029623690944859,
                -0.6316498271150031,
                -0.6531654206303911,
                -0.6029623690944859,
                -0.5671030465688394
              ],
              "variance": 0.09897173017078442,
              "mean_reward": -0.631649827115003,
              "min_reward": -0.7392277946919428,
              "max_reward": -0.5671030465688394,
              "num_responses": 7,
              "rvariance": 0.002557086126716703
            },
            {
              "id": "safety_sample_258",
              "rewards": [
                1.2904098602596517,
                1.0322227380749964,
                1.1469725701570654,
                1.3047535892699103,
                1.0752539251057722,
                1.046566467085255,
                1.1900037571878412
              ],
              "variance": 0.2553183763826037,
              "mean_reward": 1.1551689867343562,
              "min_reward": 1.0322227380749964,
              "max_reward": 1.3047535892699103,
              "num_responses": 7,
              "rvariance": 0.010748999153357575
            },
            {
              "id": "safety_sample_78",
              "rewards": [
                1.0752539251057722,
                1.046566467085255,
                0.9605040930237034,
                0.9605040930237034,
                0.8887854479724103,
                0.974847822033962,
                0.9031291769826689
              ],
              "variance": 0.16064976491489635,
              "mean_reward": 0.9727987178896395,
              "min_reward": 0.8887854479724103,
              "max_reward": 1.0752539251057722,
              "num_responses": 7,
              "rvariance": 0.004022477026920522
            },
            {
              "id": "safety_sample_12",
              "rewards": [
                -0.6818528786509083,
                -0.8252901687534945,
                -0.8181183042483651,
                -0.6961966076611669,
                -0.7248840656816841,
                -0.7966027107329772,
                -0.76791525271246
              ],
              "variance": 0.13052793399335338,
              "mean_reward": -0.758694284063008,
              "min_reward": -0.8252901687534945,
              "max_reward": -0.6818528786509083,
              "num_responses": 7,
              "rvariance": 0.002920284730921948
            },
            {
              "id": "safety_sample_173",
              "rewards": [
                -1.2591879713138177,
                -1.140852206979184,
                -1.3129769551022874,
                -1.2161567842830416,
                -1.4223478888055094,
                -1.377523735648451
              ],
              "variance": 0.22143131659586746,
              "mean_reward": -1.2881742570220485,
              "min_reward": -1.4223478888055094,
              "max_reward": -1.140852206979184,
              "num_responses": 6,
              "rvariance": 0.009055262366089714
            },
            {
              "id": "safety_sample_67",
              "rewards": [
                -1.1551959359894426,
                -1.1480240714843133,
                -0.9292822040778694,
                -1.026102374897115,
                -0.8539776267740117,
                -0.9077666105624814,
                -0.8539776267740117
              ],
              "variance": 0.2969151905123534,
              "mean_reward": -0.9820466357941778,
              "min_reward": -1.1551959359894426,
              "max_reward": -0.8539776267740117,
              "num_responses": 7,
              "rvariance": 0.014367863858552892
            },
            {
              "id": "safety_sample_154",
              "rewards": [
                1.9645651237418067,
                1.649003085516117,
                2.021940039782841,
                2.021940039782841,
                2.021940039782841,
                2.021940039782841,
                1.9645651237418067
              ],
              "variance": 0.18359973133131002,
              "mean_reward": 1.9522704988758706,
              "min_reward": 1.649003085516117,
              "max_reward": 2.021940039782841,
              "num_responses": 7,
              "rvariance": 0.015955545618265114
            },
            {
              "id": "safety_sample_17",
              "rewards": [
                -0.6244779626098738,
                -0.6316498271150031,
                -0.7033684721662962,
                -0.5886186400842273,
                -0.7392277946919428
              ],
              "variance": 0.12192169658719831,
              "mean_reward": -0.6574685393334686,
              "min_reward": -0.7392277946919428,
              "max_reward": -0.5886186400842273,
              "num_responses": 5,
              "rvariance": 0.0030573344701272584
            },
            {
              "id": "safety_sample_249",
              "rewards": [
                1.3190973182801689,
                1.2186912152083584,
                1.276066131249393,
                1.1900037571878412,
                1.2904098602596517,
                1.276066131249393
              ],
              "variance": 0.10040610307181042,
              "mean_reward": 1.2617224022391342,
              "min_reward": 1.1900037571878412,
              "max_reward": 1.3190973182801689,
              "num_responses": 6,
              "rvariance": 0.0019202639112508605
            },
            {
              "id": "safety_sample_266",
              "rewards": [
                0.6449420547980138,
                0.5158484937056863,
                0.41544239063387595,
                0.673629512818531,
                0.7023169708390483,
                0.48716103568516905,
                0.8457542609416344
              ],
              "variance": 0.301218309215431,
              "mean_reward": 0.6121563884888513,
              "min_reward": 0.41544239063387595,
              "max_reward": 0.8457542609416344,
              "num_responses": 7,
              "rvariance": 0.01873516961807869
            },
            {
              "id": "safety_sample_133",
              "rewards": [
                0.32938001657232424,
                0.3724112036031001,
                0.2863488295415484,
                0.40109866162361735,
                0.4728173066749104,
                0.31503628756206564
              ],
              "variance": 0.1362654255974569,
              "mean_reward": 0.3628487175962611,
              "min_reward": 0.2863488295415484,
              "max_reward": 0.4728173066749104,
              "num_responses": 6,
              "rvariance": 0.0038176675378439645
            },
            {
              "id": "safety_sample_125",
              "rewards": [
                0.04967730087228121,
                0.11422408141844499,
                -0.036385073189270485,
                -0.007697615168753254,
                -0.07941626022004634,
                0.04250543636715191
              ],
              "variance": 0.1398513578500215,
              "mean_reward": 0.013817978346634674,
              "min_reward": -0.07941626022004634,
              "max_reward": 0.11422408141844499,
              "num_responses": 6,
              "rvariance": 0.003977689530448203
            },
            {
              "id": "safety_sample_182",
              "rewards": [
                0.31503628756206564,
                0.3724112036031001,
                0.40109866162361735,
                0.42978611964413455,
                0.4584735776646518,
                0.5301922227159449,
                0.48716103568516905
              ],
              "variance": 0.15491227331079305,
              "mean_reward": 0.42773701549981197,
              "min_reward": 0.31503628756206564,
              "max_reward": 0.5301922227159449,
              "num_responses": 7,
              "rvariance": 0.004492745739879921
            },
            {
              "id": "safety_sample_117",
              "rewards": [
                0.18594272646973808,
                -0.1439630407662101,
                0.14291153943896223,
                0.08553662339792775,
                0.17159899745947946,
                0.25766137152103114
              ],
              "variance": 0.2510152576795258,
              "mean_reward": 0.11661470292015474,
              "min_reward": -0.1439630407662101,
              "max_reward": 0.25766137152103114,
              "num_responses": 6,
              "rvariance": 0.01621365689350798
            },
            {
              "id": "safety_sample_242",
              "rewards": [
                0.5732234097467207,
                0.7166606998493069,
                0.7883793449006,
                0.7596918868800827,
                0.5158484937056863,
                0.6449420547980138
              ],
              "variance": 0.22949966416413792,
              "mean_reward": 0.6664576483134018,
              "min_reward": 0.5158484937056863,
              "max_reward": 0.7883793449006,
              "num_responses": 6,
              "rvariance": 0.009652755196734216
            },
            {
              "id": "safety_sample_70",
              "rewards": [
                -1.2305005132933005,
                -1.1372662747266193,
                -1.1049928844535375,
                -1.1265084779689254,
                -1.1767115295048305,
                -1.151610003736878,
                -0.9794852556137745
              ],
              "variance": 0.1434372901025862,
              "mean_reward": -1.1295821341854093,
              "min_reward": -1.2305005132933005,
              "max_reward": -0.9794852556137745,
              "num_responses": 7,
              "rvariance": 0.0051561605313762094
            },
            {
              "id": "safety_sample_31",
              "rewards": [
                0.20028645547999668,
                0.02816170735689329,
                -0.0005257506636239454,
                0.17159899745947946,
                0.18594272646973808,
                0.24331764251077254,
                0.31503628756206564
              ],
              "variance": 0.2553183763826034,
              "mean_reward": 0.1634025808821888,
              "min_reward": -0.0005257506636239454,
              "max_reward": 0.31503628756206564,
              "num_responses": 7,
              "rvariance": 0.010925349920717337
            },
            {
              "id": "safety_sample_59",
              "rewards": [
                0.9174729059929275,
                0.7883793449006,
                1.0609101960955136,
                0.8887854479724103,
                1.0035352800544792,
                1.0035352800544792
              ],
              "variance": 0.1936403416384913,
              "mean_reward": 0.943769742511735,
              "min_reward": 0.7883793449006,
              "max_reward": 1.0609101960955136,
              "num_responses": 6,
              "rvariance": 0.008121116124665075
            },
            {
              "id": "safety_sample_149",
              "rewards": [
                0.32938001657232424,
                0.25766137152103114,
                0.25766137152103114,
                0.3724112036031001,
                0.31503628756206564,
                0.22897391350051394,
                0.3867549326133587
              ],
              "variance": 0.13196230689437927,
              "mean_reward": 0.306839870984775,
              "min_reward": 0.22897391350051394,
              "max_reward": 0.3867549326133587,
              "num_responses": 7,
              "rvariance": 0.0031659161568873455
            },
            {
              "id": "safety_sample_309",
              "rewards": [
                -0.43800948547651175,
                -0.41649389196112385,
                -0.4523532144867704,
                -0.35911897592008934,
                -0.35194711141496005,
                -0.4523532144867704,
                -0.35194711141496005
              ],
              "variance": 0.10040610307181036,
              "mean_reward": -0.40317471502302654,
              "min_reward": -0.4523532144867704,
              "max_reward": -0.35194711141496005,
              "num_responses": 7,
              "rvariance": 0.0019167648880889577
            }
          ]
        }
      },
      "overall_stats": {
        "mean_variance_across_files": 0.3969131447423342,
        "mean_rvariance_across_files": 0.048650854677386834,
        "total_processed_files": 4
      }
    }
  },
  "summary": {
    "model_comparison": {
      "RM-Mistral-7B": {
        "mean_variance": 0.3969131447423342,
        "mean_rvariance": 0.048650854677386834
      }
    }
  }
}