{
  "models": {
    "GRM-llama3-8B-distill": {
      "model_name": "GRM-llama3-8B-distill",
      "model_path": "Ray2333/GRM-llama3-8B-distill",
      "files": {
        "semantic_benchmark_chat_filtered.json": {
          "file_name": "semantic_benchmark_chat_filtered.json",
          "processed_samples": 200,
          "global_mean": 3.4408817263086227,
          "global_std": 1.8412366509657416,
          "mean_variance": 0.4671094731794215,
          "mean_rvariance": 0.05815621345265052,
          "sample_results": [
            {
              "id": "chat_sample_306",
              "rewards": [
                -0.3582547229671108,
                0.04059406141637142,
                0.5412765779828704,
                0.3715536910111758,
                0.25274767013098964,
                -0.5025191768930511,
                0.4733874231941926
              ],
              "variance": 0.9165035896471507,
              "mean_reward": 0.11696936055363398,
              "min_reward": -0.5025191768930511,
              "max_reward": 0.5412765779828704,
              "num_responses": 7,
              "rvariance": 0.14367950638706578
            },
            {
              "id": "chat_sample_202",
              "rewards": [
                0.2866922475253285,
                -0.5279776099388054,
                -0.8249926621392708,
                -0.34128243426994137,
                0.6091657327715482,
                -0.9480417551937494,
                -0.24793484643550934
              ],
              "variance": 1.2898939409848786,
              "mean_reward": -0.2849101896686285,
              "min_reward": -0.9480417551937494,
              "max_reward": 0.6091657327715482,
              "num_responses": 7,
              "rvariance": 0.2744514897606457
            },
            {
              "id": "chat_sample_298",
              "rewards": [
                -1.0668477760739357,
                -1.1262507865140288,
                -1.4084150861044709,
                -2.611326047516356,
                -1.151709219559783,
                -1.0116878378081349,
                -1.4699396326317102
              ],
              "variance": 0.8817103978179532,
              "mean_reward": -1.4065966266012029,
              "min_reward": -2.611326047516356,
              "max_reward": -1.0116878378081349,
              "num_responses": 7,
              "rvariance": 0.26719031914994223
            },
            {
              "id": "chat_sample_268",
              "rewards": [
                -0.12064268120673842,
                -0.9353125386708723,
                -0.837721878662148,
                -0.1800456916468315,
                -0.08669810381239951,
                -0.3582547229671108,
                -0.34128243426994137
              ],
              "variance": 0.7696932924166349,
              "mean_reward": -0.40856543589086314,
              "min_reward": -0.9353125386708723,
              "max_reward": -0.08669810381239951,
              "num_responses": 7,
              "rvariance": 0.1010593283478306
            },
            {
              "id": "chat_sample_303",
              "rewards": [
                -1.5208564987232185,
                -2.295217170531575,
                -1.421144302627348,
                -2.1371627320391844,
                -1.421144302627348,
                -3.489641987594876,
                -1.421144302627348
              ],
              "variance": 1.3518427947295475,
              "mean_reward": -1.9580444709672713,
              "min_reward": -3.489641987594876,
              "max_reward": -1.421144302627348,
              "num_responses": 7,
              "rvariance": 0.5067826327265618
            },
            {
              "id": "chat_sample_65",
              "rewards": [
                1.5426416111158683,
                0.7109994649545649,
                1.4747524563271905,
                1.5935584772073768,
                1.2880572806583264,
                1.2201681258696486,
                1.4408078789328516
              ],
              "variance": 0.5465076960488564,
              "mean_reward": 1.3244264707236895,
              "min_reward": 0.7109994649545649,
              "max_reward": 1.5935584772073768,
              "num_responses": 7,
              "rvariance": 0.0778110900570448
            },
            {
              "id": "chat_sample_212",
              "rewards": [
                0.7958609084404122,
                1.2201681258696486,
                1.0504452388979542,
                1.271084991961157,
                1.0504452388979542,
                0.3715536910111758,
                1.5256693224186988
              ],
              "variance": 0.7467807026754562,
              "mean_reward": 1.0407467882138572,
              "min_reward": 0.3715536910111758,
              "max_reward": 1.5256693224186988,
              "num_responses": 7,
              "rvariance": 0.11833916914840671
            },
            {
              "id": "chat_sample_262",
              "rewards": [
                1.3559464354470043,
                1.084389816292293,
                0.7449440423489039,
                1.423835590235682,
                1.5086970337215293,
                1.0504452388979542,
                1.3389741467498348
              ],
              "variance": 0.5295354073516869,
              "mean_reward": 1.2153189005276002,
              "min_reward": 0.7449440423489039,
              "max_reward": 1.5086970337215293,
              "num_responses": 7,
              "rvariance": 0.061456417003350416
            },
            {
              "id": "chat_sample_178",
              "rewards": [
                -1.0541185595510585,
                -0.6298113421218221,
                -0.8080203734421014,
                -0.1715595472982468,
                -0.9862294047623806,
                -0.5534360429845595,
                -0.6892143525619152
              ],
              "variance": 0.6126996219678174,
              "mean_reward": -0.6989128032460121,
              "min_reward": -1.0541185595510585,
              "max_reward": -0.1715595472982468,
              "num_responses": 7,
              "rvariance": 0.07496577670047108
            },
            {
              "id": "chat_sample_290",
              "rewards": [
                -0.4685745994987123,
                -0.6128390534246526,
                0.13394164925080343,
                0.25274767013098964,
                -0.044267382069475864,
                -0.07821195946381478,
                -0.044267382069475864
              ],
              "variance": 0.7077444386719663,
              "mean_reward": -0.12306729387776262,
              "min_reward": -0.6128390534246526,
              "max_reward": 0.25274767013098964,
              "num_responses": 7,
              "rvariance": 0.08299614456220597
            },
            {
              "id": "chat_sample_292",
              "rewards": [
                -0.46008845515012753,
                -0.7655896516991778,
                -0.4006854447100344,
                -1.5081272822003415,
                -0.5619221873331443,
                -0.22247641338975516,
                -0.6552697751675763
              ],
              "variance": 0.7332028717177207,
              "mean_reward": -0.6534513156643081,
              "min_reward": -1.5081272822003415,
              "max_reward": -0.22247641338975516,
              "num_responses": 7,
              "rvariance": 0.14834943572100848
            },
            {
              "id": "chat_sample_116",
              "rewards": [
                0.7958609084404122,
                1.0504452388979542,
                1.0674175275951234,
                0.5243042892857009,
                0.33760911361683693,
                0.3715536910111758,
                1.084389816292293
              ],
              "variance": 0.7162305830205511,
              "mean_reward": 0.747368655019928,
              "min_reward": 0.33760911361683693,
              "max_reward": 1.084389816292293,
              "num_responses": 7,
              "rvariance": 0.09558841978902599
            },
            {
              "id": "chat_sample_106",
              "rewards": [
                1.4747524563271905,
                1.1522789710809709,
                0.32063682491966744,
                1.3729187241441738,
                1.2541127032639876,
                1.457780167630021
              ],
              "variance": 0.7298084139782866,
              "mean_reward": 1.1720799745610018,
              "min_reward": 0.32063682491966744,
              "max_reward": 1.4747524563271905,
              "num_responses": 6,
              "rvariance": 0.15760805337679007
            },
            {
              "id": "chat_sample_251",
              "rewards": [
                -0.21399026904117044,
                -0.663755919516161,
                0.2442615257824049,
                0.32063682491966744,
                0.33760911361683693,
                0.3715536910111758,
                0.43944284579985365
              ],
              "variance": 0.7926058821578135,
              "mean_reward": 0.11939397322465818,
              "min_reward": -0.663755919516161,
              "max_reward": 0.43944284579985365,
              "num_responses": 7,
              "rvariance": 0.1420275785912038
            },
            {
              "id": "chat_sample_280",
              "rewards": [
                -0.8249926621392708,
                -1.257786023917092,
                -0.7740757960477624,
                -0.663755919516161,
                -0.40917158905861917,
                -0.5873806203788985,
                -1.037146270853889
              ],
              "variance": 0.6093051642283835,
              "mean_reward": -0.7934726974159562,
              "min_reward": -1.257786023917092,
              "max_reward": -0.40917158905861917,
              "num_responses": 7,
              "rvariance": 0.06904587886974849
            },
            {
              "id": "chat_sample_58",
              "rewards": [
                -0.5534360429845595,
                -0.03578123772089113,
                0.04908020576495615,
                -0.29036556817843295,
                -0.2649071351326788,
                0.09151092750787979,
                -0.4176577334072039
              ],
              "variance": 0.5380215517002718,
              "mean_reward": -0.20307951202156144,
              "min_reward": -0.5534360429845595,
              "max_reward": 0.09151092750787979,
              "num_responses": 7,
              "rvariance": 0.05122739791153582
            },
            {
              "id": "chat_sample_90",
              "rewards": [
                -0.4006854447100344,
                -0.5110053212416359,
                -0.8886387447536563,
                -0.8462080230107327,
                -0.5619221873331443,
                -0.5364637542873901
              ],
              "variance": 0.4115780009063594,
              "mean_reward": -0.624153912556099,
              "min_reward": -0.8886387447536563,
              "max_reward": -0.4006854447100344,
              "num_responses": 6,
              "rvariance": 0.032260560958616714
            },
            {
              "id": "chat_sample_180",
              "rewards": [
                0.7109994649545649,
                0.3885259797083453,
                0.5243042892857009,
                1.1522789710809709,
                0.8467777745319206
              ],
              "variance": 0.5872411889220632,
              "mean_reward": 0.7245772959123006,
              "min_reward": 0.3885259797083453,
              "max_reward": 1.1522789710809709,
              "num_responses": 5,
              "rvariance": 0.07021716034322731
            },
            {
              "id": "chat_sample_291",
              "rewards": [
                1.1692512597781404,
                1.2541127032639876,
                0.3885259797083453,
                1.1353066823838014,
                0.4733874231941926,
                0.7449440423489039
              ],
              "variance": 0.780725280069795,
              "mean_reward": 0.8609213484462286,
              "min_reward": 0.3885259797083453,
              "max_reward": 1.2541127032639876,
              "num_responses": 6,
              "rvariance": 0.11862412506020777
            },
            {
              "id": "chat_sample_129",
              "rewards": [
                -0.06123967076664532,
                -0.03578123772089113,
                0.13394164925080343,
                0.16788622664514236,
                -0.13761496990390787,
                -0.850451095185025,
                -0.6552697751675763
              ],
              "variance": 0.8808617833830948,
              "mean_reward": -0.2055041246925857,
              "min_reward": -0.850451095185025,
              "max_reward": 0.16788622664514236,
              "num_responses": 7,
              "rvariance": 0.13244522162588326
            },
            {
              "id": "chat_sample_31",
              "rewards": [
                0.4733874231941926,
                0.21880309273665072,
                -0.21399026904117044,
                -0.6552697751675763,
                -0.027295093372306404,
                0.22728923708523543
              ],
              "variance": 0.7849683522440873,
              "mean_reward": 0.0038207692391709117,
              "min_reward": -0.6552697751675763,
              "max_reward": 0.4733874231941926,
              "num_responses": 6,
              "rvariance": 0.13324309817892613
            },
            {
              "id": "chat_sample_294",
              "rewards": [
                -0.15458725860107733,
                -0.5279776099388054,
                0.015135628370617235,
                -0.03578123772089113,
                0.09151092750787979,
                -0.4431161664529581,
                -0.29036556817843295
              ],
              "variance": 0.5227464918728193,
              "mean_reward": -0.19216875500195257,
              "min_reward": -0.5279776099388054,
              "max_reward": 0.09151092750787979,
              "num_responses": 7,
              "rvariance": 0.04781478550762872
            },
            {
              "id": "chat_sample_128",
              "rewards": [
                0.09999707185646452,
                -0.7952911569192243,
                -0.45160231080154284,
                -1.0753339204225203,
                -0.6298113421218221,
                -0.4176577334072039,
                -1.2195983743484606
              ],
              "variance": 0.9224438906911601,
              "mean_reward": -0.6413282523091871,
              "min_reward": -1.2195983743484606,
              "max_reward": 0.09999707185646452,
              "num_responses": 7,
              "rvariance": 0.16888316276717047
            },
            {
              "id": "chat_sample_173",
              "rewards": [
                -0.5279776099388054,
                -0.8631803117079021,
                -0.9522848273680418,
                -0.43463002210437335,
                -0.8546941673593174,
                -0.9098541056251181,
                -0.7231589299562541
              ],
              "variance": 0.4361878195172551,
              "mean_reward": -0.7522542820085446,
              "min_reward": -0.9522848273680418,
              "max_reward": -0.43463002210437335,
              "num_responses": 7,
              "rvariance": 0.03424002475453311
            },
            {
              "id": "chat_sample_174",
              "rewards": [
                -0.977743260413796,
                -1.0032016934595502,
                -1.1135215699911516,
                -0.6807282082133305,
                -1.2280845186970455,
                -0.7571035073505931,
                -0.8292357343135632
              ],
              "variance": 0.43279336177782124,
              "mean_reward": -0.9413740703484329,
              "min_reward": -1.2280845186970455,
              "max_reward": -0.6807282082133305,
              "num_responses": 7,
              "rvariance": 0.03306427543363489
            },
            {
              "id": "chat_sample_297",
              "rewards": [
                0.5243042892857009,
                0.26123381447957433,
                0.21031694838806597,
                -1.0116878378081349,
                0.42247055710268416,
                -0.15458725860107733,
                0.29517839187391326
              ],
              "variance": 0.9606315402597911,
              "mean_reward": 0.07817555781724665,
              "min_reward": -1.0116878378081349,
              "max_reward": 0.5243042892857009,
              "num_responses": 7,
              "rvariance": 0.23680179197550782
            },
            {
              "id": "chat_sample_264",
              "rewards": [
                -2.2697587374858212,
                -3.481155843246291,
                -2.189140366174266,
                -2.5094923153333397,
                -3.082307058862809
              ],
              "variance": 1.10022861479401,
              "mean_reward": -2.7063708642205055,
              "min_reward": -3.481155843246291,
              "max_reward": -2.189140366174266,
              "num_responses": 5,
              "rvariance": 0.2477076972997967
            },
            {
              "id": "chat_sample_275",
              "rewards": [
                -0.11215653685815369,
                -0.8971248891022411,
                -0.5788944760303137,
                -0.3327962899213566,
                -0.6552697751675763,
                -0.5364637542873901,
                -0.4176577334072039
              ],
              "variance": 0.5074714320453668,
              "mean_reward": -0.5043376363963193,
              "min_reward": -0.8971248891022411,
              "max_reward": -0.11215653685815369,
              "num_responses": 7,
              "rvariance": 0.053485571450986
            },
            {
              "id": "chat_sample_172",
              "rewards": [
                -0.19701798034400098,
                -1.177167652605537,
                -0.9607709717166265,
                -0.23944870208692462,
                -0.6467836308189916,
                -1.117764642165444,
                -0.803777301267809
              ],
              "variance": 0.919049432951726,
              "mean_reward": -0.734675840143619,
              "min_reward": -1.177167652605537,
              "max_reward": -0.19701798034400098,
              "num_responses": 7,
              "rvariance": 0.134357283958994
            },
            {
              "id": "chat_sample_145",
              "rewards": [
                0.8298054858347511,
                0.8128331971375817,
                1.3389741467498348,
                1.2371404145668181,
                1.084389816292293,
                1.2371404145668181,
                1.3729187241441738
              ],
              "variance": 0.5295354073516871,
              "mean_reward": 1.1304574570417532,
              "min_reward": 0.8128331971375817,
              "max_reward": 1.3729187241441738,
              "num_responses": 7,
              "rvariance": 0.04548974122555249
            },
            {
              "id": "chat_sample_270",
              "rewards": [
                0.5243042892857009,
                -0.5619221873331443,
                0.303664536222498,
                0.5073320005885315,
                0.17637237099372707,
                0.5582488666800398,
                0.5073320005885315
              ],
              "variance": 0.6568275725804579,
              "mean_reward": 0.28790455386084063,
              "min_reward": -0.5619221873331443,
              "max_reward": 0.5582488666800398,
              "num_responses": 7,
              "rvariance": 0.1371658551492896
            },
            {
              "id": "chat_sample_278",
              "rewards": [
                0.2442615257824049,
                -0.4261438777557886,
                -0.15458725860107733,
                0.04908020576495615,
                -0.01032280467513695,
                0.22728923708523543,
                0.21031694838806597
              ],
              "variance": 0.49728805882706506,
              "mean_reward": 0.019984853712665653,
              "min_reward": -0.4261438777557886,
              "max_reward": 0.2442615257824049,
              "num_responses": 7,
              "rvariance": 0.051538971481573874
            },
            {
              "id": "chat_sample_165",
              "rewards": [
                1.0504452388979542,
                1.084389816292293,
                1.2880572806583264,
                1.610530765904546,
                1.5086970337215293,
                1.5935584772073768,
                1.5935584772073768
              ],
              "variance": 0.5295354073516869,
              "mean_reward": 1.389891012841343,
              "min_reward": 1.0504452388979542,
              "max_reward": 1.610530765904546,
              "num_responses": 7,
              "rvariance": 0.05209745240900052
            },
            {
              "id": "chat_sample_127",
              "rewards": [
                1.0165006615036152,
                1.2201681258696486,
                1.4408078789328516,
                1.084389816292293,
                0.8128331971375817,
                1.1353066823838014,
                1.0334729502007847
              ],
              "variance": 0.373390351337728,
              "mean_reward": 1.1062113303315109,
              "min_reward": 0.8128331971375817,
              "max_reward": 1.4408078789328516,
              "num_responses": 7,
              "rvariance": 0.03223904637902943
            },
            {
              "id": "chat_sample_256",
              "rewards": [
                -0.06123967076664532,
                -0.4006854447100344,
                0.22728923708523543,
                0.1594000822965576,
                0.04059406141637142,
                -0.06972581511523004,
                0.35458140231400637
              ],
              "variance": 0.4803157701298957,
              "mean_reward": 0.03574483607432301,
              "min_reward": -0.4006854447100344,
              "max_reward": 0.35458140231400637,
              "num_responses": 7,
              "rvariance": 0.052094513035698266
            },
            {
              "id": "chat_sample_114",
              "rewards": [
                -0.6977004969105,
                0.14242779359938815,
                -0.36674086731569555,
                -0.7146727856076693,
                0.1848585153423118,
                -0.29036556817843295,
                -0.36674086731569555
              ],
              "variance": 0.8638894946859252,
              "mean_reward": -0.3012763251980419,
              "min_reward": -0.7146727856076693,
              "max_reward": 0.1848585153423118,
              "num_responses": 7,
              "rvariance": 0.10999134897002931
            },
            {
              "id": "chat_sample_119",
              "rewards": [
                -2.0915497061655417,
                -1.828479231359415,
                -1.5229780348103648,
                -2.0830635618169566,
                -1.8271532713049485,
                -1.105035425642567,
                -1.7611204605925237
              ],
              "variance": 0.7306570284131451,
              "mean_reward": -1.7456256702417596,
              "min_reward": -2.0915497061655417,
              "max_reward": -1.105035425642567,
              "num_responses": 7,
              "rvariance": 0.101029593027481
            },
            {
              "id": "chat_sample_179",
              "rewards": [
                -1.117764642165444,
                -1.7298278033071175,
                -1.4147796943659094,
                -0.9522848273680418,
                -0.7316450743048388,
                -1.1135215699911516,
                -1.3893212613201553
              ],
              "variance": 0.6767700117996323,
              "mean_reward": -1.2070206961175225,
              "min_reward": -1.7298278033071175,
              "max_reward": -0.7316450743048388,
              "num_responses": 7,
              "rvariance": 0.09390080616416642
            },
            {
              "id": "chat_sample_191",
              "rewards": [
                -0.23944870208692462,
                -0.001836660326552221,
                0.21031694838806597,
                0.23577538143382018,
                0.16788622664514236,
                0.303664536222498,
                0.1254555049022187
              ],
              "variance": 0.3598125203799925,
              "mean_reward": 0.11454474788260978,
              "min_reward": -0.23944870208692462,
              "max_reward": 0.303664536222498,
              "num_responses": 7,
              "rvariance": 0.028779404002286398
            },
            {
              "id": "chat_sample_156",
              "rewards": [
                0.3885259797083453,
                0.7279717536517344,
                0.8298054858347511,
                0.7958609084404122,
                0.9486115067149373,
                0.6940271762573955
              ],
              "variance": 0.3479319182919738,
              "mean_reward": 0.7308004684345959,
              "min_reward": 0.3885259797083453,
              "max_reward": 0.9486115067149373,
              "num_responses": 6,
              "rvariance": 0.02999810083310077
            },
            {
              "id": "chat_sample_166",
              "rewards": [
                0.3885259797083453,
                0.1848585153423118,
                0.21880309273665072,
                0.43944284579985365,
                0.33760911361683693,
                0.09151092750787979,
                0.0660524944621256
              ],
              "variance": 0.32756517185537054,
              "mean_reward": 0.2466861384534291,
              "min_reward": 0.0660524944621256,
              "max_reward": 0.43944284579985365,
              "num_responses": 7,
              "rvariance": 0.018121236408343955
            },
            {
              "id": "chat_sample_245",
              "rewards": [
                -0.18853183599541623,
                -0.2988517125270177,
                -0.12064268120673842,
                -0.570408331681729,
                -0.5279776099388054,
                -0.3327962899213566,
                -0.22247641338975516
              ],
              "variance": 0.3835737245560298,
              "mean_reward": -0.3230978392372598,
              "min_reward": -0.570408331681729,
              "max_reward": -0.12064268120673842,
              "num_responses": 7,
              "rvariance": 0.024720129471885264
            },
            {
              "id": "chat_sample_161",
              "rewards": [
                0.4564151344970231,
                0.9486115067149373,
                1.0165006615036152,
                0.9316392180177678,
                0.8807223519262595,
                1.1692512597781404,
                1.2031958371724791
              ],
              "variance": 0.4718296257813108,
              "mean_reward": 0.9437622813728889,
              "min_reward": 0.4564151344970231,
              "max_reward": 1.2031958371724791,
              "num_responses": 7,
              "rvariance": 0.05215623987504544
            },
            {
              "id": "chat_sample_296",
              "rewards": [
                -2.1679250053028043,
                -2.072455881381226,
                -2.895611883193945,
                -3.260516090183088
              ],
              "variance": 1.0499482095286456,
              "mean_reward": -2.599127215015266,
              "min_reward": -3.260516090183088,
              "max_reward": -2.072455881381226,
              "num_responses": 4,
              "rvariance": 0.2471641104983866
            },
            {
              "id": "chat_sample_130",
              "rewards": [
                -0.1800456916468315,
                -0.5873806203788985,
                -0.3243101455727719,
                0.1254555049022187,
                -0.5873806203788985,
                -0.01032280467513695,
                0.03210791706778669
              ],
              "variance": 0.656827572580458,
              "mean_reward": -0.2188394943832188,
              "min_reward": -0.5873806203788985,
              "max_reward": 0.1254555049022187,
              "num_responses": 7,
              "rvariance": 0.07275242860388018
            },
            {
              "id": "chat_sample_18",
              "rewards": [
                1.4408078789328516,
                1.0504452388979542,
                1.2880572806583264,
                0.9655837954121068,
                1.3050295693554959,
                1.3050295693554959,
                1.3389741467498348
              ],
              "variance": 0.3632069781194265,
              "mean_reward": 1.2419896399088661,
              "min_reward": 0.9655837954121068,
              "max_reward": 1.4408078789328516,
              "num_responses": 7,
              "rvariance": 0.02458491829998196
            },
            {
              "id": "chat_sample_44",
              "rewards": [
                0.6091657327715482,
                -0.39219930036144973,
                0.7109994649545649,
                0.8467777745319206,
                0.7619163310460734,
                0.5412765779828704,
                0.6940271762573955
              ],
              "variance": 0.6279746817952698,
              "mean_reward": 0.5388519653118462,
              "min_reward": -0.39219930036144973,
              "max_reward": 0.8467777745319206,
              "num_responses": 7,
              "rvariance": 0.15287092670318767
            },
            {
              "id": "chat_sample_215",
              "rewards": [
                -2.2400572322657744,
                -1.7473304760260735,
                -1.537828787420388,
                -2.1509527166056346,
                -1.4147796943659094,
                -0.8674233838821945
              ],
              "variance": 1.0544034353116523,
              "mean_reward": -1.659728715094329,
              "min_reward": -2.2400572322657744,
              "max_reward": -0.8674233838821945,
              "num_responses": 6,
              "rvariance": 0.21472727150190404
            },
            {
              "id": "chat_sample_300",
              "rewards": [
                0.16788622664514236,
                -0.06972581511523004,
                -0.06972581511523004,
                -0.06972581511523004,
                -0.477060743847297,
                -0.9225833221479952
              ],
              "variance": 0.7489022387626023,
              "mean_reward": -0.24015588078263997,
              "min_reward": -0.9225833221479952,
              "max_reward": 0.16788622664514236,
              "num_responses": 6,
              "rvariance": 0.1292447850260747
            },
            {
              "id": "chat_sample_169",
              "rewards": [
                -0.383713156012865,
                -0.6892143525619152,
                -0.45160231080154284,
                -0.3327962899213566,
                -0.5788944760303137,
                -0.09518424816098423
              ],
              "variance": 0.420064145254944,
              "mean_reward": -0.4219008055814963,
              "min_reward": -0.6892143525619152,
              "max_reward": -0.09518424816098423,
              "num_responses": 6,
              "rvariance": 0.035521224092649406
            },
            {
              "id": "chat_sample_82",
              "rewards": [
                -0.6892143525619152,
                -0.8971248891022411,
                -0.7571035073505931,
                -1.2408137352199224,
                -0.9819863325880883,
                -0.6213251977732374,
                -1.1729245804312447
              ],
              "variance": 0.5380215517002718,
              "mean_reward": -0.9086417992896061,
              "min_reward": -1.2408137352199224,
              "max_reward": -0.6213251977732374,
              "num_responses": 7,
              "rvariance": 0.04847981871726178
            },
            {
              "id": "chat_sample_77",
              "rewards": [
                0.015135628370617235,
                -0.477060743847297,
                -0.11215653685815369,
                -0.1715595472982468,
                -0.30733785687560244,
                -0.39219930036144973
              ],
              "variance": 0.3861195678606052,
              "mean_reward": -0.2408630594783554,
              "min_reward": -0.477060743847297,
              "max_reward": 0.015135628370617235,
              "num_responses": 6,
              "rvariance": 0.028335762756793306
            },
            {
              "id": "chat_sample_277",
              "rewards": [
                -1.4169012304530557,
                -1.4190227665402018,
                -1.2790013847885537,
                -1.6131433185140776,
                -0.8843956725793639
              ],
              "variance": 0.49325714026148737,
              "mean_reward": -1.3224928745750506,
              "min_reward": -1.6131433185140776,
              "max_reward": -0.8843956725793639,
              "num_responses": 5,
              "rvariance": 0.05930586126892874
            },
            {
              "id": "chat_sample_73",
              "rewards": [
                -1.3914427974073014,
                -1.444481199585956,
                -0.8546941673593174,
                -1.0116878378081349,
                -1.2365706630456301,
                -1.151709219559783
              ],
              "variance": 0.4847709959129026,
              "mean_reward": -1.1817643141276872,
              "min_reward": -1.444481199585956,
              "max_reward": -0.8546941673593174,
              "num_responses": 6,
              "rvariance": 0.0421321935918153
            },
            {
              "id": "chat_sample_6",
              "rewards": [
                -1.7754408291807604,
                -1.7791535173332662,
                -1.2790013847885537,
                -1.0583616317253508,
                -1.457210416108833,
                -1.5144918904617801,
                -1.257786023917092
              ],
              "variance": 0.5989096374013672,
              "mean_reward": -1.4459208133593766,
              "min_reward": -1.7791535173332662,
              "max_reward": -1.0583616317253508,
              "num_responses": 7,
              "rvariance": 0.06255940535309112
            },
            {
              "id": "chat_sample_80",
              "rewards": [
                -1.4147796943659094,
                -2.8362088727538515,
                -2.8362088727538515,
                -2.467061593590416
              ],
              "variance": 1.1057446086205902,
              "mean_reward": -2.388564758366007,
              "min_reward": -2.8362088727538515,
              "max_reward": -1.4147796943659094,
              "num_responses": 4,
              "rvariance": 0.3387974025755194
            },
            {
              "id": "chat_sample_224",
              "rewards": [
                -0.7910480847449319,
                -1.3214321065314774,
                -1.5208564987232185,
                -1.117764642165444,
                -0.7316450743048388,
                -1.024417054331012,
                -0.9565278995423342
              ],
              "variance": 0.633914982839279,
              "mean_reward": -1.0662416229061795,
              "min_reward": -1.5208564987232185,
              "max_reward": -0.7316450743048388,
              "num_responses": 7,
              "rvariance": 0.06798917416759119
            },
            {
              "id": "chat_sample_267",
              "rewards": [
                0.16788622664514236,
                -0.4261438777557886,
                -0.5025191768930511,
                -0.19701798034400098,
                -0.2988517125270177,
                -0.2564209907840941,
                -0.22247641338975516
              ],
              "variance": 0.4056376998623501,
              "mean_reward": -0.24793484643550937,
              "min_reward": -0.5025191768930511,
              "max_reward": 0.16788622664514236,
              "num_responses": 7,
              "rvariance": 0.03934057227725474
            },
            {
              "id": "chat_sample_308",
              "rewards": [
                0.1254555049022187,
                -0.22247641338975516,
                0.2866922475253285,
                -0.11215653685815369,
                0.29517839187391326,
                0.11696936055363398,
                -0.10367039250956896
              ],
              "variance": 0.4463711927355567,
              "mean_reward": 0.055141737442516665,
              "min_reward": -0.22247641338975516,
              "max_reward": 0.29517839187391326,
              "num_responses": 7,
              "rvariance": 0.035754536848515144
            },
            {
              "id": "chat_sample_252",
              "rewards": [
                0.42247055710268416,
                0.42247055710268416,
                0.42247055710268416,
                0.7109994649545649,
                0.6940271762573955,
                0.490359711891362,
                0.8298054858347511
              ],
              "variance": 0.3360513162039553,
              "mean_reward": 0.5703719300351608,
              "min_reward": 0.42247055710268416,
              "max_reward": 0.8298054858347511,
              "num_responses": 7,
              "rvariance": 0.024914128109833473
            },
            {
              "id": "chat_sample_159",
              "rewards": [
                0.7619163310460734,
                1.0165006615036152,
                1.2201681258696486,
                1.1692512597781404,
                0.897694640623429,
                1.084389816292293,
                1.2541127032639876
              ],
              "variance": 0.3903626400348976,
              "mean_reward": 1.057719076911027,
              "min_reward": 0.7619163310460734,
              "max_reward": 1.2541127032639876,
              "num_responses": 7,
              "rvariance": 0.027559564081854487
            },
            {
              "id": "chat_sample_188",
              "rewards": [
                1.1862235484753096,
                1.3559464354470043,
                1.5086970337215293,
                1.4068633015385126,
                1.4747524563271905,
                1.3559464354470043,
                1.3729187241441738
              ],
              "variance": 0.20027300662659964,
              "mean_reward": 1.3801925621572464,
              "min_reward": 1.1862235484753096,
              "max_reward": 1.5086970337215293,
              "num_responses": 7,
              "rvariance": 0.00928841963509601
            },
            {
              "id": "chat_sample_88",
              "rewards": [
                0.7619163310460734,
                0.3715536910111758,
                0.897694640623429,
                0.9316392180177678,
                0.7958609084404122,
                0.9316392180177678,
                0.9655837954121068
              ],
              "variance": 0.33944577394338904,
              "mean_reward": 0.8079839717955332,
              "min_reward": 0.3715536910111758,
              "max_reward": 0.9655837954121068,
              "num_responses": 7,
              "rvariance": 0.03660107635956187
            },
            {
              "id": "chat_sample_27",
              "rewards": [
                -1.257786023917092,
                -1.1262507865140288,
                -1.270515240439969,
                -1.3532551478386703,
                -1.5590441482918498,
                -0.9225833221479952,
                -1.1983830134769988
              ],
              "variance": 0.39078694725232666,
              "mean_reward": -1.2411168118038005,
              "min_reward": -1.5590441482918498,
              "max_reward": -0.9225833221479952,
              "num_responses": 7,
              "rvariance": 0.03303984189305997
            },
            {
              "id": "chat_sample_167",
              "rewards": [
                0.9825560841092762,
                0.7958609084404122,
                1.1692512597781404,
                1.0504452388979542,
                0.9316392180177678,
                1.1692512597781404,
                1.084389816292293
              ],
              "variance": 0.2919233655913147,
              "mean_reward": 1.026199112187712,
              "min_reward": 0.7958609084404122,
              "max_reward": 1.1692512597781404,
              "num_responses": 7,
              "rvariance": 0.015543406022274596
            },
            {
              "id": "chat_sample_76",
              "rewards": [
                -0.40917158905861917,
                -0.6892143525619152,
                -0.8886387447536563,
                -0.7825619403963472,
                -0.7316450743048388,
                -0.6892143525619152
              ],
              "variance": 0.28640737176473463,
              "mean_reward": -0.6984076756062154,
              "min_reward": -0.8886387447536563,
              "max_reward": -0.40917158905861917,
              "num_responses": 6,
              "rvariance": 0.02136684546035994
            },
            {
              "id": "chat_sample_209",
              "rewards": [
                -0.5364637542873901,
                -0.29036556817843295,
                0.303664536222498,
                -0.3582547229671108,
                -0.4855468881958817,
                -0.4006854447100344,
                0.2697199588281591
              ],
              "variance": 0.7892114244183797,
              "mean_reward": -0.2139902690411704,
              "min_reward": -0.5364637542873901,
              "max_reward": 0.303664536222498,
              "num_responses": 7,
              "rvariance": 0.10588210509349003
            },
            {
              "id": "chat_sample_61",
              "rewards": [
                1.5426416111158683,
                1.3050295693554959,
                1.423835590235682,
                1.5935584772073768,
                1.5256693224186988,
                1.3389741467498348,
                1.49172474502436
              ],
              "variance": 0.23761204176037243,
              "mean_reward": 1.4602047803010454,
              "min_reward": 1.3050295693554959,
              "max_reward": 1.5935584772073768,
              "num_responses": 7,
              "rvariance": 0.009993869227634952
            },
            {
              "id": "chat_sample_118",
              "rewards": [
                1.0504452388979542,
                1.0674175275951234,
                1.3389741467498348,
                1.3050295693554959,
                1.271084991961157,
                1.3050295693554959,
                1.49172474502436
              ],
              "variance": 0.33944577394338915,
              "mean_reward": 1.2613865412770602,
              "min_reward": 1.0504452388979542,
              "max_reward": 1.49172474502436,
              "num_responses": 7,
              "rvariance": 0.020728460527435783
            },
            {
              "id": "chat_sample_150",
              "rewards": [
                -0.018808949023721676,
                0.3715536910111758,
                0.19334465969089654,
                0.5243042892857009,
                0.23577538143382018,
                0.490359711891362,
                0.35458140231400637
              ],
              "variance": 0.3954543266440484,
              "mean_reward": 0.3073014552290343,
              "min_reward": -0.018808949023721676,
              "max_reward": 0.5243042892857009,
              "num_responses": 7,
              "rvariance": 0.03020206068057325
            },
            {
              "id": "chat_sample_120",
              "rewards": [
                0.8467777745319206,
                1.1013621049894624,
                1.1013621049894624,
                1.1692512597781404,
                1.3559464354470043,
                1.3729187241441738,
                1.2880572806583264
              ],
              "variance": 0.3632069781194265,
              "mean_reward": 1.176525097791213,
              "min_reward": 0.8467777745319206,
              "max_reward": 1.3729187241441738,
              "num_responses": 7,
              "rvariance": 0.02904100822618626
            },
            {
              "id": "chat_sample_244",
              "rewards": [
                -0.01032280467513695,
                -0.45160231080154284,
                -0.13761496990390787,
                -0.2055041246925857,
                -0.5958667647274832,
                -0.29036556817843295
              ],
              "variance": 0.4497656504749906,
              "mean_reward": -0.28187942382984826,
              "min_reward": -0.5958667647274832,
              "max_reward": -0.01032280467513695,
              "num_responses": 6,
              "rvariance": 0.03797572327391205
            },
            {
              "id": "chat_sample_8",
              "rewards": [
                1.457780167630021,
                1.423835590235682,
                1.5086970337215293,
                0.7788886197432427,
                1.4747524563271905,
                1.4068633015385126,
                1.457780167630021
              ],
              "variance": 0.3326568584645213,
              "mean_reward": 1.3583710481180287,
              "min_reward": 0.7788886197432427,
              "max_reward": 1.5086970337215293,
              "num_responses": 7,
              "rvariance": 0.056906267131474286
            },
            {
              "id": "chat_sample_40",
              "rewards": [
                0.5582488666800398,
                0.5921934440743788,
                0.6600825988630565,
                0.6261380214687177,
                0.897694640623429,
                0.7449440423489039,
                0.8637500632290901
              ],
              "variance": 0.29871228107018244,
              "mean_reward": 0.7061502396125166,
              "min_reward": 0.5582488666800398,
              "max_reward": 0.897694640623429,
              "num_responses": 7,
              "rvariance": 0.015202438719214102
            },
            {
              "id": "chat_sample_286",
              "rewards": [
                -0.43463002210437335,
                0.303664536222498,
                0.10848321620504925,
                0.29517839187391326,
                0.17637237099372707,
                0.2442615257824049,
                0.33760911361683693
              ],
              "variance": 0.4260044462989533,
              "mean_reward": 0.14727701894143658,
              "min_reward": -0.43463002210437335,
              "max_reward": 0.33760911361683693,
              "num_responses": 7,
              "rvariance": 0.061847353652549085
            },
            {
              "id": "chat_sample_307",
              "rewards": [
                -1.4508458078473945,
                -0.5194914655902206,
                -0.5449498986359749,
                -0.5194914655902206,
                -1.0541185595510585,
                -0.7231589299562541,
                -0.5958667647274832
              ],
              "variance": 0.6933179932793722,
              "mean_reward": -0.7725604131283722,
              "min_reward": -1.4508458078473945,
              "max_reward": -0.5194914655902206,
              "num_responses": 7,
              "rvariance": 0.10755736416493857
            },
            {
              "id": "chat_sample_206",
              "rewards": [
                1.423835590235682,
                1.2880572806583264,
                1.2201681258696486,
                0.6600825988630565,
                1.423835590235682,
                1.3389741467498348,
                1.4408078789328516
              ],
              "variance": 0.43449059064753803,
              "mean_reward": 1.2565373159350117,
              "min_reward": 0.6600825988630565,
              "max_reward": 1.4408078789328516,
              "num_responses": 7,
              "rvariance": 0.06497190747283613
            },
            {
              "id": "chat_sample_261",
              "rewards": [
                0.33760911361683693,
                -0.5025191768930511,
                -0.3327962899213566,
                -0.5025191768930511,
                -0.5364637542873901,
                -0.49403303254446645,
                -0.850451095185025
              ],
              "variance": 0.5974245621403651,
              "mean_reward": -0.41159620172964345,
              "min_reward": -0.850451095185025,
              "max_reward": 0.33760911361683693,
              "num_responses": 7,
              "rvariance": 0.11414762281940456
            },
            {
              "id": "chat_sample_79",
              "rewards": [
                0.5582488666800398,
                -0.34128243426994137,
                0.5582488666800398,
                0.42247055710268416,
                0.1509139379479729,
                0.6261380214687177,
                0.2782061031767438
              ],
              "variance": 0.6313691395347037,
              "mean_reward": 0.32184913125517955,
              "min_reward": -0.34128243426994137,
              "max_reward": 0.6261380214687177,
              "num_responses": 7,
              "rvariance": 0.09790758532449774
            },
            {
              "id": "chat_sample_69",
              "rewards": [
                0.897694640623429,
                0.9825560841092762,
                1.1522789710809709,
                0.6431103101658872,
                1.1862235484753096,
                1.457780167630021
              ],
              "variance": 0.5515993826580072,
              "mean_reward": 1.0532739536808158,
              "min_reward": 0.6431103101658872,
              "max_reward": 1.457780167630021,
              "num_responses": 6,
              "rvariance": 0.06475716992325542
            },
            {
              "id": "chat_sample_203",
              "rewards": [
                0.677054887560226,
                1.0504452388979542,
                0.5582488666800398,
                0.8467777745319206,
                1.118334393686632,
                0.7449440423489039
              ],
              "variance": 0.4667379391721602,
              "mean_reward": 0.8326342006176128,
              "min_reward": 0.5582488666800398,
              "max_reward": 1.118334393686632,
              "num_responses": 6,
              "rvariance": 0.0394080145646896
            },
            {
              "id": "chat_sample_168",
              "rewards": [
                -1.0201739821567195,
                -0.9480417551937494,
                -0.7231589299562541,
                -0.5873806203788985,
                -0.5958667647274832,
                -0.7401312186534236,
                -0.5619221873331443
              ],
              "variance": 0.39969739881834065,
              "mean_reward": -0.7395250654856674,
              "min_reward": -1.0201739821567195,
              "max_reward": -0.5619221873331443,
              "num_responses": 7,
              "rvariance": 0.028262809144416732
            },
            {
              "id": "chat_sample_265",
              "rewards": [
                -0.2055041246925857,
                -0.570408331681729,
                -0.8419649508364403,
                -1.0201739821567195,
                -0.7825619403963472,
                -0.6552697751675763
              ],
              "variance": 0.5431132383094226,
              "mean_reward": -0.6793138508218997,
              "min_reward": -1.0201739821567195,
              "max_reward": -0.2055041246925857,
              "num_responses": 6,
              "rvariance": 0.06503922728638338
            },
            {
              "id": "chat_sample_301",
              "rewards": [
                -1.3829566530587167,
                -1.491154993503172,
                -0.9735001882395036,
                -1.0456324152024739,
                -1.024417054331012,
                -1.0116878378081349,
                -1.024417054331012
              ],
              "variance": 0.4298232112558166,
              "mean_reward": -1.1362523137820035,
              "min_reward": -1.491154993503172,
              "max_reward": -0.9735001882395036,
              "num_responses": 7,
              "rvariance": 0.03743567466656822
            },
            {
              "id": "chat_sample_196",
              "rewards": [
                -1.5144918904617801,
                -2.08412432986053,
                -1.940390259956376,
                -1.5208564987232185,
                -1.828479231359415,
                -1.8313963434792409,
                -1.9157274029433018
              ],
              "variance": 0.47957323249939443,
              "mean_reward": -1.8050665652548374,
              "min_reward": -2.08412432986053,
              "max_reward": -1.5144918904617801,
              "num_responses": 7,
              "rvariance": 0.03926885329096901
            },
            {
              "id": "chat_sample_225",
              "rewards": [
                -0.7061866412590847,
                -0.3243101455727719,
                0.21880309273665072,
                0.7449440423489039,
                0.33760911361683693,
                0.3885259797083453,
                0.015135628370617235
              ],
              "variance": 1.0081539486118658,
              "mean_reward": 0.09636015284992819,
              "min_reward": -0.7061866412590847,
              "max_reward": 0.7449440423489039,
              "num_responses": 7,
              "rvariance": 0.20097964954104103
            },
            {
              "id": "chat_sample_126",
              "rewards": [
                0.19334465969089654,
                0.6261380214687177,
                0.6940271762573955,
                0.6940271762573955,
                0.8128331971375817,
                0.7958609084404122,
                0.6261380214687177
              ],
              "variance": 0.3496291471616908,
              "mean_reward": 0.6346241658173024,
              "min_reward": 0.19334465969089654,
              "max_reward": 0.8128331971375817,
              "num_responses": 7,
              "rvariance": 0.03709783044764137
            },
            {
              "id": "chat_sample_162",
              "rewards": [
                0.4733874231941926,
                0.22728923708523543,
                0.3715536910111758,
                0.35458140231400637,
                0.6091657327715482,
                0.6091657327715482,
                0.32063682491966744
              ],
              "variance": 0.3258679429856535,
              "mean_reward": 0.42368286343819633,
              "min_reward": 0.22728923708523543,
              "max_reward": 0.6091657327715482,
              "num_responses": 7,
              "rvariance": 0.018279962566665208
            },
            {
              "id": "chat_sample_49",
              "rewards": [
                -0.93106946649658,
                -1.2832444569628463,
                -0.49403303254446645,
                -0.9650140438909188,
                -0.850451095185025,
                -1.4890334574160258,
                -1.1729245804312447
              ],
              "variance": 0.6576761870153165,
              "mean_reward": -1.026538590418158,
              "min_reward": -1.4890334574160258,
              "max_reward": -0.49403303254446645,
              "num_responses": 7,
              "rvariance": 0.0898138372259332
            },
            {
              "id": "chat_sample_177",
              "rewards": [
                -0.18853183599541623,
                -0.19701798034400098,
                -0.2564209907840941,
                -0.3243101455727719,
                0.03210791706778669
              ],
              "variance": 0.2410064994998063,
              "mean_reward": -0.1868346071256993,
              "min_reward": -0.3243101455727719,
              "max_reward": 0.03210791706778669,
              "num_responses": 5,
              "rvariance": 0.014356839807624092
            },
            {
              "id": "chat_sample_273",
              "rewards": [
                -1.2408137352199224,
                -1.3341613230543545,
                -0.7401312186534236,
                -1.7844573575511318,
                -1.291730601311431,
                -0.6298113421218221,
                -1.3129459621828927
              ],
              "variance": 0.8182764688122824,
              "mean_reward": -1.19057879144214,
              "min_reward": -1.7844573575511318,
              "max_reward": -0.6298113421218221,
              "num_responses": 7,
              "rvariance": 0.13119997220108465
            },
            {
              "id": "chat_sample_285",
              "rewards": [
                -1.3808351169715705,
                -0.9098541056251181,
                -0.6298113421218221,
                -0.8886387447536563,
                -0.7061866412590847,
                -0.8631803117079021,
                -1.1559522917340752
              ],
              "variance": 0.5702689002248936,
              "mean_reward": -0.9334940791676042,
              "min_reward": -1.3808351169715705,
              "max_reward": -0.6298113421218221,
              "num_responses": 7,
              "rvariance": 0.05728691597411506
            },
            {
              "id": "chat_sample_293",
              "rewards": [
                -1.4635750243702716,
                -0.9819863325880883,
                -1.3999289417558862,
                -1.4487242717602484,
                -1.4020504778430323,
                -0.9056110334508257,
                -1.3532551478386703
              ],
              "variance": 0.5032283598710745,
              "mean_reward": -1.2793044613724318,
              "min_reward": -1.4635750243702716,
              "max_reward": -0.9056110334508257,
              "num_responses": 7,
              "rvariance": 0.046541302024430846
            },
            {
              "id": "chat_sample_233",
              "rewards": [
                -0.7995342290935167,
                -0.7316450743048388,
                -0.5279776099388054,
                -0.4261438777557886,
                -0.1800456916468315,
                -0.383713156012865,
                -0.40917158905861917
              ],
              "variance": 0.45655456595385846,
              "mean_reward": -0.4940330325444665,
              "min_reward": -0.7995342290935167,
              "max_reward": -0.1800456916468315,
              "num_responses": 7,
              "rvariance": 0.03907308930675039
            },
            {
              "id": "chat_sample_235",
              "rewards": [
                -1.527221106984657,
                -1.9220920112047402,
                -1.317189034357185,
                -1.0286601265053044,
                -1.32567517870577,
                -1.573894900901873,
                -1.2365706630456301
              ],
              "variance": 0.5597672965935201,
              "mean_reward": -1.4187575745293084,
              "min_reward": -1.9220920112047402,
              "max_reward": -1.0286601265053044,
              "num_responses": 7,
              "rvariance": 0.07050372478369181
            },
            {
              "id": "chat_sample_158",
              "rewards": [
                0.9655837954121068,
                1.1522789710809709,
                1.3898910128413433,
                0.677054887560226,
                1.1862235484753096,
                1.118334393686632,
                0.9655837954121068
              ],
              "variance": 0.41751830195036876,
              "mean_reward": 1.0649929149240993,
              "min_reward": 0.677054887560226,
              "max_reward": 1.3898910128413433,
              "num_responses": 7,
              "rvariance": 0.04299715266524824
            },
            {
              "id": "chat_sample_216",
              "rewards": [
                0.2442615257824049,
                0.5412765779828704,
                0.9995283728064457,
                0.6600825988630565,
                1.118334393686632,
                0.8807223519262595,
                0.7619163310460734
              ],
              "variance": 0.6245802240558359,
              "mean_reward": 0.7437317360133917,
              "min_reward": 0.2442615257824049,
              "max_reward": 1.118334393686632,
              "num_responses": 7,
              "rvariance": 0.07461599127750386
            },
            {
              "id": "chat_sample_242",
              "rewards": [
                -0.9480417551937494,
                -0.7740757960477624,
                -0.6807282082133305,
                -0.3327962899213566,
                -0.8334788064878556,
                -0.6467836308189916,
                -0.9225833221479952
              ],
              "variance": 0.4115780009063593,
              "mean_reward": -0.734069686975863,
              "min_reward": -0.9480417551937494,
              "max_reward": -0.3327962899213566,
              "num_responses": 7,
              "rvariance": 0.037755515224018814
            },
            {
              "id": "chat_sample_92",
              "rewards": [
                1.457780167630021,
                1.4068633015385126,
                1.4068633015385126,
                1.4408078789328516,
                1.457780167630021,
                1.4408078789328516,
                1.3389741467498348
              ],
              "variance": 0.07807252800697961,
              "mean_reward": 1.421410977564658,
              "min_reward": 1.3389741467498348,
              "max_reward": 1.457780167630021,
              "num_responses": 7,
              "rvariance": 0.001516716623958716
            },
            {
              "id": "chat_sample_250",
              "rewards": [
                -0.29036556817843295,
                -0.4176577334072039,
                -0.34128243426994137,
                -0.4261438777557886,
                -0.001836660326552221,
                -0.3158240012241872
              ],
              "variance": 0.2757996913290036,
              "mean_reward": -0.29885171252701775,
              "min_reward": -0.4261438777557886,
              "max_reward": -0.001836660326552221,
              "num_responses": 6,
              "rvariance": 0.020116091089467946
            },
            {
              "id": "chat_sample_283",
              "rewards": [
                -0.850451095185025,
                -0.1715595472982468,
                -0.22247641338975516,
                -0.07821195946381478,
                -0.24793484643550934,
                -0.1715595472982468,
                -0.4176577334072039
              ],
              "variance": 0.45655456595385835,
              "mean_reward": -0.30855016321111456,
              "min_reward": -0.850451095185025,
              "max_reward": -0.07821195946381478,
              "num_responses": 7,
              "rvariance": 0.058176076398044375
            },
            {
              "id": "chat_sample_140",
              "rewards": [
                -0.2564209907840941,
                -0.12064268120673842,
                0.0066494840220325075,
                0.04059406141637142,
                -1.1983830134769988,
                -0.6213251977732374,
                -0.5110053212416359
              ],
              "variance": 0.8723756390345099,
              "mean_reward": -0.38007623700632864,
              "min_reward": -1.1983830134769988,
              "max_reward": 0.04059406141637142,
              "num_responses": 7,
              "rvariance": 0.16486944852295413
            },
            {
              "id": "chat_sample_232",
              "rewards": [
                -1.0074447656338426,
                -0.1461011142524926,
                -0.4006854447100344,
                -0.29036556817843295,
                -0.36674086731569555,
                -0.23944870208692462,
                -0.2649071351326788
              ],
              "variance": 0.44127950612640576,
              "mean_reward": -0.3879562281871573,
              "min_reward": -1.0074447656338426,
              "max_reward": -0.1461011142524926,
              "num_responses": 7,
              "rvariance": 0.06994165288360783
            },
            {
              "id": "chat_sample_0",
              "rewards": [
                1.610530765904546,
                1.5935584772073768,
                1.678419920693224,
                1.7293367867847322,
                1.4747524563271905,
                1.712364498087563,
                1.6275030546017155
              ],
              "variance": 0.17311734471112827,
              "mean_reward": 1.632352279943764,
              "min_reward": 1.4747524563271905,
              "max_reward": 1.7293367867847322,
              "num_responses": 7,
              "rvariance": 0.006396076305686361
            },
            {
              "id": "chat_sample_34",
              "rewards": [
                1.2880572806583264,
                0.8807223519262595,
                1.1013621049894624,
                1.084389816292293,
                0.9486115067149373,
                1.0674175275951234,
                1.084389816292293
              ],
              "variance": 0.2545843304575418,
              "mean_reward": 1.064992914924099,
              "min_reward": 0.8807223519262595,
              "max_reward": 1.2880572806583264,
              "num_responses": 7,
              "rvariance": 0.01419129430324162
            },
            {
              "id": "chat_sample_68",
              "rewards": [
                1.610530765904546,
                1.5256693224186988,
                1.5426416111158683,
                1.423835590235682,
                1.118334393686632,
                1.610530765904546,
                1.7463090754819017
              ],
              "variance": 0.36320697811942626,
              "mean_reward": 1.5111216463925534,
              "min_reward": 1.118334393686632,
              "max_reward": 1.7463090754819017,
              "num_responses": 7,
              "rvariance": 0.03402618534679473
            },
            {
              "id": "chat_sample_149",
              "rewards": [
                -0.2733932794812635,
                0.05756635011354087,
                0.05756635011354087,
                -0.08669810381239951,
                0.09151092750787979,
                0.015135628370617235,
                -0.08669810381239951
              ],
              "variance": 0.23252035515122155,
              "mean_reward": -0.032144318714354816,
              "min_reward": -0.2733932794812635,
              "max_reward": 0.09151092750787979,
              "num_responses": 7,
              "rvariance": 0.01396790193227096
            },
            {
              "id": "chat_sample_309",
              "rewards": [
                -0.3243101455727719,
                -0.837721878662148,
                -0.5279776099388054,
                -0.5534360429845595,
                -0.1800456916468315,
                -0.6043529090760679,
                -0.4431161664529581
              ],
              "variance": 0.43109613290810417,
              "mean_reward": -0.49585149204773454,
              "min_reward": -0.837721878662148,
              "max_reward": -0.1800456916468315,
              "num_responses": 7,
              "rvariance": 0.03784810548303955
            },
            {
              "id": "chat_sample_243",
              "rewards": [
                -0.7655896516991778,
                -0.803777301267809,
                -0.6977004969105,
                -0.5449498986359749,
                -0.6552697751675763,
                -1.2408137352199224,
                -0.23944870208692462
              ],
              "variance": 0.5558424548322998,
              "mean_reward": -0.7067927944268408,
              "min_reward": -1.2408137352199224,
              "max_reward": -0.23944870208692462,
              "num_responses": 7,
              "rvariance": 0.07791176359264669
            },
            {
              "id": "chat_sample_281",
              "rewards": [
                -2.2718802735729673,
                -2.3949293666274456,
                -1.9366775718038702,
                -1.8559266044868687,
                -2.3206756035773295,
                -2.399172438801738,
                -2.27612334574726
              ],
              "variance": 0.492249410620093,
              "mean_reward": -2.2079121720882116,
              "min_reward": -2.399172438801738,
              "max_reward": -1.8559266044868687,
              "num_responses": 7,
              "rvariance": 0.041496891795487253
            },
            {
              "id": "chat_sample_99",
              "rewards": [
                1.8820873850592574,
                1.831170518967749,
                1.7463090754819017,
                1.8820873850592574,
                1.8481428076649185,
                1.8481428076649185,
                1.8820873850592574
              ],
              "variance": 0.08486144348584745,
              "mean_reward": 1.8457181949938946,
              "min_reward": 1.7463090754819017,
              "max_reward": 1.8820873850592574,
              "num_responses": 7,
              "rvariance": 0.002010531338735973
            },
            {
              "id": "chat_sample_43",
              "rewards": [
                0.7109994649545649,
                0.21031694838806597,
                0.6261380214687177,
                0.6600825988630565,
                0.5243042892857009,
                0.5412765779828704,
                0.5582488666800398
              ],
              "variance": 0.28173999237301295,
              "mean_reward": 0.5473381096604308,
              "min_reward": 0.21031694838806597,
              "max_reward": 0.7109994649545649,
              "num_responses": 7,
              "rvariance": 0.022853627424959326
            },
            {
              "id": "chat_sample_148",
              "rewards": [
                -0.07821195946381478,
                0.0066494840220325075,
                -0.383713156012865,
                -0.5194914655902206
              ],
              "variance": 0.45994902369329227,
              "mean_reward": -0.24369177426121696,
              "min_reward": -0.5194914655902206,
              "max_reward": 0.0066494840220325075,
              "num_responses": 4,
              "rvariance": 0.046431442947259406
            },
            {
              "id": "chat_sample_249",
              "rewards": [
                0.7279717536517344,
                0.5412765779828704,
                0.7958609084404122,
                0.43944284579985365,
                0.490359711891362,
                0.8807223519262595,
                0.6940271762573955
              ],
              "variance": 0.35981252037999256,
              "mean_reward": 0.6528087608499841,
              "min_reward": 0.43944284579985365,
              "max_reward": 0.8807223519262595,
              "num_responses": 7,
              "rvariance": 0.02344444145871068
            },
            {
              "id": "chat_sample_100",
              "rewards": [
                1.084389816292293,
                1.3729187241441738,
                1.3729187241441738,
                1.1862235484753096,
                1.3220018580526653,
                1.1692512597781404
              ],
              "variance": 0.24609818610895706,
              "mean_reward": 1.251283988481126,
              "min_reward": 1.084389816292293,
              "max_reward": 1.3729187241441738,
              "num_responses": 6,
              "rvariance": 0.01223448817653004
            },
            {
              "id": "chat_sample_141",
              "rewards": [
                -0.6552697751675763,
                -0.6128390534246526,
                -0.23096255773833987,
                -0.39219930036144973,
                -0.39219930036144973,
                -0.6128390534246526,
                -0.943798683019457
              ],
              "variance": 0.4429767349961229,
              "mean_reward": -0.5485868176425112,
              "min_reward": -0.943798683019457,
              "max_reward": -0.23096255773833987,
              "num_responses": 7,
              "rvariance": 0.046518521881338426
            },
            {
              "id": "chat_sample_97",
              "rewards": [
                0.5921934440743788,
                0.40549826840551473,
                0.6940271762573955,
                0.5412765779828704,
                0.4564151344970231,
                0.6261380214687177,
                0.5921934440743788
              ],
              "variance": 0.21724529532376907,
              "mean_reward": 0.5582488666800398,
              "min_reward": 0.40549826840551473,
              "max_reward": 0.6940271762573955,
              "num_responses": 7,
              "rvariance": 0.008477152603676234
            },
            {
              "id": "chat_sample_137",
              "rewards": [
                -0.46008845515012753,
                0.22728923708523543,
                0.22728923708523543,
                0.3885259797083453,
                0.32063682491966744,
                0.2866922475253285,
                0.33760911361683693
              ],
              "variance": 0.40563769986235,
              "mean_reward": 0.18970774068436022,
              "min_reward": -0.46008845515012753,
              "max_reward": 0.3885259797083453,
              "num_responses": 7,
              "rvariance": 0.07328739454488886
            },
            {
              "id": "chat_sample_207",
              "rewards": [
                -1.1007923534682744,
                -0.7316450743048388,
                -0.9140971777994105,
                -0.837721878662148,
                -1.1389800030369057,
                -1.0413893430281813,
                -1.2280845186970455
              ],
              "variance": 0.37933065238173747,
              "mean_reward": -0.9989586212852578,
              "min_reward": -1.2280845186970455,
              "max_reward": -0.7316450743048388,
              "num_responses": 7,
              "rvariance": 0.026990060504544406
            },
            {
              "id": "chat_sample_190",
              "rewards": [
                -0.9353125386708723,
                -0.570408331681729,
                -0.6043529090760679,
                -0.5364637542873901,
                -0.49403303254446645,
                -0.4006854447100344,
                -0.5110053212416359
              ],
              "variance": 0.28004276350329604,
              "mean_reward": -0.5788944760303137,
              "min_reward": -0.9353125386708723,
              "max_reward": -0.4006854447100344,
              "num_responses": 7,
              "rvariance": 0.024731886965094242
            },
            {
              "id": "chat_sample_254",
              "rewards": [
                0.19334465969089654,
                0.6261380214687177,
                0.4564151344970231,
                0.4733874231941926,
                0.35458140231400637,
                0.7788886197432427,
                0.5243042892857009
              ],
              "variance": 0.39715155551376535,
              "mean_reward": 0.48672279288482573,
              "min_reward": 0.19334465969089654,
              "max_reward": 0.7788886197432427,
              "num_responses": 7,
              "rvariance": 0.03011975822811038
            },
            {
              "id": "chat_sample_171",
              "rewards": [
                -0.7571035073505931,
                -1.467818096544564,
                -1.2026260856512914,
                -1.0795769925968126,
                -1.1983830134769988,
                -0.8716664560564868,
                -0.7995342290935167
              ],
              "variance": 0.5261409496122532,
              "mean_reward": -1.0538154829671806,
              "min_reward": -1.467818096544564,
              "max_reward": -0.7571035073505931,
              "num_responses": 7,
              "rvariance": 0.05728305804665588
            },
            {
              "id": "chat_sample_131",
              "rewards": [
                1.1353066823838014,
                1.3389741467498348,
                1.3898910128413433,
                1.423835590235682,
                1.423835590235682,
                1.271084991961157,
                1.5426416111158683
              ],
              "variance": 0.2545843304575417,
              "mean_reward": 1.3607956607890528,
              "min_reward": 1.1353066823838014,
              "max_reward": 1.5426416111158683,
              "num_responses": 7,
              "rvariance": 0.014461716647048208
            },
            {
              "id": "chat_sample_272",
              "rewards": [
                -1.2492998795685073,
                -1.1814107247798293,
                -1.1898968691284142,
                -1.2068691578255837,
                -1.270515240439969,
                -0.9607709717166265,
                -1.096549281293982
              ],
              "variance": 0.2155480664540521,
              "mean_reward": -1.165044589250416,
              "min_reward": -1.270515240439969,
              "max_reward": -0.9607709717166265,
              "num_responses": 7,
              "rvariance": 0.009611015855017462
            },
            {
              "id": "chat_sample_317",
              "rewards": [
                -1.6110217824269313,
                -0.383713156012865,
                -0.3582547229671108,
                -0.001836660326552221,
                -0.2988517125270177,
                -0.36674086731569555,
                -0.30733785687560244
              ],
              "variance": 0.69459091493166,
              "mean_reward": -0.4753938226359678,
              "min_reward": -1.6110217824269313,
              "max_reward": -0.001836660326552221,
              "num_responses": 7,
              "rvariance": 0.22960707875805975
            },
            {
              "id": "chat_sample_221",
              "rewards": [
                -1.9387991078910165,
                -2.0459366802918986,
                -1.9780475255032208,
                -2.282487954008698,
                -2.035328999856168,
                -2.282487954008698,
                -1.8377609517406794
              ],
              "variance": 0.3841041085778163,
              "mean_reward": -2.0572641676143397,
              "min_reward": -2.282487954008698,
              "max_reward": -1.8377609517406794,
              "num_responses": 7,
              "rvariance": 0.02436455428724751
            },
            {
              "id": "chat_sample_263",
              "rewards": [
                -1.0116878378081349,
                -0.8207495899649785,
                -0.6128390534246526,
                -0.46008845515012753,
                -0.5788944760303137,
                -0.5364637542873901,
                -0.5194914655902206
              ],
              "variance": 0.4013946276880576,
              "mean_reward": -0.6486020903222597,
              "min_reward": -1.0116878378081349,
              "max_reward": -0.46008845515012753,
              "num_responses": 7,
              "rvariance": 0.033198016918887054
            },
            {
              "id": "chat_sample_112",
              "rewards": [
                2.085754849425291,
                1.865115096362088,
                1.678419920693224,
                2.0008934059394434,
                1.6953922093903935,
                1.899059673756427,
                1.831170518967749
              ],
              "variance": 0.34623468942225677,
              "mean_reward": 1.8651150963620877,
              "min_reward": 1.678419920693224,
              "max_reward": 2.085754849425291,
              "num_responses": 7,
              "rvariance": 0.01901186651892436
            },
            {
              "id": "chat_sample_138",
              "rewards": [
                -0.6213251977732374,
                -0.5619221873331443,
                -0.06123967076664532,
                -0.19701798034400098,
                -0.2055041246925857,
                -0.29036556817843295,
                0.07453863881071034
              ],
              "variance": 0.5787550445734785,
              "mean_reward": -0.2661194414681909,
              "min_reward": -0.6213251977732374,
              "max_reward": 0.07453863881071034,
              "num_responses": 7,
              "rvariance": 0.054390163584752065
            },
            {
              "id": "chat_sample_1",
              "rewards": [
                -2.026842855507583,
                -2.210355727045728,
                -2.2039911187842893,
                -1.4699396326317102,
                -2.0554835926840562,
                -2.25915105705009
              ],
              "variance": 0.4863621479782627,
              "mean_reward": -2.0376273306172425,
              "min_reward": -2.25915105705009,
              "max_reward": -1.4699396326317102,
              "num_responses": 6,
              "rvariance": 0.07154820729354061
            },
            {
              "id": "chat_sample_42",
              "rewards": [
                -1.1686815082569524,
                -1.4720611687188563,
                -1.3829566530587167,
                -1.291730601311431,
                -1.5908671895990425,
                -1.3129459621828927,
                -1.3468905395772317
              ],
              "variance": 0.27707261298129127,
              "mean_reward": -1.3665905175293034,
              "min_reward": -1.5908671895990425,
              "max_reward": -1.1686815082569524,
              "num_responses": 7,
              "rvariance": 0.015675677820875627
            },
            {
              "id": "chat_sample_101",
              "rewards": [
                -1.39780740566874,
                -1.3214321065314774,
                -1.317189034357185,
                -0.9947155491109654,
                -1.4147796943659094,
                -0.8801526004050716,
                -0.7825619403963472
              ],
              "variance": 0.563479984746026,
              "mean_reward": -1.1583769044050996,
              "min_reward": -1.4147796943659094,
              "max_reward": -0.7825619403963472,
              "num_responses": 7,
              "rvariance": 0.06004404813162142
            },
            {
              "id": "chat_sample_21",
              "rewards": [
                -1.8268880792940554,
                -1.6004141019912004,
                -1.3468905395772317,
                -1.2662721682656768,
                -1.7796839013550527,
                -1.8268880792940554,
                -1.4784257769802949
              ],
              "variance": 0.5122448882414457,
              "mean_reward": -1.5893518066796524,
              "min_reward": -1.8268880792940554,
              "max_reward": -1.2662721682656768,
              "num_responses": 7,
              "rvariance": 0.046381163589093256
            },
            {
              "id": "chat_sample_66",
              "rewards": [
                -0.4855468881958817,
                -0.09518424816098423,
                -0.1461011142524926,
                0.10848321620504925,
                0.0066494840220325075,
                -0.07821195946381478,
                0.08302478315929505
              ],
              "variance": 0.3750875802074449,
              "mean_reward": -0.0866981038123995,
              "min_reward": -0.4855468881958817,
              "max_reward": 0.10848321620504925,
              "num_responses": 7,
              "rvariance": 0.034052639706514946
            },
            {
              "id": "chat_sample_151",
              "rewards": [
                -0.4006854447100344,
                -0.2055041246925857,
                -0.45160231080154284,
                -0.19701798034400098,
                -0.16307340294966205,
                -0.4431161664529581,
                -0.2988517125270177
              ],
              "variance": 0.2630704748061266,
              "mean_reward": -0.3085501632111146,
              "min_reward": -0.45160231080154284,
              "max_reward": -0.16307340294966205,
              "num_responses": 7,
              "rvariance": 0.013053756835272585
            },
            {
              "id": "chat_sample_33",
              "rewards": [
                0.5582488666800398,
                0.32063682491966744,
                0.16788622664514236,
                0.16788622664514236,
                0.5752211553772093,
                0.33760911361683693,
                0.303664536222498
              ],
              "variance": 0.3971515555137653,
              "mean_reward": 0.34730756430093374,
              "min_reward": 0.16788622664514236,
              "max_reward": 0.5752211553772093,
              "num_responses": 7,
              "rvariance": 0.02336213900624781
            },
            {
              "id": "chat_sample_219",
              "rewards": [
                -0.37522701166428024,
                -0.06972581511523004,
                -0.15458725860107733,
                -0.23944870208692462
              ],
              "variance": 0.23930927063008933,
              "mean_reward": -0.20974719686687807,
              "min_reward": -0.37522701166428024,
              "max_reward": -0.06972581511523004,
              "num_responses": 4,
              "rvariance": 0.012728588663711668
            },
            {
              "id": "chat_sample_5",
              "rewards": [
                0.4564151344970231,
                0.1848585153423118,
                0.6940271762573955,
                0.04908020576495615,
                0.21880309273665072,
                -0.2649071351326788,
                0.677054887560226
              ],
              "variance": 0.7603585336331917,
              "mean_reward": 0.28790455386084063,
              "min_reward": -0.2649071351326788,
              "max_reward": 0.6940271762573955,
              "num_responses": 7,
              "rvariance": 0.10325724473458471
            },
            {
              "id": "chat_sample_86",
              "rewards": [
                1.1692512597781404,
                0.7619163310460734,
                1.0504452388979542,
                1.1522789710809709,
                1.2201681258696486,
                1.2880572806583264,
                1.3389741467498348
              ],
              "variance": 0.3733903513377278,
              "mean_reward": 1.1401559077258498,
              "min_reward": 0.7619163310460734,
              "max_reward": 1.3389741467498348,
              "num_responses": 7,
              "rvariance": 0.031416021854400664
            },
            {
              "id": "chat_sample_108",
              "rewards": [
                0.8467777745319206,
                0.9825560841092762,
                0.9316392180177678,
                0.9316392180177678,
                0.9486115067149373,
                1.1862235484753096,
                1.1013621049894624
              ],
              "variance": 0.23761204176037243,
              "mean_reward": 0.9898299221223489,
              "min_reward": 0.8467777745319206,
              "max_reward": 1.1862235484753096,
              "num_responses": 7,
              "rvariance": 0.011428283399130781
            },
            {
              "id": "chat_sample_28",
              "rewards": [
                -1.1389800030369057,
                -1.0413893430281813,
                -0.9225833221479952,
                -1.0329031986795967,
                -1.1898968691284142,
                -0.8843956725793639,
                -0.6977004969105
              ],
              "variance": 0.3496291471616908,
              "mean_reward": -0.9868355579301367,
              "min_reward": -1.1898968691284142,
              "max_reward": -0.6977004969105,
              "num_responses": 7,
              "rvariance": 0.02395736209995253
            },
            {
              "id": "chat_sample_255",
              "rewards": [
                0.5073320005885315,
                0.6431103101658872,
                0.897694640623429,
                0.7109994649545649,
                1.118334393686632,
                0.8128331971375817,
                0.897694640623429
              ],
              "variance": 0.39715155551376535,
              "mean_reward": 0.7982855211114366,
              "min_reward": 0.5073320005885315,
              "max_reward": 1.118334393686632,
              "num_responses": 7,
              "rvariance": 0.034108487799257625
            },
            {
              "id": "chat_sample_29",
              "rewards": [
                1.1692512597781404,
                1.1522789710809709,
                1.2031958371724791,
                1.3389741467498348,
                1.2880572806583264,
                1.1862235484753096,
                1.271084991961157
              ],
              "variance": 0.14596168279565713,
              "mean_reward": 1.2298665765537453,
              "min_reward": 1.1522789710809709,
              "max_reward": 1.3389741467498348,
              "num_responses": 7,
              "rvariance": 0.004185667582397691
            },
            {
              "id": "chat_sample_60",
              "rewards": [
                1.6614476319960545,
                1.5596138998130378,
                1.3050295693554959,
                1.5596138998130378,
                1.6614476319960545,
                1.4068633015385126,
                1.49172474502436
              ],
              "variance": 0.2953178233307485,
              "mean_reward": 1.5208200970766506,
              "min_reward": 1.3050295693554959,
              "max_reward": 1.6614476319960545,
              "num_responses": 7,
              "rvariance": 0.014708624004436848
            },
            {
              "id": "chat_sample_125",
              "rewards": [
                -1.3214321065314774,
                -1.0838200647711052,
                -0.9013679612765334,
                -1.3596197561001087,
                -0.977743260413796,
                -1.6269333030805277,
                -0.9819863325880883
              ],
              "variance": 0.5193520341333853,
              "mean_reward": -1.1789861121088054,
              "min_reward": -1.6269333030805277,
              "max_reward": -0.9013679612765334,
              "num_responses": 7,
              "rvariance": 0.05985886761357995
            },
            {
              "id": "chat_sample_314",
              "rewards": [
                -0.03578123772089113,
                0.5752211553772093,
                0.2866922475253285,
                0.6940271762573955,
                0.5582488666800398,
                0.1848585153423118,
                0.08302478315929505
              ],
              "variance": 0.5872411889220632,
              "mean_reward": 0.3351845009458127,
              "min_reward": -0.03578123772089113,
              "max_reward": 0.6940271762573955,
              "num_responses": 7,
              "rvariance": 0.06604183935485353
            },
            {
              "id": "chat_sample_310",
              "rewards": [
                0.9316392180177678,
                0.8467777745319206,
                0.9995283728064457,
                1.0334729502007847,
                0.9995283728064457,
                0.9995283728064457,
                1.0334729502007847
              ],
              "variance": 0.1357783095773557,
              "mean_reward": 0.9777068587672278,
              "min_reward": 0.8467777745319206,
              "max_reward": 1.0334729502007847,
              "num_responses": 7,
              "rvariance": 0.00384470027933721
            },
            {
              "id": "chat_sample_222",
              "rewards": [
                0.07453863881071034,
                0.3715536910111758,
                0.42247055710268416,
                0.5921934440743788,
                0.3715536910111758,
                0.6261380214687177,
                0.42247055710268416
              ],
              "variance": 0.3530236049011247,
              "mean_reward": 0.41155980008307524,
              "min_reward": 0.07453863881071034,
              "max_reward": 0.6261380214687177,
              "num_responses": 7,
              "rvariance": 0.027956379477657643
            },
            {
              "id": "chat_sample_143",
              "rewards": [
                -1.4975196017646106,
                -0.9989586212852578,
                -0.803777301267809,
                -1.2323275908713378,
                -1.16443843608266,
                -0.7868050125706396,
                -0.8843956725793639
              ],
              "variance": 0.5414160094397056,
              "mean_reward": -1.0526031766316686,
              "min_reward": -1.4975196017646106,
              "max_reward": -0.7868050125706396,
              "num_responses": 7,
              "rvariance": 0.05807044266999493
            },
            {
              "id": "chat_sample_12",
              "rewards": [
                -0.044267382069475864,
                -0.40917158905861917,
                0.2782061031767438,
                0.21031694838806597,
                0.0066494840220325075,
                -0.09518424816098423,
                -0.018808949023721676
              ],
              "variance": 0.4582517948235753,
              "mean_reward": -0.010322804675136951,
              "min_reward": -0.40917158905861917,
              "max_reward": 0.2782061031767438,
              "num_responses": 7,
              "rvariance": 0.042817850893811245
            },
            {
              "id": "chat_sample_248",
              "rewards": [
                -1.7844573575511318,
                -1.257786023917092,
                -1.5293426430718033,
                -1.4826688491545872,
                -1.3087028900086004
              ],
              "variance": 0.4042587014057051,
              "mean_reward": -1.4725915527406428,
              "min_reward": -1.7844573575511318,
              "max_reward": -1.257786023917092,
              "num_responses": 5,
              "rvariance": 0.03471668547042932
            },
            {
              "id": "chat_sample_64",
              "rewards": [
                1.0674175275951234,
                0.897694640623429,
                0.8467777745319206,
                0.9825560841092762,
                1.2031958371724791,
                1.0165006615036152,
                0.897694640623429
              ],
              "variance": 0.24440095723924005,
              "mean_reward": 0.9874053094513248,
              "min_reward": 0.8467777745319206,
              "max_reward": 1.2031958371724791,
              "num_responses": 7,
              "rvariance": 0.01281566759779069
            },
            {
              "id": "chat_sample_4",
              "rewards": [
                1.0334729502007847,
                1.0504452388979542,
                1.2371404145668181,
                1.3559464354470043,
                1.2031958371724791,
                1.1353066823838014,
                1.271084991961157
              ],
              "variance": 0.26137324593640976,
              "mean_reward": 1.1837989358042855,
              "min_reward": 1.0334729502007847,
              "max_reward": 1.3559464354470043,
              "num_responses": 7,
              "rvariance": 0.011886825634281091
            },
            {
              "id": "chat_sample_311",
              "rewards": [
                -0.383713156012865,
                -0.2733932794812635,
                0.08302478315929505,
                0.07453863881071034,
                0.14242779359938815,
                0.14242779359938815,
                0.2442615257824049
              ],
              "variance": 0.500682516566499,
              "mean_reward": 0.004224871351008301,
              "min_reward": -0.383713156012865,
              "max_reward": 0.2442615257824049,
              "num_responses": 7,
              "rvariance": 0.04779127052121076
            },
            {
              "id": "chat_sample_117",
              "rewards": [
                -1.317189034357185,
                -1.1686815082569524,
                -0.850451095185025,
                -0.9140971777994105,
                -0.6807282082133305,
                -0.8589372395336098,
                -1.0413893430281813
              ],
              "variance": 0.4455225783006983,
              "mean_reward": -0.9759248009105279,
              "min_reward": -1.317189034357185,
              "max_reward": -0.6807282082133305,
              "num_responses": 7,
              "rvariance": 0.03975649359952248
            },
            {
              "id": "chat_sample_39",
              "rewards": [
                0.14242779359938815,
                0.17637237099372707,
                -0.027295093372306404,
                0.40549826840551473,
                0.32063682491966744,
                0.2866922475253285,
                -0.027295093372306404
              ],
              "variance": 0.38187649568631277,
              "mean_reward": 0.18243390267128756,
              "min_reward": -0.027295093372306404,
              "max_reward": 0.40549826840551473,
              "num_responses": 7,
              "rvariance": 0.02419104227748106
            },
            {
              "id": "chat_sample_287",
              "rewards": [
                0.07453863881071034,
                0.14242779359938815,
                0.35458140231400637,
                0.1509139379479729,
                0.23577538143382018,
                0.42247055710268416
              ],
              "variance": 0.280042763503296,
              "mean_reward": 0.23011795186809703,
              "min_reward": 0.07453863881071034,
              "max_reward": 0.42247055710268416,
              "num_responses": 6,
              "rvariance": 0.015115074012730689
            },
            {
              "id": "chat_sample_313",
              "rewards": [
                -1.117764642165444,
                -0.9947155491109654,
                -0.6722420638647457,
                -0.7571035073505931,
                -0.7061866412590847,
                -0.4685745994987123,
                -0.5279776099388054
              ],
              "variance": 0.5397187805699887,
              "mean_reward": -0.7492235161697643,
              "min_reward": -1.117764642165444,
              "max_reward": -0.4685745994987123,
              "num_responses": 7,
              "rvariance": 0.047377553728919684
            },
            {
              "id": "chat_sample_3",
              "rewards": [
                1.6614476319960545,
                1.3050295693554959,
                1.4408078789328516,
                1.6614476319960545,
                1.5256693224186988,
                1.4747524563271905,
                1.3389741467498348
              ],
              "variance": 0.33605131620395534,
              "mean_reward": 1.4868755196823114,
              "min_reward": 1.3050295693554959,
              "max_reward": 1.6614476319960545,
              "num_responses": 7,
              "rvariance": 0.01709539512586025
            },
            {
              "id": "chat_sample_170",
              "rewards": [
                -0.9225833221479952,
                -0.9056110334508257,
                -0.6977004969105,
                -0.7868050125706396,
                -1.0413893430281813,
                -0.8801526004050716
              ],
              "variance": 0.23973357784751848,
              "mean_reward": -0.8723736347522023,
              "min_reward": -1.0413893430281813,
              "max_reward": -0.6977004969105,
              "num_responses": 6,
              "rvariance": 0.011680875586135205
            },
            {
              "id": "chat_sample_83",
              "rewards": [
                -1.2408137352199224,
                -1.6704247928670244,
                -1.7298278033071175,
                -1.2620290960913843,
                -1.395685869581594,
                -1.327796714792916,
                -1.457210416108833
              ],
              "variance": 0.4406430453002621,
              "mean_reward": -1.4405412039955416,
              "min_reward": -1.7298278033071175,
              "max_reward": -1.2408137352199224,
              "num_responses": 7,
              "rvariance": 0.03189885984700237
            },
            {
              "id": "chat_sample_279",
              "rewards": [
                0.4564151344970231,
                0.3715536910111758,
                0.6940271762573955,
                0.29517839187391326,
                0.5412765779828704,
                0.5752211553772093,
                0.4733874231941926
              ],
              "variance": 0.28173999237301306,
              "mean_reward": 0.4867227928848257,
              "min_reward": 0.29517839187391326,
              "max_reward": 0.6940271762573955,
              "num_responses": 7,
              "rvariance": 0.014976106974941195
            },
            {
              "id": "chat_sample_55",
              "rewards": [
                -0.1461011142524926,
                0.1594000822965576,
                0.4733874231941926,
                -0.3582547229671108,
                -0.3158240012241872,
                0.13394164925080343
              ],
              "variance": 0.6534331148410241,
              "mean_reward": -0.008908447283706156,
              "min_reward": -0.3582547229671108,
              "max_reward": 0.4733874231941926,
              "num_responses": 6,
              "rvariance": 0.08606750389064823
            },
            {
              "id": "chat_sample_103",
              "rewards": [
                0.303664536222498,
                -0.18853183599541623,
                0.42247055710268416,
                0.08302478315929505,
                0.0066494840220325075,
                0.29517839187391326,
                0.40549826840551473
              ],
              "variance": 0.4837102278693295,
              "mean_reward": 0.18970774068436022,
              "min_reward": -0.18853183599541623,
              "max_reward": 0.42247055710268416,
              "num_responses": 7,
              "rvariance": 0.04468729231403944
            },
            {
              "id": "chat_sample_113",
              "rewards": [
                0.1848585153423118,
                0.303664536222498,
                0.4564151344970231,
                0.6600825988630565,
                0.3715536910111758,
                0.5921934440743788,
                0.4564151344970231
              ],
              "variance": 0.3632069781194264,
              "mean_reward": 0.432169007786781,
              "min_reward": 0.1848585153423118,
              "max_reward": 0.6600825988630565,
              "num_responses": 7,
              "rvariance": 0.022868324291470548
            },
            {
              "id": "chat_sample_104",
              "rewards": [
                0.08302478315929505,
                0.43944284579985365,
                0.5752211553772093,
                0.5752211553772093,
                0.5412765779828704,
                0.490359711891362,
                0.6600825988630565
              ],
              "variance": 0.312290112027918,
              "mean_reward": 0.48066126120726516,
              "min_reward": 0.08302478315929505,
              "max_reward": 0.6600825988630565,
              "num_responses": 7,
              "rvariance": 0.03052245237051802
            },
            {
              "id": "chat_sample_282",
              "rewards": [
                0.8128331971375817,
                0.897694640623429,
                0.9316392180177678,
                1.0165006615036152,
                1.0165006615036152,
                0.9146669293205985,
                0.9146669293205985
              ],
              "variance": 0.15275059827452508,
              "mean_reward": 0.9292146053467437,
              "min_reward": 0.8128331971375817,
              "max_reward": 1.0165006615036152,
              "num_responses": 7,
              "rvariance": 0.004315000007696499
            },
            {
              "id": "chat_sample_62",
              "rewards": [
                1.5086970337215293,
                1.4408078789328516,
                1.3898910128413433,
                1.457780167630021,
                1.4408078789328516,
                1.423835590235682,
                1.4747524563271905
              ],
              "variance": 0.07807252800697939,
              "mean_reward": 1.4480817169459244,
              "min_reward": 1.3898910128413433,
              "max_reward": 1.5086970337215293,
              "num_responses": 7,
              "rvariance": 0.0012227792937341555
            },
            {
              "id": "chat_sample_91",
              "rewards": [
                0.42247055710268416,
                0.20183080403948125,
                0.4733874231941926,
                0.5243042892857009,
                0.20183080403948125,
                0.3715536910111758,
                0.5073320005885315
              ],
              "variance": 0.312290112027918,
              "mean_reward": 0.386101367037321,
              "min_reward": 0.20183080403948125,
              "max_reward": 0.5243042892857009,
              "num_responses": 7,
              "rvariance": 0.01583734335249914
            },
            {
              "id": "chat_sample_284",
              "rewards": [
                -1.3214321065314774,
                -0.803777301267809,
                -0.7910480847449319,
                -0.7868050125706396,
                -0.8801526004050716,
                -0.8631803117079021,
                -0.6382974864704068
              ],
              "variance": 0.3292624007250873,
              "mean_reward": -0.8692418433854625,
              "min_reward": -1.3214321065314774,
              "max_reward": -0.6382974864704068,
              "num_responses": 7,
              "rvariance": 0.039308974014255586
            },
            {
              "id": "chat_sample_84",
              "rewards": [
                0.42247055710268416,
                0.5243042892857009,
                0.4564151344970231,
                0.5921934440743788,
                0.6600825988630565,
                0.4564151344970231,
                0.19334465969089654
              ],
              "variance": 0.2885289078518808,
              "mean_reward": 0.47217511685868047,
              "min_reward": 0.19334465969089654,
              "max_reward": 0.6600825988630565,
              "num_responses": 7,
              "rvariance": 0.0190206846388311
            },
            {
              "id": "chat_sample_175",
              "rewards": [
                0.32063682491966744,
                -0.06972581511523004,
                0.29517839187391326,
                0.303664536222498,
                0.4564151344970231,
                0.5243042892857009,
                0.5243042892857009
              ],
              "variance": 0.3750875802074449,
              "mean_reward": 0.33639680728132487,
              "min_reward": -0.06972581511523004,
              "max_reward": 0.5243042892857009,
              "num_responses": 7,
              "rvariance": 0.036139594751109325
            },
            {
              "id": "chat_sample_185",
              "rewards": [
                0.7619163310460734,
                1.0674175275951234,
                1.0674175275951234,
                1.084389816292293,
                1.1522789710809709,
                1.118334393686632,
                1.0674175275951234
              ],
              "variance": 0.18669517566886418,
              "mean_reward": 1.0455960135559057,
              "min_reward": 0.7619163310460734,
              "max_reward": 1.1522789710809709,
              "num_responses": 7,
              "rvariance": 0.014297111742122457
            },
            {
              "id": "chat_sample_154",
              "rewards": [
                -1.2832444569628463,
                -0.5873806203788985,
                -0.7061866412590847,
                -0.663755919516161,
                -0.9607709717166265,
                -0.7655896516991778,
                -0.570408331681729
              ],
              "variance": 0.5091686609150838,
              "mean_reward": -0.7910480847449319,
              "min_reward": -1.2832444569628463,
              "max_reward": -0.570408331681729,
              "num_responses": 7,
              "rvariance": 0.05503976508454835
            },
            {
              "id": "chat_sample_189",
              "rewards": [
                -2.0682128092069334,
                -1.5441933956818266,
                -1.4296304469759327,
                -1.3829566530587167,
                -1.5102488182874876,
                -1.4296304469759327,
                -1.4466027356731022
              ],
              "variance": 0.34284023168282296,
              "mean_reward": -1.5444964722657044,
              "min_reward": -2.0682128092069334,
              "max_reward": -1.3829566530587167,
              "num_responses": 7,
              "rvariance": 0.04821692851754218
            },
            {
              "id": "chat_sample_218",
              "rewards": [
                -0.09518424816098423,
                -0.49403303254446645,
                -0.16307340294966205,
                -0.13761496990390787,
                -0.2649071351326788,
                -0.24793484643550934
              ],
              "variance": 0.26307047480612655,
              "mean_reward": -0.23379127252120144,
              "min_reward": -0.49403303254446645,
              "max_reward": -0.09518424816098423,
              "num_responses": 6,
              "rvariance": 0.01705946945216614
            },
            {
              "id": "chat_sample_257",
              "rewards": [
                0.33760911361683693,
                0.33760911361683693,
                0.6091657327715482,
                0.6940271762573955,
                0.5243042892857009,
                0.6940271762573955,
                0.4564151344970231
              ],
              "variance": 0.3564180626405586,
              "mean_reward": 0.5218796766146767,
              "min_reward": 0.33760911361683693,
              "max_reward": 0.6940271762573955,
              "num_responses": 7,
              "rvariance": 0.01987016352318007
            },
            {
              "id": "chat_sample_13",
              "rewards": [
                0.5243042892857009,
                0.35458140231400637,
                0.33760911361683693,
                0.17637237099372707,
                0.21880309273665072
              ],
              "variance": 0.2630704748061266,
              "mean_reward": 0.3223340537893844,
              "min_reward": 0.17637237099372707,
              "max_reward": 0.5243042892857009,
              "num_responses": 5,
              "rvariance": 0.014817733541416198
            },
            {
              "id": "chat_sample_237",
              "rewards": [
                -0.943798683019457,
                -0.8165065177906862,
                -0.5279776099388054,
                -0.4261438777557886,
                -0.5279776099388054,
                -0.5873806203788985,
                -0.4176577334072039
              ],
              "variance": 0.4446739638658398,
              "mean_reward": -0.6067775217470921,
              "min_reward": -0.943798683019457,
              "max_reward": -0.4176577334072039,
              "num_responses": 7,
              "rvariance": 0.03410848779925762
            },
            {
              "id": "chat_sample_89",
              "rewards": [
                0.6431103101658872,
                0.9146669293205985,
                0.8807223519262595,
                0.9316392180177678,
                1.084389816292293,
                1.084389816292293,
                1.118334393686632
              ],
              "variance": 0.312290112027918,
              "mean_reward": 0.9510361193859616,
              "min_reward": 0.6431103101658872,
              "max_reward": 1.118334393686632,
              "num_responses": 7,
              "rvariance": 0.02357377388400948
            },
            {
              "id": "chat_sample_23",
              "rewards": [
                0.490359711891362,
                -0.24793484643550934,
                0.2697199588281591,
                0.2442615257824049,
                0.5243042892857009,
                0.09999707185646452,
                0.19334465969089654
              ],
              "variance": 0.5431132383094226,
              "mean_reward": 0.2248646244142112,
              "min_reward": -0.24793484643550934,
              "max_reward": 0.5243042892857009,
              "num_responses": 7,
              "rvariance": 0.057523535524945844
            },
            {
              "id": "chat_sample_236",
              "rewards": [
                -0.1800456916468315,
                0.04059406141637142,
                0.16788622664514236,
                -0.23944870208692462,
                0.0660524944621256,
                -0.36674086731569555,
                0.14242779359938815
              ],
              "variance": 0.4429767349961228,
              "mean_reward": -0.05275352641806059,
              "min_reward": -0.36674086731569555,
              "max_reward": 0.16788622664514236,
              "num_responses": 7,
              "rvariance": 0.037036103608294214
            },
            {
              "id": "chat_sample_234",
              "rewards": [
                -1.1135215699911516,
                -1.0413893430281813,
                -0.8971248891022411,
                -0.8080203734421014,
                -0.9225833221479952,
                -0.8971248891022411,
                -1.1814107247798293
              ],
              "variance": 0.27919414906843754,
              "mean_reward": -0.9801678730848202,
              "min_reward": -1.1814107247798293,
              "max_reward": -0.8080203734421014,
              "num_responses": 7,
              "rvariance": 0.015538996962321206
            },
            {
              "id": "chat_sample_194",
              "rewards": [
                0.9655837954121068,
                1.3050295693554959,
                1.271084991961157,
                0.9486115067149373,
                1.3220018580526653,
                1.118334393686632,
                1.4408078789328516
              ],
              "variance": 0.4107293864715008,
              "mean_reward": 1.1959219991594066,
              "min_reward": 0.9486115067149373,
              "max_reward": 1.4408078789328516,
              "num_responses": 7,
              "rvariance": 0.030522452370518018
            },
            {
              "id": "chat_sample_70",
              "rewards": [
                1.6275030546017155,
                1.610530765904546,
                1.610530765904546,
                1.712364498087563,
                1.6953922093903935,
                1.610530765904546,
                1.7463090754819017
              ],
              "variance": 0.1154115631407524,
              "mean_reward": 1.6590230193250302,
              "min_reward": 1.610530765904546,
              "max_reward": 1.7463090754819017,
              "num_responses": 7,
              "rvariance": 0.002833555863364738
            },
            {
              "id": "chat_sample_74",
              "rewards": [
                -0.13761496990390787,
                -0.6298113421218221,
                -0.2564209907840941,
                -0.4261438777557886,
                -0.4855468881958817,
                -0.5364637542873901,
                -0.5449498986359749
              ],
              "variance": 0.3699958935982942,
              "mean_reward": -0.43099310309783706,
              "min_reward": -0.6298113421218221,
              "max_reward": -0.13761496990390787,
              "num_responses": 7,
              "rvariance": 0.026169240509892333
            },
            {
              "id": "chat_sample_200",
              "rewards": [
                -1.4381165913245175,
                -1.3765920447972781,
                -1.5123703543746339,
                -1.0286601265053044,
                -1.4402381274116636,
                -1.0413893430281813,
                -0.9989586212852578
              ],
              "variance": 0.45231149377956603,
              "mean_reward": -1.2623321726752625,
              "min_reward": -1.5123703543746339,
              "max_reward": -0.9989586212852578,
              "num_responses": 7,
              "rvariance": 0.04441558399441311
            },
            {
              "id": "chat_sample_260",
              "rewards": [
                0.5073320005885315,
                0.6431103101658872,
                0.8467777745319206,
                0.6431103101658872,
                0.8128331971375817,
                0.9825560841092762,
                0.7279717536517344
              ],
              "variance": 0.312290112027918,
              "mean_reward": 0.7376702043358313,
              "min_reward": 0.5073320005885315,
              "max_reward": 0.9825560841092762,
              "num_responses": 7,
              "rvariance": 0.021222275242213023
            },
            {
              "id": "chat_sample_315",
              "rewards": [
                0.5752211553772093,
                0.897694640623429,
                0.9825560841092762,
                0.8807223519262595,
                0.9995283728064457,
                1.118334393686632,
                1.118334393686632
              ],
              "variance": 0.35981252037999245,
              "mean_reward": 0.9389130560308405,
              "min_reward": 0.5752211553772093,
              "max_reward": 1.118334393686632,
              "num_responses": 7,
              "rvariance": 0.029617125393426386
            },
            {
              "id": "chat_sample_240",
              "rewards": [
                -0.15458725860107733,
                -0.01032280467513695,
                0.26123381447957433,
                0.1594000822965576,
                0.023621772719201965,
                0.04908020576495615,
                0.13394164925080343
              ],
              "variance": 0.26816216141527743,
              "mean_reward": 0.0660524944621256,
              "min_reward": -0.15458725860107733,
              "max_reward": 0.26123381447957433,
              "num_responses": 7,
              "rvariance": 0.015431709836789253
            },
            {
              "id": "chat_sample_20",
              "rewards": [
                1.678419920693224,
                1.644475343298885,
                1.610530765904546,
                1.6614476319960545,
                1.6275030546017155,
                1.5765861885102073,
                1.6275030546017155
              ],
              "variance": 0.07128361252811177,
              "mean_reward": 1.632352279943764,
              "min_reward": 1.5765861885102073,
              "max_reward": 1.678419920693224,
              "num_responses": 7,
              "rvariance": 0.000964114443136548
            },
            {
              "id": "chat_sample_210",
              "rewards": [
                0.40549826840551473,
                0.8637500632290901,
                0.7109994649545649,
                0.7449440423489039,
                0.7958609084404122,
                0.5582488666800398,
                0.8467777745319206
              ],
              "variance": 0.35641806264055864,
              "mean_reward": 0.7037256269414922,
              "min_reward": 0.40549826840551473,
              "max_reward": 0.8637500632290901,
              "num_responses": 7,
              "rvariance": 0.023773651268562197
            },
            {
              "id": "chat_sample_93",
              "rewards": [
                -0.7146727856076693,
                -0.6467836308189916,
                -0.7316450743048388,
                -0.9140971777994105,
                -0.9692571160652113,
                -0.5788944760303137,
                -0.6807282082133305
              ],
              "variance": 0.3165331842022103,
              "mean_reward": -0.7480112098342523,
              "min_reward": -0.9692571160652113,
              "max_reward": -0.5788944760303137,
              "num_responses": 7,
              "rvariance": 0.01732687077341209
            },
            {
              "id": "chat_sample_226",
              "rewards": [
                -0.13761496990390787,
                0.21031694838806597,
                0.40549826840551473,
                0.42247055710268416,
                0.09151092750787979,
                0.22728923708523543,
                0.3715536910111758
              ],
              "variance": 0.4124266153412178,
              "mean_reward": 0.22728923708523546,
              "min_reward": -0.13761496990390787,
              "max_reward": 0.42247055710268416,
              "num_responses": 7,
              "rvariance": 0.034649332486870806
            },
            {
              "id": "chat_sample_30",
              "rewards": [
                1.271084991961157,
                1.2541127032639876,
                1.3220018580526653,
                1.2371404145668181,
                1.3559464354470043,
                1.3559464354470043,
                1.2880572806583264
              ],
              "variance": 0.10862264766188456,
              "mean_reward": 1.2977557313424233,
              "min_reward": 1.2371404145668181,
              "max_reward": 1.3559464354470043,
              "num_responses": 7,
              "rvariance": 0.001963501365900042
            },
            {
              "id": "chat_sample_142",
              "rewards": [
                0.35458140231400637,
                0.5073320005885315,
                0.5243042892857009,
                0.677054887560226,
                0.5243042892857009,
                0.6600825988630565,
                0.23577538143382018
              ],
              "variance": 0.35981252037999245,
              "mean_reward": 0.4976335499044347,
              "min_reward": 0.23577538143382018,
              "max_reward": 0.677054887560226,
              "num_responses": 7,
              "rvariance": 0.021304577694675902
            },
            {
              "id": "chat_sample_136",
              "rewards": [
                -0.7061866412590847,
                -0.5449498986359749,
                -0.39219930036144973,
                -0.2988517125270177,
                -0.5364637542873901,
                -0.5788944760303137,
                -0.5534360429845595
              ],
              "variance": 0.2749510768941452,
              "mean_reward": -0.5158545465836843,
              "min_reward": -0.7061866412590847,
              "max_reward": -0.2988517125270177,
              "num_responses": 7,
              "rvariance": 0.01503783381428835
            },
            {
              "id": "chat_sample_16",
              "rewards": [
                1.5935584772073768,
                1.7632813641790712,
                1.6614476319960545,
                1.5256693224186988,
                1.678419920693224,
                1.678419920693224,
                1.610530765904546
              ],
              "variance": 0.14596168279565735,
              "mean_reward": 1.644475343298885,
              "min_reward": 1.5256693224186988,
              "max_reward": 1.7632813641790712,
              "num_responses": 7,
              "rvariance": 0.0049381471477725645
            },
            {
              "id": "chat_sample_22",
              "rewards": [
                1.3050295693554959,
                1.2031958371724791,
                1.4068633015385126,
                1.2541127032639876,
                1.5086970337215293,
                1.3729187241441738,
                1.271084991961157
              ],
              "variance": 0.2138508375843351,
              "mean_reward": 1.3317003087367623,
              "min_reward": 1.2031958371724791,
              "max_reward": 1.5086970337215293,
              "num_responses": 7,
              "rvariance": 0.009370722087558878
            },
            {
              "id": "chat_sample_217",
              "rewards": [
                -0.570408331681729,
                -0.8928818169279487,
                -0.8716664560564868,
                -0.9692571160652113,
                -0.5194914655902206,
                -0.7571035073505931,
                -0.5958667647274832
              ],
              "variance": 0.37339035133772813,
              "mean_reward": -0.7395250654856674,
              "min_reward": -0.9692571160652113,
              "max_reward": -0.5194914655902206,
              "num_responses": 7,
              "rvariance": 0.027388345586998677
            }
          ]
        },
        "semantic_benchmark_chat_hard_filtered.json": {
          "file_name": "semantic_benchmark_chat_hard_filtered.json",
          "processed_samples": 200,
          "global_mean": 0.007814628239205703,
          "global_std": 1.6897494157987996,
          "mean_variance": 0.5953950757661374,
          "mean_rvariance": 0.10832700954050342,
          "sample_results": [
            {
              "id": "chat_hard_sample_121",
              "rewards": [
                0.37449953575610156,
                -1.0541516461463902,
                0.37449953575610156,
                -1.0541516461463902,
                0.37449953575610156,
                -1.0541516461463902
              ],
              "variance": 1.4286511819024919,
              "mean_reward": -0.33982605519514425,
              "min_reward": -1.0541516461463902,
              "max_reward": 0.37449953575610156,
              "num_responses": 6,
              "rvariance": 0.5102610498878467
            },
            {
              "id": "chat_hard_sample_77",
              "rewards": [
                1.678317119239929,
                0.22770447094896853,
                1.752292584969508,
                1.28994592415964,
                0.3305766029791641,
                1.752292584969508,
                1.9279843160772576
              ],
              "variance": 1.533141527245522,
              "mean_reward": 1.2798733719062823,
              "min_reward": 0.22770447094896853,
              "max_reward": 1.9279843160772576,
              "num_responses": 7,
              "rvariance": 0.43335574991887293
            },
            {
              "id": "chat_hard_sample_265",
              "rewards": [
                1.0356552607142127,
                1.0356552607142127,
                -1.3361831092404097,
                -0.25544778959734343,
                1.0356552607142127,
                0.021671240225571153,
                0.13407927213497028
              ],
              "variance": 1.7233971781687825,
              "mean_reward": 0.23872648509506092,
              "min_reward": -1.3361831092404097,
              "max_reward": 1.0356552607142127,
              "num_responses": 7,
              "rvariance": 0.6696998404046958
            },
            {
              "id": "chat_hard_sample_334",
              "rewards": [
                2.7509613723188227,
                1.4933784549159819,
                1.3546744566730216,
                1.2806989909434425,
                1.6320824531589422,
                1.419402989186403
              ],
              "variance": 0.8738351889306504,
              "mean_reward": 1.6551997861994356,
              "min_reward": 1.2806989909434425,
              "max_reward": 2.7509613723188227,
              "num_responses": 6,
              "rvariance": 0.25226340946267756
            },
            {
              "id": "chat_hard_sample_61",
              "rewards": [
                1.7707864514019025,
                1.0633960603628048,
                1.60434165351035,
                1.7707864514019025,
                0.9108216622955483,
                0.7582472642282919,
                1.262205124511048
              ],
              "variance": 0.9209945483332568,
              "mean_reward": 1.305797809673121,
              "min_reward": 0.7582472642282919,
              "max_reward": 1.7707864514019025,
              "num_responses": 7,
              "rvariance": 0.14829056966416615
            },
            {
              "id": "chat_hard_sample_133",
              "rewards": [
                2.1776515129145864,
                0.7305064645796998,
                0.9108216622955483,
                0.3190179364589174,
                0.6010493995529368,
                0.4484750014856804
              ],
              "variance": 1.1604901186327685,
              "mean_reward": 0.8645869962145615,
              "min_reward": 0.3190179364589174,
              "max_reward": 2.1776515129145864,
              "num_responses": 6,
              "rvariance": 0.38075008571697805
            },
            {
              "id": "chat_hard_sample_62",
              "rewards": [
                0.8738339294307589,
                -0.34676125510729233,
                1.160488859132877,
                1.3269336570244294
              ],
              "variance": 1.2575829174028406,
              "mean_reward": 0.7536237976201933,
              "min_reward": -0.34676125510729233,
              "max_reward": 1.3269336570244294,
              "num_responses": 4,
              "rvariance": 0.4298802783064525
            },
            {
              "id": "chat_hard_sample_84",
              "rewards": [
                1.0125379276737192,
                -0.883083381646739,
                0.7212595313635025,
                -1.0171639132816008,
                -1.0171639132816008,
                -0.883083381646739
              ],
              "variance": 1.8840626428002116,
              "mean_reward": -0.344449521803243,
              "min_reward": -1.0171639132816008,
              "max_reward": 1.0125379276737192,
              "num_responses": 6,
              "rvariance": 0.7437488164972588
            },
            {
              "id": "chat_hard_sample_343",
              "rewards": [
                0.15488487187141434,
                -0.5293881861271902,
                -0.3074617889384536,
                0.6195432659853315
              ],
              "variance": 0.9429560147217256,
              "mean_reward": -0.015605459302224511,
              "min_reward": -0.5293881861271902,
              "max_reward": 0.6195432659853315,
              "num_responses": 4,
              "rvariance": 0.19540841594763325
            },
            {
              "id": "chat_hard_sample_87",
              "rewards": [
                0.6287901992015289,
                0.017047773617472475,
                -0.32826738867489763,
                -0.8969537814710351,
                -0.05230422550400771
              ],
              "variance": 1.0535724533204864,
              "mean_reward": -0.12633748456618782,
              "min_reward": -0.8969537814710351,
              "max_reward": 0.6287901992015289,
              "num_responses": 5,
              "rvariance": 0.2461766475465704
            },
            {
              "id": "chat_hard_sample_110",
              "rewards": [
                0.684271798498713,
                -1.5211217735643567,
                -1.6320849721587252,
                -2.5752721602108553,
                -1.6320849721587252,
                -1.345430042456607,
                -1.6320849721587252
              ],
              "variance": 1.4758105413050986,
              "mean_reward": -1.3791152991727547,
              "min_reward": -2.5752721602108553,
              "max_reward": 0.684271798498713,
              "num_responses": 7,
              "rvariance": 0.8430912932409512
            },
            {
              "id": "chat_hard_sample_150",
              "rewards": [
                0.8368461965659695,
                0.18840500478012975,
                0.8507165963902654,
                0.8322227299578707,
                0.32595313637106543,
                0.8460931297821668,
                0.7120125981473051
              ],
              "variance": 0.577008632690715,
              "mean_reward": 0.6560356274278247,
              "min_reward": 0.18840500478012975,
              "max_reward": 0.8507165963902654,
              "num_responses": 7,
              "rvariance": 0.06693188032547918
            },
            {
              "id": "chat_hard_sample_65",
              "rewards": [
                -1.0264108464977981,
                -1.0680220459706862,
                -0.4207367208368712,
                -1.4656401742671727,
                -0.3721903214518351,
                -1.6228380389425276,
                -0.3721903214518351
              ],
              "variance": 1.1563289986854794,
              "mean_reward": -0.906861209916961,
              "min_reward": -1.6228380389425276,
              "max_reward": -0.3721903214518351,
              "num_responses": 7,
              "rvariance": 0.23902637403049987
            },
            {
              "id": "chat_hard_sample_46",
              "rewards": [
                0.772117664052588,
                1.5303661877807713,
                1.964972048942047,
                1.8262680506990867,
                1.807774184266692,
                1.7245517853209158,
                2.038947514671626
              ],
              "variance": 0.7674954569443808,
              "mean_reward": 1.6664282051048183,
              "min_reward": 0.772117664052588,
              "max_reward": 2.038947514671626,
              "num_responses": 7,
              "rvariance": 0.1564441559615181
            },
            {
              "id": "chat_hard_sample_114",
              "rewards": [
                1.576600853861758,
                0.3721878024520522,
                0.5571264667759994,
                0.5571264667759994
              ],
              "variance": 0.8430891359867942,
              "mean_reward": 0.7657603974664522,
              "min_reward": 0.3721878024520522,
              "max_reward": 1.576600853861758,
              "num_responses": 4,
              "rvariance": 0.2248544668361035
            },
            {
              "id": "chat_hard_sample_371",
              "rewards": [
                0.39761686879659497,
                -0.17453712395561655,
                0.056347239786311246,
                0.5756203332083941
              ],
              "variance": 0.6274911087178926,
              "mean_reward": 0.21376182945892094,
              "min_reward": -0.17453712395561655,
              "max_reward": 0.5756203332083941,
              "num_responses": 4,
              "rvariance": 0.08507492062257158
            },
            {
              "id": "chat_hard_sample_223",
              "rewards": [
                0.772117664052588,
                1.8447619171314815,
                1.1974765919976664,
                0.425357668445187,
                1.8909965832124682
              ],
              "variance": 1.3084410500919263,
              "mean_reward": 1.2261420849678781,
              "min_reward": 0.425357668445187,
              "max_reward": 1.8909965832124682,
              "num_responses": 5,
              "rvariance": 0.33458751352049343
            },
            {
              "id": "chat_hard_sample_52",
              "rewards": [
                -0.7628732498361734,
                -0.9801761804168113,
                0.13003373885288394,
                0.4577219347018778,
                -0.37681378805993376,
                -0.14853012428506146,
                -0.5201412529109928
              ],
              "variance": 1.1109034392609103,
              "mean_reward": -0.31439698885060163,
              "min_reward": -0.9801761804168113,
              "max_reward": 0.4577219347018778,
              "num_responses": 7,
              "rvariance": 0.21597393831473388
            },
            {
              "id": "chat_hard_sample_372",
              "rewards": [
                0.023260556872105074,
                -0.4854652533502527,
                -1.6783196382397119,
                -0.7027681839308906
              ],
              "variance": 1.2562970157524633,
              "mean_reward": -0.7108231296621874,
              "min_reward": -1.6783196382397119,
              "max_reward": 0.023260556872105074,
              "num_responses": 4,
              "rvariance": 0.38144485187800914
            },
            {
              "id": "chat_hard_sample_346",
              "rewards": [
                1.4009091227540083,
                1.5581069874293634,
                0.8692104628226602,
                1.0217848608899165,
                1.4286499224026004
              ],
              "variance": 0.5760839393690955,
              "mean_reward": 1.2557322712597099,
              "min_reward": 0.8692104628226602,
              "max_reward": 1.5581069874293634,
              "num_responses": 5,
              "rvariance": 0.06930756009628605
            },
            {
              "id": "chat_hard_sample_108",
              "rewards": [
                0.23926313746921524,
                -0.3213321887627496,
                0.5178270006071606,
                0.5178270006071606,
                0.3398235361953615
              ],
              "variance": 0.6149210588771242,
              "mean_reward": 0.25868169722322965,
              "min_reward": -0.3213321887627496,
              "max_reward": 0.5178270006071606,
              "num_responses": 5,
              "rvariance": 0.09553795259263106
            },
            {
              "id": "chat_hard_sample_64",
              "rewards": [
                1.6598232528075343,
                1.1188776596599888,
                0.4831510010464205,
                0.9709267282008311,
                1.2067235252138637,
                1.174359258957173
              ],
              "variance": 0.7062345243870731,
              "mean_reward": 1.1023102376476352,
              "min_reward": 0.4831510010464205,
              "max_reward": 1.6598232528075343,
              "num_responses": 6,
              "rvariance": 0.12130137074333748
            },
            {
              "id": "chat_hard_sample_233",
              "rewards": [
                -0.3190204554587003,
                -0.7397559167956801,
                -0.10749685813818569,
                -0.02543032584443414,
                0.813728863525476,
                -0.09536025829192665,
                -0.25082432298924473
              ],
              "variance": 0.7975479898970224,
              "mean_reward": -0.10345132485609936,
              "min_reward": -0.7397559167956801,
              "max_reward": 0.813728863525476,
              "num_responses": 7,
              "rvariance": 0.18863728433071889
            },
            {
              "id": "chat_hard_sample_47",
              "rewards": [
                -1.6875665714559092,
                -1.7522951039692907,
                -0.8044844493090616,
                -1.4378993746185806
              ],
              "variance": 0.7383676173133591,
              "mean_reward": -1.4205613748382104,
              "min_reward": -1.7522951039692907,
              "max_reward": -0.8044844493090616,
              "num_responses": 4,
              "rvariance": 0.14029760661747537
            },
            {
              "id": "chat_hard_sample_26",
              "rewards": [
                0.1571966051754637,
                0.1046046725083412,
                0.3167062031548681,
                0.642660599025825,
                0.547879533559802,
                1.0633960603628048,
                1.086513393403298
              ],
              "variance": 0.9364831614703873,
              "mean_reward": 0.559851009598629,
              "min_reward": 0.1046046725083412,
              "max_reward": 1.086513393403298,
              "num_responses": 7,
              "rvariance": 0.13806154610566196
            },
            {
              "id": "chat_hard_sample_379",
              "rewards": [
                0.7490003310120945,
                1.2806989909434425,
                1.3546744566730216,
                1.6968109856723237,
                1.2714520577272452,
                0.6195432659853315,
                1.1235011262680876
              ],
              "variance": 0.7943115632713531,
              "mean_reward": 1.1565258877545066,
              "min_reward": 0.6195432659853315,
              "max_reward": 1.6968109856723237,
              "num_responses": 7,
              "rvariance": 0.11647369669260547
            },
            {
              "id": "chat_hard_sample_247",
              "rewards": [
                -0.08495745842370463,
                0.39299340218849627,
                -0.29705898907023154,
                0.4831510010464205
              ],
              "variance": 0.6895322512653167,
              "mean_reward": 0.12353198893524515,
              "min_reward": -0.29705898907023154,
              "max_reward": 0.4831510010464205,
              "num_responses": 4,
              "rvariance": 0.1055749768859752
            },
            {
              "id": "chat_hard_sample_215",
              "rewards": [
                0.18493740482405574,
                0.2982123367224733,
                -0.06328495869824208,
                -0.3051500556344042,
                -0.26585058946556545,
                0.04392167327704605,
                0.7073891315392065
              ],
              "variance": 0.7434534305822678,
              "mean_reward": 0.08573927750922426,
              "min_reward": -0.3051500556344042,
              "max_reward": 0.7073891315392065,
              "num_responses": 7,
              "rvariance": 0.10597149295649474
            },
            {
              "id": "chat_hard_sample_49",
              "rewards": [
                -1.47488710748337,
                -2.390333495886908,
                -2.0851846997523955,
                -1.345430042456607,
                -1.8447644361312643,
                -1.317689242808015,
                -1.9464807015094352
              ],
              "variance": 0.8729104956090303,
              "mean_reward": -1.7721099608611421,
              "min_reward": -2.390333495886908,
              "max_reward": -1.317689242808015,
              "num_responses": 7,
              "rvariance": 0.1418279036711767
            },
            {
              "id": "chat_hard_sample_415",
              "rewards": [
                -0.48084178674215405,
                0.7536237976201933,
                1.0587725937547061,
                0.4369163349654337,
                0.017914673606490975,
                0.5964259329448381,
                1.2344643248624558
              ],
              "variance": 1.310637196730773,
              "mean_reward": 0.516753695858852,
              "min_reward": -0.48084178674215405,
              "max_reward": 1.2344643248624558,
              "num_responses": 7,
              "rvariance": 0.30310846633625005
            },
            {
              "id": "chat_hard_sample_297",
              "rewards": [
                -0.9986700468492061,
                -0.9986700468492061,
                -0.23926565646899803,
                -1.3084423095918176,
                -1.1235036452678704,
                -0.589493252032473,
                -0.48084178674215405
              ],
              "variance": 0.8132677763645576,
              "mean_reward": -0.8198409634002466,
              "min_reward": -1.3084423095918176,
              "max_reward": -0.23926565646899803,
              "num_responses": 7,
              "rvariance": 0.1285643112798846
            },
            {
              "id": "chat_hard_sample_80",
              "rewards": [
                0.36987606914800286,
                0.36987606914800286,
                0.527073933823358,
                0.527073933823358,
                -0.22886285660077602
              ],
              "variance": 0.5164412201246225,
              "mean_reward": 0.31300742986838914,
              "min_reward": -0.22886285660077602,
              "max_reward": 0.527073933823358,
              "num_responses": 5,
              "rvariance": 0.07834808557124202
            },
            {
              "id": "chat_hard_sample_413",
              "rewards": [
                0.06357140636146542,
                -0.337514321891095,
                -0.883083381646739,
                -0.6195457849851144,
                -0.6149223183770157,
                -0.12483485791855574
              ],
              "variance": 0.7206828575373816,
              "mean_reward": -0.41938820974284235,
              "min_reward": -0.883083381646739,
              "max_reward": 0.06357140636146542,
              "num_responses": 6,
              "rvariance": 0.10333747606395227
            },
            {
              "id": "chat_hard_sample_306",
              "rewards": [
                0.8183523301335748,
                0.3583174026277562,
                0.45078673478972975,
                1.003290994457522,
                0.43460460166138437,
                0.8460931297821668,
                0.7674941974444892
              ],
              "variance": 0.5048825536043757,
              "mean_reward": 0.6684199129852318,
              "min_reward": 0.3583174026277562,
              "max_reward": 1.003290994457522,
              "num_responses": 7,
              "rvariance": 0.053457031959628795
            },
            {
              "id": "chat_hard_sample_43",
              "rewards": [
                -1.2622076435108307,
                -1.2807015099432255,
                -1.5396156399967516,
                -2.0851846997523955,
                -0.5525055191676835,
                -1.4009116417537912,
                -1.6968135046721067
              ],
              "variance": 0.8738351889306506,
              "mean_reward": -1.4025628798281125,
              "min_reward": -2.0851846997523955,
              "max_reward": -0.5525055191676835,
              "num_responses": 7,
              "rvariance": 0.18978420959424538
            },
            {
              "id": "chat_hard_sample_102",
              "rewards": [
                1.3269336570244294,
                0.4646571346140258,
                0.8553400629983642,
                0.5085800673909633,
                1.0587725937547061,
                0.8229757967416734
              ],
              "variance": 0.7062345243870732,
              "mean_reward": 0.8395432187540269,
              "min_reward": 0.4646571346140258,
              "max_reward": 1.3269336570244294,
              "num_responses": 6,
              "rvariance": 0.08936852693046882
            },
            {
              "id": "chat_hard_sample_187",
              "rewards": [
                -0.21961592338457867,
                -2.0851846997523955,
                -0.020806859236335462,
                -0.07831122517456278,
                -0.013871659324187442,
                -0.020806859236335462
              ],
              "variance": 1.1350610522882256,
              "mean_reward": -0.40643287101806586,
              "min_reward": -2.0851846997523955,
              "max_reward": -0.013871659324187442,
              "num_responses": 6,
              "rvariance": 0.5687152059541553
            },
            {
              "id": "chat_hard_sample_360",
              "rewards": [
                0.2103664711685985,
                -0.9801761804168113,
                -0.9801761804168113,
                -1.1373740450921666,
                -0.9385649809439233,
                -0.9385649809439233
              ],
              "variance": 0.6946758578668265,
              "mean_reward": -0.7940816494408396,
              "min_reward": -1.1373740450921666,
              "max_reward": 0.2103664711685985,
              "num_responses": 6,
              "rvariance": 0.2062964851651089
            },
            {
              "id": "chat_hard_sample_236",
              "rewards": [
                1.0772664601871007,
                0.41611073522898967,
                0.5594382000800487,
                0.929315528727943,
                0.6241667325934303,
                0.4947096675666672,
                0.6241667325934303
              ],
              "variance": 0.52522580668001,
              "mean_reward": 0.6750248652825157,
              "min_reward": 0.41611073522898967,
              "max_reward": 1.0772664601871007,
              "num_responses": 7,
              "rvariance": 0.04922078799277828
            },
            {
              "id": "chat_hard_sample_259",
              "rewards": [
                2.112922980401205,
                2.0481944478878233,
                1.8262680506990867,
                2.149910713265994,
                1.7985272510504946,
                1.6690701860237316,
                2.066688314320218
              ],
              "variance": 0.3809736485073312,
              "mean_reward": 1.953083134806936,
              "min_reward": 1.6690701860237316,
              "max_reward": 2.149910713265994,
              "num_responses": 7,
              "rvariance": 0.029553587486774082
            },
            {
              "id": "chat_hard_sample_127",
              "rewards": [
                0.9616797949846337,
                1.2806989909434425,
                0.670401398674417,
                1.262205124511048,
                1.0125379276737192
              ],
              "variance": 0.4863886871719809,
              "mean_reward": 1.037504647357452,
              "min_reward": 0.670401398674417,
              "max_reward": 1.2806989909434425,
              "num_responses": 5,
              "rvariance": 0.05015426674160771
            },
            {
              "id": "chat_hard_sample_280",
              "rewards": [
                -0.1126982580722967,
                -0.7721201830523708,
                0.028317473474713004,
                -0.04190142563578568,
                -0.43923058726926595,
                0.17800220491190774,
                -0.446165787181414
              ],
              "variance": 0.6647389115793877,
              "mean_reward": -0.22939950897493036,
              "min_reward": -0.7721201830523708,
              "max_reward": 0.17800220491190774,
              "num_responses": 7,
              "rvariance": 0.09524733479938584
            },
            {
              "id": "chat_hard_sample_421",
              "rewards": [
                0.4877744676545192,
                0.5964259329448381,
                0.8507165963902654,
                0.9339389953360417,
                0.943185928552239,
                1.003290994457522,
                1.0264083274980154
              ],
              "variance": 0.4595725808450086,
              "mean_reward": 0.83453446326192,
              "min_reward": 0.4877744676545192,
              "max_reward": 1.0264083274980154,
              "num_responses": 7,
              "rvariance": 0.03774011095723728
            },
            {
              "id": "chat_hard_sample_270",
              "rewards": [
                0.656530998850121,
                1.0911368600113969,
                -0.09189265833585265,
                0.929315528727943,
                0.0011184863192574923,
                0.9200685955117457
              ],
              "variance": 1.0556132803779676,
              "mean_reward": 0.5843796351807686,
              "min_reward": -0.09189265833585265,
              "max_reward": 1.0911368600113969,
              "num_responses": 6,
              "rvariance": 0.21520238928202465
            },
            {
              "id": "chat_hard_sample_276",
              "rewards": [
                1.2714520577272452,
                0.49239793426261785,
                1.4009091227540083,
                0.30283580333057203,
                0.3814347356682496,
                0.8830808626469562
              ],
              "variance": 0.9940453207412159,
              "mean_reward": 0.7886850860649415,
              "min_reward": 0.30283580333057203,
              "max_reward": 1.4009091227540083,
              "num_responses": 6,
              "rvariance": 0.18441353873653862
            },
            {
              "id": "chat_hard_sample_349",
              "rewards": [
                -0.7906140494847655,
                -0.7906140494847655,
                -1.6690727050235146,
                -1.6690727050235146,
                -1.3361831092404097,
                -1.6690727050235146,
                -0.5779345855122263
              ],
              "variance": 0.9635304411277648,
              "mean_reward": -1.2146519869703873,
              "min_reward": -1.6690727050235146,
              "max_reward": -0.5779345855122263,
              "num_responses": 7,
              "rvariance": 0.1998985392631034
            },
            {
              "id": "chat_hard_sample_267",
              "rewards": [
                -0.07571052520750728,
                -0.5640641856879303,
                0.10749433913840288,
                -0.23579805651292404,
                -0.17453712395561655,
                -0.2716299227256888,
                -0.19303099038801125
              ],
              "variance": 0.3861750484414422,
              "mean_reward": -0.2010394950484679,
              "min_reward": -0.5640641856879303,
              "max_reward": 0.10749433913840288,
              "num_responses": 7,
              "rvariance": 0.03566358306121376
            },
            {
              "id": "chat_hard_sample_14",
              "rewards": [
                0.49008620095856853,
                -0.08495745842370463,
                0.06761693964355177,
                0.14159240537313064,
                -0.0007597969902825959,
                -0.14564045765499978
              ],
              "variance": 0.43113826120520177,
              "mean_reward": 0.07798963881771065,
              "min_reward": -0.14564045765499978,
              "max_reward": 0.49008620095856853,
              "num_responses": 6,
              "rvariance": 0.04279002191964151
            },
            {
              "id": "chat_hard_sample_13",
              "rewards": [
                0.9108216622955483,
                1.7153048521047185,
                1.7615395181857052,
                1.1188776596599888,
                1.5673539206455607,
                -1.5950972392939358,
                1.807774184266692
              ],
              "variance": 1.871579282958345,
              "mean_reward": 1.0409392225520395,
              "min_reward": -1.5950972392939358,
              "max_reward": 1.807774184266692,
              "num_responses": 7,
              "rvariance": 1.2586964698447847
            },
            {
              "id": "chat_hard_sample_147",
              "rewards": [
                0.40455206870874294,
                -0.41148978762067384,
                0.25428940394553595,
                0.0699286729476011,
                0.13523513878699495
              ],
              "variance": 0.563369406196824,
              "mean_reward": 0.09050309935364022,
              "min_reward": -0.41148978762067384,
              "max_reward": 0.40455206870874294,
              "num_responses": 5,
              "rvariance": 0.07597476593429656
            },
            {
              "id": "chat_hard_sample_173",
              "rewards": [
                1.807774184266692,
                0.9478093951603377,
                0.9200685955117457,
                0.9478093951603377,
                0.9200685955117457,
                0.9478093951603377
              ],
              "variance": 0.4577231942017691,
              "mean_reward": 1.0818899267951994,
              "min_reward": 0.9200685955117457,
              "max_reward": 1.807774184266692,
              "num_responses": 6,
              "rvariance": 0.10553550144201664
            },
            {
              "id": "chat_hard_sample_345",
              "rewards": [
                -1.1697383113488573,
                -1.215972977429844,
                -1.8725052357798564,
                -1.3916647085375937,
                -1.6320849721587252,
                -1.4194055081861858
              ],
              "variance": 0.5594394595799401,
              "mean_reward": -1.4502286189068438,
              "min_reward": -1.8725052357798564,
              "max_reward": -1.1697383113488573,
              "num_responses": 6,
              "rvariance": 0.058219931387633365
            },
            {
              "id": "chat_hard_sample_412",
              "rewards": [
                -0.323643922066799,
                -0.970929247200614,
                -0.466971386917858,
                -0.41148978762067384,
                -0.970929247200614,
                -0.466971386917858,
                -0.6796508508903972
              ],
              "variance": 0.5945778058014901,
              "mean_reward": -0.6129408326878306,
              "min_reward": -0.970929247200614,
              "max_reward": -0.323643922066799,
              "num_responses": 7,
              "rvariance": 0.06109300294709262
            },
            {
              "id": "chat_hard_sample_21",
              "rewards": [
                0.6750248652825157,
                0.8322227299578707,
                1.5581069874293634,
                1.6690701860237316,
                1.1512419259166795,
                1.678317119239929
              ],
              "variance": 0.9200698550116373,
              "mean_reward": 1.2606639689750148,
              "min_reward": 0.6750248652825157,
              "max_reward": 1.678317119239929,
              "num_responses": 6,
              "rvariance": 0.16136839664147404
            },
            {
              "id": "chat_hard_sample_357",
              "rewards": [
                -1.5396156399967516,
                -1.174361777956956,
                -0.9339415143358246,
                -1.0772689791868837,
                -1.1096332454435744,
                -1.0541516461463902,
                -1.3639239088890016
              ],
              "variance": 0.4281330079099377,
              "mean_reward": -1.1789852445650546,
              "min_reward": -1.5396156399967516,
              "max_reward": -0.9339415143358246,
              "num_responses": 7,
              "rvariance": 0.03643767479400859
            },
            {
              "id": "chat_hard_sample_184",
              "rewards": [
                -0.5155177863028941,
                -0.09767199159597599,
                0.3398235361953615,
                -0.15951085747929583,
                0.41148726862089097,
                0.45078673478972975
              ],
              "variance": 0.7686513235964053,
              "mean_reward": 0.07156615070463605,
              "min_reward": -0.5155177863028941,
              "max_reward": 0.45078673478972975,
              "num_responses": 6,
              "rvariance": 0.12633705404707607
            },
            {
              "id": "chat_hard_sample_348",
              "rewards": [
                0.3305766029791641,
                0.9663032615927325,
                1.4841315216997846,
                0.9663032615927325,
                0.9663032615927325,
                0.9154451289036469
              ],
              "variance": 0.602206525704853,
              "mean_reward": 0.9381771730601322,
              "min_reward": 0.3305766029791641,
              "max_reward": 1.4841315216997846,
              "num_responses": 6,
              "rvariance": 0.11168909666020466
            },
            {
              "id": "chat_hard_sample_283",
              "rewards": [
                -1.8447644361312643,
                -1.6413319053749225,
                -1.8447644361312643,
                -1.0495281795382916,
                -1.6228380389425276,
                -1.6875665714559092
              ],
              "variance": 0.5085813268908546,
              "mean_reward": -1.615132261262363,
              "min_reward": -1.8447644361312643,
              "max_reward": -1.0495281795382916,
              "num_responses": 6,
              "rvariance": 0.07189372973124485
            },
            {
              "id": "chat_hard_sample_0",
              "rewards": [
                -0.9431884475520219,
                -0.6241692515932131,
                0.01343569032989538,
                -0.07542155854450111,
                -0.05085939218897687,
                -0.5478820525595849,
                0.43229286835733505
              ],
              "variance": 0.9327554915176081,
              "mean_reward": -0.25654173482158105,
              "min_reward": -0.9431884475520219,
              "max_reward": 0.43229286835733505,
              "num_responses": 7,
              "rvariance": 0.1877147921263472
            },
            {
              "id": "chat_hard_sample_258",
              "rewards": [
                0.2635363371617333,
                0.156040738523439,
                0.5525030001679007,
                0.5964259329448381,
                0.36756433584395354,
                0.7166360647554038,
                0.8322227299578707
              ],
              "variance": 0.5423326331299749,
              "mean_reward": 0.497847019907877,
              "min_reward": 0.156040738523439,
              "max_reward": 0.8322227299578707,
              "num_responses": 7,
              "rvariance": 0.05158392110002644
            },
            {
              "id": "chat_hard_sample_161",
              "rewards": [
                0.2288603376009932,
                -0.344449521803243,
                0.07281833957766279,
                -0.39993112110042717,
                -0.025574809175937224
              ],
              "variance": 0.5441820197732146,
              "mean_reward": -0.09365535498019029,
              "min_reward": -0.39993112110042717,
              "max_reward": 0.2288603376009932,
              "num_responses": 5,
              "rvariance": 0.0586134765365748
            },
            {
              "id": "chat_hard_sample_4",
              "rewards": [
                -0.1872516571278879,
                0.4762158011342725,
                0.24504247072933857,
                0.3536939360196575,
                0.5871789997286407,
                0.38605820227634824,
                0.2843419368981773
              ],
              "variance": 0.4484762609855718,
              "mean_reward": 0.3064685270940782,
              "min_reward": -0.1872516571278879,
              "max_reward": 0.5871789997286407,
              "num_responses": 7,
              "rvariance": 0.052028518405285336
            },
            {
              "id": "chat_hard_sample_238",
              "rewards": [
                0.019070540258515643,
                -0.13177005783070375,
                0.22192513768884517,
                -0.17338125730359186,
                -0.0861133250757293,
                -0.31670872215465096
              ],
              "variance": 0.36554282870280186,
              "mean_reward": -0.07782961406955251,
              "min_reward": -0.31670872215465096,
              "max_reward": 0.22192513768884517,
              "num_responses": 6,
              "rvariance": 0.028069014542663848
            },
            {
              "id": "chat_hard_sample_8",
              "rewards": [
                -1.47488710748337,
                -0.6750273842822986,
                -0.4877769866543021,
                -0.7952375160928642,
                -0.38837245458018044,
                -0.3837489879720818,
                -0.6149223183770157
              ],
              "variance": 0.6805742847121254,
              "mean_reward": -0.6885675364917303,
              "min_reward": -1.47488710748337,
              "max_reward": -0.3837489879720818,
              "num_responses": 7,
              "rvariance": 0.1226617408250179
            },
            {
              "id": "chat_hard_sample_32",
              "rewards": [
                1.11425419305189,
                1.345427523456824,
                1.4656376552673898,
                1.7153048521047185,
                1.60434165351035,
                2.122169913617402,
                1.419402989186403
              ],
              "variance": 0.6250926854149417,
              "mean_reward": 1.5409341114564252,
              "min_reward": 1.11425419305189,
              "max_reward": 2.122169913617402,
              "num_responses": 7,
              "rvariance": 0.08756838257329343
            },
            {
              "id": "chat_hard_sample_109",
              "rewards": [
                0.11211780574650156,
                -0.41148978762067384,
                0.02586125683916058,
                0.025283323513148246,
                0.02586125683916058,
                0.02586125683916058,
                -0.0612621920571989
              ],
              "variance": 0.26171710668468584,
              "mean_reward": -0.03682386855724874,
              "min_reward": -0.41148978762067384,
              "max_reward": 0.11211780574650156,
              "num_responses": 7,
              "rvariance": 0.02554299757889908
            },
            {
              "id": "chat_hard_sample_188",
              "rewards": [
                -0.2750975226817628,
                -0.39993112110042717,
                -0.8553425819981471,
                -0.3837489879720818,
                -0.20921312351635662,
                -0.2589153895534174,
                -0.08958092503180332
              ],
              "variance": 0.4207354613369798,
              "mean_reward": -0.3531185216934281,
              "min_reward": -0.8553425819981471,
              "max_reward": -0.08958092503180332,
              "num_responses": 7,
              "rvariance": 0.05149728379244275
            },
            {
              "id": "chat_hard_sample_53",
              "rewards": [
                -1.9279868350770406,
                -2.0112092340228167,
                -1.5581095064291461,
                -1.7707889704016855,
                -1.78928283683408,
                -1.6320849721587252,
                -1.604344172510133
              ],
              "variance": 0.3754254885776127,
              "mean_reward": -1.756258075347661,
              "min_reward": -2.0112092340228167,
              "max_reward": -1.5581095064291461,
              "num_responses": 7,
              "rvariance": 0.024793184400808112
            },
            {
              "id": "chat_hard_sample_356",
              "rewards": [
                -2.149913232265777,
                -1.8540113693474616,
                -1.733801237536896,
                -2.0851846997523955,
                -1.96497456794183,
                -2.1406662990495797,
                -2.122172432617185
              ],
              "variance": 0.3384377557128233,
              "mean_reward": -2.0072462626444465,
              "min_reward": -2.149913232265777,
              "max_reward": -1.733801237536896,
              "num_responses": 7,
              "rvariance": 0.022496743615935958
            },
            {
              "id": "chat_hard_sample_63",
              "rewards": [
                0.7351299311877985,
                1.1003837932275942,
                1.2437112580786531,
                1.6598232528075343,
                1.345427523456824,
                1.447143788834995,
                1.3176867238082322
              ],
              "variance": 0.5779333260123347,
              "mean_reward": 1.2641866102002333,
              "min_reward": 0.7351299311877985,
              "max_reward": 1.6598232528075343,
              "num_responses": 7,
              "rvariance": 0.07237365754724916
            },
            {
              "id": "chat_hard_sample_159",
              "rewards": [
                -1.604344172510133,
                -2.1314193658333824,
                -2.038950033671409,
                -1.2899484431594228
              ],
              "variance": 0.7194114042201547,
              "mean_reward": -1.7661655037935868,
              "min_reward": -2.1314193658333824,
              "max_reward": -1.2899484431594228,
              "num_responses": 4,
              "rvariance": 0.11519765389326071
            },
            {
              "id": "chat_hard_sample_152",
              "rewards": [
                -0.015822184299479073,
                -0.2566036562493681,
                -0.061840125383211236,
                -0.4276719207490192,
                -0.005780592760014755,
                0.0015158154808909727
              ],
              "variance": 0.34000539985963174,
              "mean_reward": -0.12770044399336689,
              "min_reward": -0.4276719207490192,
              "max_reward": 0.0015158154808909727,
              "num_responses": 6,
              "rvariance": 0.025835757232288037
            },
            {
              "id": "chat_hard_sample_318",
              "rewards": [
                0.08784460605398349,
                0.8877043292550549,
                0.7027656649311077,
                -0.26816232276961477,
                0.943185928552239,
                0.8830808626469562
              ],
              "variance": 1.0056039872614626,
              "mean_reward": 0.5394031781116211,
              "min_reward": -0.26816232276961477,
              "max_reward": 0.943185928552239,
              "num_responses": 6,
              "rvariance": 0.21420383943349033
            },
            {
              "id": "chat_hard_sample_176",
              "rewards": [
                -2.0112092340228167,
                -1.6690727050235146,
                -1.9742215011580273,
                -1.78928283683408,
                -1.9557276347256327,
                -1.863258302563659,
                -1.1836087111731532
              ],
              "variance": 0.5141294868205732,
              "mean_reward": -1.7780544179286977,
              "min_reward": -2.0112092340228167,
              "max_reward": -1.1836087111731532,
              "num_responses": 7,
              "rvariance": 0.07100556516477215
            },
            {
              "id": "chat_hard_sample_274",
              "rewards": [
                -0.5779345855122263,
                -0.35600818832348974,
                -0.10171752487806233,
                -0.3143969888506016,
                -0.2878120558540342,
                -0.43923058726926595
              ],
              "variance": 0.3138177960246979,
              "mean_reward": -0.34618332178128003,
              "min_reward": -0.5779345855122263,
              "max_reward": -0.10171752487806233,
              "num_responses": 6,
              "rvariance": 0.021107345226818175
            },
            {
              "id": "chat_hard_sample_389",
              "rewards": [
                -0.221927656688628,
                -0.5224529862150421,
                0.5848672664245914,
                -0.19303099038801125,
                -0.25429192294531877,
                -0.16297845743536984,
                -0.011307080190007706
              ],
              "variance": 0.5887190067090402,
              "mean_reward": -0.11158883249111232,
              "min_reward": -0.5224529862150421,
              "max_reward": 0.5848672664245914,
              "num_responses": 7,
              "rvariance": 0.10081848959457547
            },
            {
              "id": "chat_hard_sample_42",
              "rewards": [
                -0.7721201830523708,
                -1.0772689791868837,
                -0.8877068482548378,
                -0.9385649809439233,
                0.3375118028913121,
                -0.8553425819981471,
                0.28087433694210334
              ],
              "variance": 1.2975759035628942,
              "mean_reward": -0.5589453476575352,
              "min_reward": -1.0772689791868837,
              "max_reward": 0.3375118028913121,
              "num_responses": 7,
              "rvariance": 0.30901170480497536
            },
            {
              "id": "chat_hard_sample_5",
              "rewards": [
                -1.5118748403481594,
                -0.15951085747929583,
                0.16875527169571036,
                -0.7351324501875813,
                0.011268440357349124,
                -0.21268072347243064,
                -0.17800472391169053
              ],
              "variance": 1.1200925791445062,
              "mean_reward": -0.37388284047801407,
              "min_reward": -1.5118748403481594,
              "max_reward": 0.16875527169571036,
              "num_responses": 7,
              "rvariance": 0.28266205833825814
            },
            {
              "id": "chat_hard_sample_17",
              "rewards": [
                0.8830808626469562,
                0.5224504672152592,
                1.1235011262680876,
                1.1281245928761863,
                1.1882296587814691,
                0.5316974004314566
              ],
              "variance": 0.6311031920054697,
              "mean_reward": 0.8961806847032358,
              "min_reward": 0.5224504672152592,
              "max_reward": 1.1882296587814691,
              "num_responses": 6,
              "rvariance": 0.07724318471116481
            },
            {
              "id": "chat_hard_sample_182",
              "rewards": [
                0.41148726862089097,
                0.4877744676545192,
                -0.18840752377991257,
                0.18031393821595706
              ],
              "variance": 0.5426793931255824,
              "mean_reward": 0.22279203767786368,
              "min_reward": -0.18840752377991257,
              "max_reward": 0.4877744676545192,
              "num_responses": 4,
              "rvariance": 0.06917776166348467
            },
            {
              "id": "chat_hard_sample_140",
              "rewards": [
                -0.5409468526474369,
                -0.7674967164442721,
                -0.7397559167956801,
                -0.3259556553708483,
                -0.09824992492198834
              ],
              "variance": 0.567068179483303,
              "mean_reward": -0.4944810132360451,
              "min_reward": -0.7674967164442721,
              "max_reward": -0.09824992492198834,
              "num_responses": 5,
              "rvariance": 0.06445125966736213
            },
            {
              "id": "chat_hard_sample_251",
              "rewards": [
                -0.37681378805993376,
                0.1872491381281051,
                -0.7027681839308906,
                -0.466971386917858,
                -0.33057912197894695,
                -0.35831992162753906
              ],
              "variance": 0.5132047934989533,
              "mean_reward": -0.3413672107311772,
              "min_reward": -0.7027681839308906,
              "max_reward": 0.1872491381281051,
              "num_responses": 6,
              "rvariance": 0.07124709231608974
            },
            {
              "id": "chat_hard_sample_98",
              "rewards": [
                0.4022403354046936,
                0.30745926993867073,
                0.8507165963902654,
                0.6380371324177262,
                0.2057430045604998,
                0.527073933823358,
                0.813728863525476
              ],
              "variance": 0.5617511928839893,
              "mean_reward": 0.5349998765800985,
              "min_reward": 0.2057430045604998,
              "max_reward": 0.8507165963902654,
              "num_responses": 7,
              "rvariance": 0.05226518617234331
            },
            {
              "id": "chat_hard_sample_409",
              "rewards": [
                0.929315528727943,
                0.37449953575610156,
                0.6241667325934303,
                0.7582472642282919,
                0.5432560669517034,
                0.6935187317149104
              ],
              "variance": 0.384903595124215,
              "mean_reward": 0.6538339766620634,
              "min_reward": 0.37449953575610156,
              "max_reward": 0.929315528727943,
              "num_responses": 6,
              "rvariance": 0.029917074882567497
            },
            {
              "id": "chat_hard_sample_248",
              "rewards": [
                -0.20112205695218394,
                -0.6472865846337065,
                -0.323643922066799,
                -0.5270764528231409,
                -0.5085825863907462,
                -0.3028383223303549,
                -0.47621832013405535
              ],
              "variance": 0.31300868936828063,
              "mean_reward": -0.42668117790442667,
              "min_reward": -0.6472865846337065,
              "max_reward": -0.20112205695218394,
              "num_responses": 7,
              "rvariance": 0.020676910269793455
            },
            {
              "id": "chat_hard_sample_382",
              "rewards": [
                -0.7073916505389893,
                -0.7166385837551866,
                -0.0647297920132729,
                -0.5132060529988448,
                -0.5848697854243743,
                -0.4692831202219073,
                -0.29243552246213284
              ],
              "variance": 0.5097371935428795,
              "mean_reward": -0.4783649296306726,
              "min_reward": -0.7166385837551866,
              "max_reward": -0.0647297920132729,
              "num_responses": 7,
              "rvariance": 0.046790144587000704
            },
            {
              "id": "chat_hard_sample_254",
              "rewards": [
                0.6287901992015289,
                0.1791580715639324,
                0.7027656649311077,
                0.36987606914800286,
                0.49008620095856853,
                0.28318607024615267
              ],
              "variance": 0.43460586116127575,
              "mean_reward": 0.4423103793415489,
              "min_reward": 0.1791580715639324,
              "max_reward": 0.7027656649311077,
              "num_responses": 6,
              "rvariance": 0.03411843671078633
            },
            {
              "id": "chat_hard_sample_2",
              "rewards": [
                -1.7153073711045013,
                -1.2529607102946334,
                -1.114256712051673,
                -1.6875665714559092,
                -1.2344668438622386,
                -1.3824177753213964,
                -1.6228380389425276
              ],
              "variance": 0.5122801001773338,
              "mean_reward": -1.4299734318618398,
              "min_reward": -1.7153073711045013,
              "max_reward": -1.114256712051673,
              "num_responses": 7,
              "rvariance": 0.05092305089980167
            },
            {
              "id": "chat_hard_sample_203",
              "rewards": [
                -0.09536025829192665,
                -0.07831122517456278,
                -0.05403802548204471,
                -0.30977352224250293,
                0.05085687318919406,
                -0.026875159159464975,
                0.010907232028591415
              ],
              "variance": 0.20801265236498961,
              "mean_reward": -0.07179915501895949,
              "min_reward": -0.30977352224250293,
              "max_reward": 0.05085687318919406,
              "num_responses": 7,
              "rvariance": 0.011635400420180918
            },
            {
              "id": "chat_hard_sample_68",
              "rewards": [
                0.35600566932370686,
                -0.0038029771600662965,
                -0.39530765449232846,
                -0.15373152421917247,
                -0.09478232496591432
              ],
              "variance": 0.5107594131132637,
              "mean_reward": -0.05832376230275493,
              "min_reward": -0.39530765449232846,
              "max_reward": 0.35600566932370686,
              "num_responses": 5,
              "rvariance": 0.05972628106901591
            },
            {
              "id": "chat_hard_sample_220",
              "rewards": [
                -0.05346009215603238,
                -0.4877769866543021,
                -0.4646596536138087,
                -0.6102988517689171,
                -0.4276719207490192,
                -0.5617524523838809,
                -0.4068663210125752
              ],
              "variance": 0.3156671826679374,
              "mean_reward": -0.4303551826197908,
              "min_reward": -0.6102988517689171,
              "max_reward": -0.05346009215603238,
              "num_responses": 7,
              "rvariance": 0.02810398037237418
            },
            {
              "id": "chat_hard_sample_11",
              "rewards": [
                -0.344449521803243,
                0.5825555331205421,
                0.15488487187141434,
                0.30514753663462135
              ],
              "variance": 0.6939823378756117,
              "mean_reward": 0.1745346049558337,
              "min_reward": -0.344449521803243,
              "max_reward": 0.5825555331205421,
              "num_responses": 4,
              "rvariance": 0.11331786289507201
            },
            {
              "id": "chat_hard_sample_6",
              "rewards": [
                0.22770447094896853,
                0.5155152673031113,
                0.8322227299578707,
                0.8969512624712522,
                0.5501912668638513,
                0.9940440612413245
              ],
              "variance": 0.5738877927302485,
              "mean_reward": 0.6694381764643964,
              "min_reward": 0.22770447094896853,
              "max_reward": 0.9940440612413245,
              "num_responses": 6,
              "rvariance": 0.06944512493243161
            },
            {
              "id": "chat_hard_sample_286",
              "rewards": [
                -1.5396156399967516,
                -1.6413319053749225,
                -1.5026279071319621,
                -1.5396156399967516,
                -0.9801761804168113,
                -1.4009116417537912
              ],
              "variance": 0.39992986160053556,
              "mean_reward": -1.4340464857784985,
              "min_reward": -1.6413319053749225,
              "max_reward": -0.9801761804168113,
              "num_responses": 6,
              "rvariance": 0.046176086859082394
            },
            {
              "id": "chat_hard_sample_400",
              "rewards": [
                1.2714520577272452,
                1.1235011262680876,
                1.3269336570244294,
                0.9246920621198443,
                1.0633960603628048,
                1.0818899267951994,
                0.9940440612413245
              ],
              "variance": 0.3273414358533865,
              "mean_reward": 1.112272707362705,
              "min_reward": 0.9246920621198443,
              "max_reward": 1.3269336570244294,
              "num_responses": 7,
              "rvariance": 0.017717145356236263
            },
            {
              "id": "chat_hard_sample_209",
              "rewards": [
                -1.0495281795382916,
                -0.7166385837551866,
                -1.0032935134573047,
                -1.1789852445650546,
                -0.473906586830006,
                -0.7305089835794827,
                -0.7628732498361734
              ],
              "variance": 0.4817652205638825,
              "mean_reward": -0.8451049059373571,
              "min_reward": -1.1789852445650546,
              "max_reward": -0.473906586830006,
              "num_responses": 7,
              "rvariance": 0.050353521370042835
            },
            {
              "id": "chat_hard_sample_337",
              "rewards": [
                1.5950947202941528,
                1.0633960603628048,
                1.2991928573758373,
                0.7443768644039959,
                0.5525030001679007,
                0.8414696631740681,
                0.8322227299578707
              ],
              "variance": 0.7499262838336058,
              "mean_reward": 0.9897508422480901,
              "min_reward": 0.5525030001679007,
              "max_reward": 1.5950947202941528,
              "num_responses": 7,
              "rvariance": 0.10940223831449283
            },
            {
              "id": "chat_hard_sample_268",
              "rewards": [
                -0.7536263166199761,
                -0.18956339043193723,
                -0.5617524523838809,
                -0.18956339043193723,
                -0.18956339043193723,
                -0.6056753851608184
              ],
              "variance": 0.4900874604584601,
              "mean_reward": -0.4149573875767478,
              "min_reward": -0.7536263166199761,
              "max_reward": -0.18956339043193723,
              "num_responses": 6,
              "rvariance": 0.05417102516670664
            },
            {
              "id": "chat_hard_sample_249",
              "rewards": [
                0.32826486967511476,
                0.9246920621198443,
                0.6334136658096275,
                0.3606291359318055,
                0.5871789997286407,
                0.8044819303092787,
                0.26006873720565926
              ],
              "variance": 0.5515795663461724,
              "mean_reward": 0.5569613429685673,
              "min_reward": 0.26006873720565926,
              "max_reward": 0.9246920621198443,
              "num_responses": 7,
              "rvariance": 0.05460628845519254
            },
            {
              "id": "chat_hard_sample_295",
              "rewards": [
                -0.31208525554655225,
                1.1188776596599888,
                1.4656376552673898,
                1.28994592415964,
                1.474884588483587,
                1.1789827255652716,
                1.5950947202941528
              ],
              "variance": 0.9764761476304409,
              "mean_reward": 1.115905431126211,
              "min_reward": -0.31208525554655225,
              "max_reward": 1.5950947202941528,
              "num_responses": 7,
              "rvariance": 0.36489087321838615
            },
            {
              "id": "chat_hard_sample_153",
              "rewards": [
                -0.6704039176741998,
                -0.6704039176741998,
                -0.6704039176741998,
                -0.7212620503632854,
                -0.6704039176741998,
                -1.7430481707530934
              ],
              "variance": 0.5617511928839896,
              "mean_reward": -0.8576543153021964,
              "min_reward": -1.7430481707530934,
              "max_reward": -0.6704039176741998,
              "num_responses": 6,
              "rvariance": 0.15712932914212355
            },
            {
              "id": "chat_hard_sample_192",
              "rewards": [
                -0.5709993856000782,
                -0.7490028500118774,
                -0.16991365734751784,
                -0.4022428544044765,
                -0.3190204554587003
              ],
              "variance": 0.4482450876551669,
              "mean_reward": -0.44223584056453,
              "min_reward": -0.7490028500118774,
              "max_reward": -0.16991365734751784,
              "num_responses": 5,
              "rvariance": 0.04032537803124934
            },
            {
              "id": "chat_hard_sample_363",
              "rewards": [
                -0.9940465802411074,
                -1.3731708421051991,
                -1.100386312227377,
                -1.1789852445650546,
                -0.970929247200614,
                -1.100386312227377
              ],
              "variance": 0.2935901296142662,
              "mean_reward": -1.119650756427788,
              "min_reward": -1.3731708421051991,
              "max_reward": -0.970929247200614,
              "num_responses": 6,
              "rvariance": 0.017738291554572985
            },
            {
              "id": "chat_hard_sample_129",
              "rewards": [
                -0.35369645501944036,
                -0.6472865846337065,
                -0.337514321891095,
                -0.33289085528299633,
                -0.33289085528299633
              ],
              "variance": 0.19695967750500365,
              "mean_reward": -0.40085581442204693,
              "min_reward": -0.6472865846337065,
              "max_reward": -0.33289085528299633,
              "num_responses": 5,
              "rvariance": 0.015240549140794046
            },
            {
              "id": "chat_hard_sample_359",
              "rewards": [
                -1.215972977429844,
                -1.1235036452678704,
                -0.9663057805925154,
                -1.2252199106460413,
                -1.3084423095918176,
                -0.6472865846337065,
                -0.9293180477277259
              ],
              "variance": 0.44200340773423386,
              "mean_reward": -1.059435607984217,
              "min_reward": -1.3084423095918176,
              "max_reward": -0.6472865846337065,
              "num_responses": 7,
              "rvariance": 0.04479542793925568
            },
            {
              "id": "chat_hard_sample_7",
              "rewards": [
                -0.26238298950949146,
                0.9755501948089298,
                0.9246920621198443,
                0.813728863525476,
                1.0680195269709034,
                1.0264083274980154
              ],
              "variance": 0.7715409902264672,
              "mean_reward": 0.7576693309022796,
              "min_reward": -0.26238298950949146,
              "max_reward": 1.0680195269709034,
              "num_responses": 6,
              "rvariance": 0.21459266061109483
            },
            {
              "id": "chat_hard_sample_316",
              "rewards": [
                0.13407927213497028,
                -0.2173041900805293,
                -0.1306141911786791,
                -0.01770046760901916,
                -0.22077179003660333,
                0.15257313856736499,
                -0.13234799115671608
              ],
              "variance": 0.3601680487708871,
              "mean_reward": -0.06172660276560167,
              "min_reward": -0.22077179003660333,
              "max_reward": 0.15257313856736499,
              "num_responses": 7,
              "rvariance": 0.020776465423177234
            },
            {
              "id": "chat_hard_sample_41",
              "rewards": [
                -0.8553425819981471,
                -0.15951085747929583,
                -0.08784712505376631,
                0.0638603730244716,
                -0.3906841878842298,
                -0.7952375160928642
              ],
              "variance": 0.8132966730308583,
              "mean_reward": -0.37079364924730523,
              "min_reward": -0.8553425819981471,
              "max_reward": 0.0638603730244716,
              "num_responses": 6,
              "rvariance": 0.1214931950979301
            },
            {
              "id": "chat_hard_sample_143",
              "rewards": [
                0.670401398674417,
                0.5848672664245914,
                0.6195432659853315,
                0.5709968666002954
              ],
              "variance": 0.07998597232010707,
              "mean_reward": 0.6114521994211588,
              "min_reward": 0.5709968666002954,
              "max_reward": 0.670401398674417,
              "num_responses": 4,
              "rvariance": 0.001470966516706253
            },
            {
              "id": "chat_hard_sample_370",
              "rewards": [
                -0.3837489879720818,
                -0.6657804510661012,
                -0.589493252032473,
                -0.47621832013405535,
                -0.7212620503632854,
                -0.7443793834037787,
                -0.6981447173227919
              ],
              "variance": 0.2912783963102168,
              "mean_reward": -0.6112895946135097,
              "min_reward": -0.7443793834037787,
              "max_reward": -0.3837489879720818,
              "num_responses": 7,
              "rvariance": 0.015830565155974176
            },
            {
              "id": "chat_hard_sample_91",
              "rewards": [
                1.7153048521047185,
                1.391662189537811,
                0.9755501948089298,
                1.909490449644863,
                1.3639213898892188,
                1.391662189537811,
                1.2714520577272452
              ],
              "variance": 0.6398877785608572,
              "mean_reward": 1.431291903321514,
              "min_reward": 0.9755501948089298,
              "max_reward": 1.909490449644863,
              "num_responses": 7,
              "rvariance": 0.07860947148702167
            },
            {
              "id": "chat_hard_sample_245",
              "rewards": [
                -0.4438540538773646,
                -0.8137313825252589,
                -0.4715948535259567,
                -0.6010519185527197,
                -0.5085825863907462,
                -0.7166385837551866,
                -0.7073916505389893
              ],
              "variance": 0.29497716959669573,
              "mean_reward": -0.6089778613094603,
              "min_reward": -0.8137313825252589,
              "max_reward": -0.4438540538773646,
              "num_responses": 7,
              "rvariance": 0.017068871988774246
            },
            {
              "id": "chat_hard_sample_131",
              "rewards": [
                0.18609327147608043,
                0.5201387339112099,
                0.3421352694994108,
                0.38605820227634824,
                0.5918024663367395,
                0.5108918006950126
              ],
              "variance": 0.2918563296362291,
              "mean_reward": 0.4228532906991336,
              "min_reward": 0.18609327147608043,
              "max_reward": 0.5918024663367395,
              "num_responses": 6,
              "rvariance": 0.018280607472138537
            },
            {
              "id": "chat_hard_sample_171",
              "rewards": [
                -1.5950972392939358,
                -1.128127111875969,
                -0.8553425819981471,
                -1.3269361760242122,
                -1.604344172510133,
                -1.4101585749699885,
                -1.2807015099432255
              ],
              "variance": 0.5797827126555744,
              "mean_reward": -1.3143867666593732,
              "min_reward": -1.604344172510133,
              "max_reward": -0.8553425819981471,
              "num_responses": 7,
              "rvariance": 0.05982175894118127
            },
            {
              "id": "chat_hard_sample_329",
              "rewards": [
                2.2608739118603625,
                1.2529581912948506,
                1.678317119239929,
                1.1882296587814691,
                1.1882296587814691
              ],
              "variance": 0.83962153603072,
              "mean_reward": 1.513721707991616,
              "min_reward": 1.1882296587814691,
              "max_reward": 2.2608739118603625,
              "num_responses": 5,
              "rvariance": 0.17304316499760636
            },
            {
              "id": "chat_hard_sample_384",
              "rewards": [
                0.1259882055707976,
                0.03785337335391653,
                -0.4253601874449699,
                -0.12367899126653106,
                -0.2589153895534174,
                -0.23579805651292404,
                -0.08784712505376631
              ],
              "variance": 0.3986006149507074,
              "mean_reward": -0.13825116727241352,
              "min_reward": -0.4253601874449699,
              "max_reward": 0.1259882055707976,
              "num_responses": 7,
              "rvariance": 0.03001357296841931
            },
            {
              "id": "chat_hard_sample_29",
              "rewards": [
                -0.2912796558101082,
                0.10749433913840288,
                0.7258829979716012,
                0.6611544654582197,
                0.6102963327691342,
                0.5016448674788152,
                0.4438515348775817
              ],
              "variance": 0.7390611373045738,
              "mean_reward": 0.3941492688405209,
              "min_reward": -0.2912796558101082,
              "max_reward": 0.7258829979716012,
              "num_responses": 7,
              "rvariance": 0.11343829625072813
            },
            {
              "id": "chat_hard_sample_106",
              "rewards": [
                -0.3629433882356377,
                -0.7906140494847655,
                -0.4415423205733153,
                -0.6380396514175092,
                -0.37681378805993376,
                -0.3213321887627496,
                -0.4900887199583514
              ],
              "variance": 0.35277050219792927,
              "mean_reward": -0.4887677294988945,
              "min_reward": -0.7906140494847655,
              "max_reward": -0.3213321887627496,
              "num_responses": 7,
              "rvariance": 0.024575057426561138
            },
            {
              "id": "chat_hard_sample_320",
              "rewards": [
                0.3398235361953615,
                -0.3074617889384536,
                0.054902406471280404,
                0.03640854003888569,
                0.046811339907107716,
                0.012857757003883046
              ],
              "variance": 0.34466498730060624,
              "mean_reward": 0.03055696511301079,
              "min_reward": -0.3074617889384536,
              "max_reward": 0.3398235361953615,
              "num_responses": 6,
              "rvariance": 0.03518448303186972
            },
            {
              "id": "chat_hard_sample_23",
              "rewards": [
                0.6750248652825157,
                1.0680195269709034,
                1.2991928573758373,
                1.0264083274980154,
                1.6320824531589422,
                1.215970458430061,
                1.9187373828610603
              ],
              "variance": 0.8608894824279739,
              "mean_reward": 1.262205124511048,
              "min_reward": 0.6750248652825157,
              "max_reward": 1.9187373828610603,
              "num_responses": 7,
              "rvariance": 0.14420548769046881
            },
            {
              "id": "chat_hard_sample_235",
              "rewards": [
                0.0212377902310619,
                -0.0047562285151784385,
                0.45541020139782845,
                -0.24042152312102272,
                -0.2022779236042086,
                0.28087433694210334,
                -0.13119212450469142
              ],
              "variance": 0.5682240461353277,
              "mean_reward": 0.025553504117984644,
              "min_reward": -0.24042152312102272,
              "max_reward": 0.45541020139782845,
              "num_responses": 7,
              "rvariance": 0.05687455425914657
            },
            {
              "id": "chat_hard_sample_202",
              "rewards": [
                0.12309853894073591,
                0.30977100324272006,
                0.3143944698508187,
                -0.15488739087119716,
                -0.07917812516358128,
                0.3143944698508187,
                0.3791230023642002
              ],
              "variance": 0.449747714302799,
              "mean_reward": 0.17238799545921646,
              "min_reward": -0.15488739087119716,
              "max_reward": 0.3791230023642002,
              "num_responses": 7,
              "rvariance": 0.03925275335896059
            },
            {
              "id": "chat_hard_sample_304",
              "rewards": [
                -1.8262705696988697,
                -0.8322252489576536,
                -0.5455703192555356,
                -0.7212620503632854,
                -0.39530765449232846,
                -0.6380396514175092,
                -0.6056753851608184
              ],
              "variance": 0.7443781239038872,
              "mean_reward": -0.7949072684780001,
              "min_reward": -1.8262705696988697,
              "max_reward": -0.39530765449232846,
              "num_responses": 7,
              "rvariance": 0.1932559185163603
            },
            {
              "id": "chat_hard_sample_277",
              "rewards": [
                -0.16182259078334515,
                -0.10460719150812402,
                -0.11732172468039538,
                -0.22770698994875135,
                -0.27394165602973813,
                0.028750923469222252
              ],
              "variance": 0.21289618896979384,
              "mean_reward": -0.14277487158018864,
              "min_reward": -0.27394165602973813,
              "max_reward": 0.028750923469222252,
              "num_responses": 6,
              "rvariance": 0.009384456422794478
            },
            {
              "id": "chat_hard_sample_196",
              "rewards": [
                -0.7212620503632854,
                -0.9755527138087127,
                -0.7536263166199761,
                -0.45310098709356195,
                -0.6010519185527197,
                -0.49702391987049943,
                -0.5779345855122263
              ],
              "variance": 0.36294212873574627,
              "mean_reward": -0.6542217845458546,
              "min_reward": -0.9755527138087127,
              "max_reward": -0.45310098709356195,
              "num_responses": 7,
              "rvariance": 0.027348105650162925
            },
            {
              "id": "chat_hard_sample_185",
              "rewards": [
                -2.4458150951840922,
                -2.723223091670013,
                -2.094431632968593,
                -1.9002460354284485,
                -2.408827362319303,
                -2.242382564427751,
                -2.112925499400988
              ],
              "variance": 0.5400208998259255,
              "mean_reward": -2.2754073259141694,
              "min_reward": -2.723223091670013,
              "max_reward": -1.9002460354284485,
              "num_responses": 7,
              "rvariance": 0.06405254973367551
            },
            {
              "id": "chat_hard_sample_160",
              "rewards": [
                -1.3361831092404097,
                -1.3639239088890016,
                -1.4194055081861858,
                -1.8447644361312643,
                -1.4194055081861858,
                -1.7800359036178828,
                -1.4194055081861858
              ],
              "variance": 0.45309972759367056,
              "mean_reward": -1.5118748403481594,
              "min_reward": -1.8447644361312643,
              "max_reward": -1.3361831092404097,
              "num_responses": 7,
              "rvariance": 0.03730494764361457
            },
            {
              "id": "chat_hard_sample_163",
              "rewards": [
                0.05114583985220023,
                0.39761686879659497,
                0.39761686879659497,
                -0.17338125730359186,
                0.39761686879659497,
                0.020226406910540316
              ],
              "variance": 0.47419429399312074,
              "mean_reward": 0.18180693264148892,
              "min_reward": -0.17338125730359186,
              "max_reward": 0.39761686879659497,
              "num_responses": 6,
              "rvariance": 0.051510170561776085
            },
            {
              "id": "chat_hard_sample_266",
              "rewards": [
                0.4993331341747659,
                -0.05692769211210639,
                0.418422468533039,
                0.4438515348775817,
                0.35138220271560816,
                0.3398235361953615,
                0.5825555331205421
              ],
              "variance": 0.351499048880702,
              "mean_reward": 0.368348673929256,
              "min_reward": -0.05692769211210639,
              "max_reward": 0.5825555331205421,
              "num_responses": 7,
              "rvariance": 0.0361730152013336
            },
            {
              "id": "chat_hard_sample_289",
              "rewards": [
                -0.9940465802411074,
                -1.604344172510133,
                -0.7027681839308906,
                -0.5340116527352888,
                -0.7351324501875813,
                -0.6287927182013118,
                -0.9663057805925154
              ],
              "variance": 0.6472853251338151,
              "mean_reward": -0.8807716483426897,
              "min_reward": -1.604344172510133,
              "max_reward": -0.5340116527352888,
              "num_responses": 7,
              "rvariance": 0.11147662583958155
            },
            {
              "id": "chat_hard_sample_69",
              "rewards": [
                0.24966593733743725,
                -0.14448459100297512,
                0.15835247182748835,
                0.5617499333840981,
                0.36987606914800286,
                0.32826486967511476,
                0.39068166888444694
              ],
              "variance": 0.42189132798900447,
              "mean_reward": 0.273443765607659,
              "min_reward": -0.14448459100297512,
              "max_reward": 0.5617499333840981,
              "num_responses": 7,
              "rvariance": 0.042520745320064654
            },
            {
              "id": "chat_hard_sample_40",
              "rewards": [
                -0.49471218656645005,
                -1.0264108464977981,
                -0.8091079159171602,
                -0.49933565317454875,
                -0.9755527138087127,
                -0.41842498753282187,
                -0.6935212507146933
              ],
              "variance": 0.5316986599313481,
              "mean_reward": -0.7024379363160264,
              "min_reward": -1.0264108464977981,
              "max_reward": -0.41842498753282187,
              "num_responses": 7,
              "rvariance": 0.050867428521368704
            },
            {
              "id": "chat_hard_sample_313",
              "rewards": [
                -0.7813671162685681,
                -0.6010519185527197,
                -0.5871815187284236,
                -0.9755527138087127,
                -0.7305089835794827,
                -0.6195457849851144,
                -0.6657804510661012
              ],
              "variance": 0.2635375966616247,
              "mean_reward": -0.7087126409984459,
              "min_reward": -0.9755527138087127,
              "max_reward": -0.5871815187284236,
              "num_responses": 7,
              "rvariance": 0.01615884625221587
            },
            {
              "id": "chat_hard_sample_226",
              "rewards": [
                0.3352000695872628,
                0.8507165963902654,
                0.2982123367224733,
                0.43229286835733505,
                0.2982123367224733,
                1.031031794106114,
                0.2982123367224733
              ],
              "variance": 0.6246303387541317,
              "mean_reward": 0.506268334086914,
              "min_reward": 0.2982123367224733,
              "max_reward": 1.031031794106114,
              "num_responses": 7,
              "rvariance": 0.07980284416312687
            },
            {
              "id": "chat_hard_sample_28",
              "rewards": [
                0.06877280629557644,
                0.8969512624712522,
                0.9847971280251272,
                1.1697357923490743,
                1.0495256605385086,
                1.0911368600113969,
                1.215970458430061
              ],
              "variance": 0.6225497787804869,
              "mean_reward": 0.9252699954458566,
              "min_reward": 0.06877280629557644,
              "max_reward": 1.215970458430061,
              "num_responses": 7,
              "rvariance": 0.13216491961084348
            },
            {
              "id": "chat_hard_sample_323",
              "rewards": [
                0.4230459351411377,
                1.3731683231054161,
                1.3084397905920346,
                1.4841315216997846
              ],
              "variance": 0.7621784703450671,
              "mean_reward": 1.1471963926345932,
              "min_reward": 0.4230459351411377,
              "max_reward": 1.4841315216997846,
              "num_responses": 4,
              "rvariance": 0.17874547825793258
            },
            {
              "id": "chat_hard_sample_116",
              "rewards": [
                -0.4484775204854633,
                -0.06790842530634075,
                -0.2670064561175901,
                -0.34676125510729233,
                0.01618087362845397,
                -0.12021139131045705,
                -0.13177005783070375
              ],
              "variance": 0.3531750555261379,
              "mean_reward": -0.19513631893277048,
              "min_reward": -0.4484775204854633,
              "max_reward": 0.01618087362845397,
              "num_responses": 7,
              "rvariance": 0.023258303272413523
            },
            {
              "id": "chat_hard_sample_36",
              "rewards": [
                1.0587725937547061,
                1.345427523456824,
                1.3546744566730216,
                1.7153048521047185,
                1.5118723213483765,
                1.909490449644863,
                1.5396131209969686
              ],
              "variance": 0.5622135395447996,
              "mean_reward": 1.490736473997068,
              "min_reward": 1.0587725937547061,
              "max_reward": 1.909490449644863,
              "num_responses": 7,
              "rvariance": 0.06497740810448274
            },
            {
              "id": "chat_hard_sample_351",
              "rewards": [
                0.3352000695872628,
                0.024849873518638994,
                0.46928060122212445,
                0.36987606914800286,
                0.7258829979716012,
                0.3999286021006443,
                0.4392280682694831
              ],
              "variance": 0.3608615687621019,
              "mean_reward": 0.3948923259739653,
              "min_reward": 0.024849873518638994,
              "max_reward": 0.7258829979716012,
              "num_responses": 7,
              "rvariance": 0.036885693966175984
            },
            {
              "id": "chat_hard_sample_296",
              "rewards": [
                1.0402787273223113,
                2.0851821807526125,
                1.7800333846181,
                1.3546744566730216,
                1.5396131209969686,
                1.835514983915284
              ],
              "variance": 0.762871990336282,
              "mean_reward": 1.605882809046383,
              "min_reward": 1.0402787273223113,
              "max_reward": 2.0851821807526125,
              "num_responses": 6,
              "rvariance": 0.11669875525736738
            },
            {
              "id": "chat_hard_sample_338",
              "rewards": [
                -0.6010519185527197,
                -0.3652551215396871,
                -0.29243552246213284,
                -0.39993112110042717,
                -0.1907192570839619,
                -0.27394165602973813,
                -0.36987858814778574
              ],
              "variance": 0.23972674362991653,
              "mean_reward": -0.3561733121309218,
              "min_reward": -0.6010519185527197,
              "max_reward": -0.1907192570839619,
              "num_responses": 7,
              "rvariance": 0.014335741001459661
            },
            {
              "id": "chat_hard_sample_354",
              "rewards": [
                -0.6565335178499039,
                -0.018928575926795373,
                0.2566011372495853,
                -0.3190204554587003,
                0.24157487077326456,
                -0.2797209892898615,
                -0.027597575816980396
              ],
              "variance": 0.7016110577789745,
              "mean_reward": -0.11480358661705596,
              "min_reward": -0.6565335178499039,
              "max_reward": 0.2566011372495853,
              "num_responses": 7,
              "rvariance": 0.09201679677346526
            },
            {
              "id": "chat_hard_sample_186",
              "rewards": [
                0.23926313746921524,
                0.35600566932370686,
                -0.05057042552597071,
                0.6149197993772328,
                0.34444700280346013,
                0.4785275344383218
              ],
              "variance": 0.452377310936155,
              "mean_reward": 0.330432119647661,
              "min_reward": -0.05057042552597071,
              "max_reward": 0.6149197993772328,
              "num_responses": 6,
              "rvariance": 0.042865106322179373
            },
            {
              "id": "chat_hard_sample_54",
              "rewards": [
                2.4920472422652966,
                0.8692104628226602,
                0.6796483318906144,
                0.7073891315392065,
                1.5581069874293634,
                0.9663032615927325,
                1.3639213898892188
              ],
              "variance": 1.2353902776839671,
              "mean_reward": 1.2338038296327274,
              "min_reward": 0.6796483318906144,
              "max_reward": 2.4920472422652966,
              "num_responses": 7,
              "rvariance": 0.35628074716393526
            },
            {
              "id": "chat_hard_sample_241",
              "rewards": [
                -0.48084178674215405,
                -1.0079169800654035,
                -0.8322252489576536,
                -0.883083381646739,
                -0.827601782349555,
                -0.9524353807682193,
                -0.9755527138087127
              ],
              "variance": 0.2996006362047946,
              "mean_reward": -0.8513796106197768,
              "min_reward": -1.0079169800654035,
              "max_reward": -0.48084178674215405,
              "num_responses": 7,
              "rvariance": 0.02705297985400677
            },
            {
              "id": "chat_hard_sample_67",
              "rewards": [
                0.8830808626469562,
                1.0818899267951994,
                0.9894205946332258,
                0.9755501948089298,
                0.9385624619441404,
                1.2252173916462585,
                1.2252173916462585
              ],
              "variance": 0.3088475694209918,
              "mean_reward": 1.0455626891601384,
              "min_reward": 0.8830808626469562,
              "max_reward": 1.2252173916462585,
              "num_responses": 7,
              "rvariance": 0.01596776702277553
            },
            {
              "id": "chat_hard_sample_262",
              "rewards": [
                0.09015633935803283,
                -0.15835499082727117,
                -0.16297845743536984,
                -0.5178295196069435,
                -0.3259556553708483,
                -0.43923058726926595,
                -0.2670064561175901
              ],
              "variance": 0.41171970145118747,
              "mean_reward": -0.2544570467527509,
              "min_reward": -0.5178295196069435,
              "max_reward": 0.09015633935803283,
              "num_responses": 7,
              "rvariance": 0.03501974039791615
            },
            {
              "id": "chat_hard_sample_244",
              "rewards": [
                -1.0772689791868837,
                -1.4933809739157646,
                -1.4009116417537912,
                -0.9801761804168113,
                -1.6505788385911198,
                -1.1836087111731532,
                -1.1512444449164625
              ],
              "variance": 0.5178282601070521,
              "mean_reward": -1.276738538564855,
              "min_reward": -1.6505788385911198,
              "max_reward": -0.9801761804168113,
              "num_responses": 7,
              "rvariance": 0.050609820564783026
            },
            {
              "id": "chat_hard_sample_85",
              "rewards": [
                1.2529581912948506,
                1.835514983915284,
                1.6413293863751395,
                1.678317119239929,
                1.4009091227540083,
                1.7153048521047185,
                1.3546744566730216
              ],
              "variance": 0.44940095430719174,
              "mean_reward": 1.5541440160509932,
              "min_reward": 1.2529581912948506,
              "max_reward": 1.835514983915284,
              "num_responses": 7,
              "rvariance": 0.04030637480925293
            },
            {
              "id": "chat_hard_sample_398",
              "rewards": [
                0.40455206870874294,
                -0.6334161848094104,
                -0.6334161848094104,
                -0.42304845414092057,
                -0.6519100512418051,
                -0.6334161848094104,
                -0.5617524523838809
              ],
              "variance": 0.5488054863813134,
              "mean_reward": -0.4474867776408707,
              "min_reward": -0.6519100512418051,
              "max_reward": 0.40455206870874294,
              "num_responses": 7,
              "rvariance": 0.12644602570122865
            },
            {
              "id": "chat_hard_sample_319",
              "rewards": [
                -1.5303687067805543,
                -1.3361831092404097,
                -1.2067260442136467,
                -1.4286524414023831,
                -1.4009116417537912,
                -1.4933809739157646,
                -1.2714545767270282
              ],
              "variance": 0.26261290334000487,
              "mean_reward": -1.38109678486194,
              "min_reward": -1.5303687067805543,
              "max_reward": -1.2067260442136467,
              "num_responses": 7,
              "rvariance": 0.011712546009165537
            },
            {
              "id": "chat_hard_sample_190",
              "rewards": [
                -0.5062708530866967,
                -0.9339415143358246,
                -0.5918049853365224,
                -0.12599072457058041,
                -0.0861133250757293,
                -0.4715948535259567
              ],
              "variance": 0.6568212250130185,
              "mean_reward": -0.4526193759885517,
              "min_reward": -0.9339415143358246,
              "max_reward": -0.0861133250757293,
              "num_responses": 6,
              "rvariance": 0.08254919095636294
            },
            {
              "id": "chat_hard_sample_20",
              "rewards": [
                -0.01878409259529229,
                0.8738339294307589,
                1.003290994457522,
                0.79985846370118,
                0.8738339294307589,
                1.678317119239929,
                -0.16182259078334515
              ],
              "variance": 1.3493009362409984,
              "mean_reward": 0.7212182504116446,
              "min_reward": -0.16182259078334515,
              "max_reward": 1.678317119239929,
              "num_responses": 7,
              "rvariance": 0.33939074951874554
            },
            {
              "id": "chat_hard_sample_264",
              "rewards": [
                0.38605820227634824,
                0.7027656649311077,
                1.1188776596599888,
                0.7212595313635025,
                0.9200685955117457,
                1.086513393403298,
                0.9663032615927325
              ],
              "variance": 0.5233764200367704,
              "mean_reward": 0.843120901248389,
              "min_reward": 0.38605820227634824,
              "max_reward": 1.1188776596599888,
              "num_responses": 7,
              "rvariance": 0.057118947603286965
            },
            {
              "id": "chat_hard_sample_27",
              "rewards": [
                0.534009133735506,
                0.6472840656339236,
                0.8553400629983642,
                0.8044819303092787,
                0.8784573960388575,
                0.8784573960388575,
                1.2714520577272452
              ],
              "variance": 0.43368116783965616,
              "mean_reward": 0.8384974346402905,
              "min_reward": 0.534009133735506,
              "max_reward": 1.2714520577272452,
              "num_responses": 7,
              "rvariance": 0.04590852988883798
            },
            {
              "id": "chat_hard_sample_115",
              "rewards": [
                -0.473906586830006,
                -0.39993112110042717,
                -0.2566036562493681,
                -0.38837245458018044,
                0.06212657304643459,
                -0.11905552465843239,
                -0.17338125730359186
              ],
              "variance": 0.38293862181577315,
              "mean_reward": -0.2498748610965102,
              "min_reward": -0.473906586830006,
              "max_reward": 0.06212657304643459,
              "num_responses": 7,
              "rvariance": 0.030320545785864263
            },
            {
              "id": "chat_hard_sample_260",
              "rewards": [
                0.30283580333057203,
                0.41379900192494035,
                0.4484750014856804,
                0.12425440559276059,
                0.45309846809377907,
                0.3167062031548681,
                0.6056728661610356
              ],
              "variance": 0.2827249830852343,
              "mean_reward": 0.3806916785348052,
              "min_reward": 0.12425440559276059,
              "max_reward": 0.6056728661610356,
              "num_responses": 7,
              "rvariance": 0.01963795785851923
            },
            {
              "id": "chat_hard_sample_175",
              "rewards": [
                -0.2797209892898615,
                -0.03511070905514075,
                -0.24042152312102272,
                -0.23001872325280068,
                0.10344880585631654,
                0.03438577339784252,
                -0.2646947228135408
              ],
              "variance": 0.3327162157853012,
              "mean_reward": -0.1303045840397439,
              "min_reward": -0.2797209892898615,
              "max_reward": 0.10344880585631654,
              "num_responses": 7,
              "rvariance": 0.02189715090636322
            },
            {
              "id": "chat_hard_sample_200",
              "rewards": [
                0.17222287165178438,
                0.13523513878699495,
                -0.14679632430702447,
                -0.34676125510729233
              ],
              "variance": 0.4478983276595595,
              "mean_reward": -0.046524892243884376,
              "min_reward": -0.34676125510729233,
              "max_reward": 0.17222287165178438,
              "num_responses": 4,
              "rvariance": 0.04527088169078558
            },
            {
              "id": "chat_hard_sample_240",
              "rewards": [
                0.07108453959962578,
                -0.25429192294531877,
                -0.2034337902562333,
                -0.044791092265847356
              ],
              "variance": 0.275356333178577,
              "mean_reward": -0.10785806646694342,
              "min_reward": -0.25429192294531877,
              "max_reward": 0.07108453959962578,
              "num_responses": 4,
              "rvariance": 0.016643873200438287
            },
            {
              "id": "chat_hard_sample_130",
              "rewards": [
                0.36756433584395354,
                0.18609327147608043,
                0.5432560669517034,
                0.7166360647554038,
                0.4762158011342725,
                0.6195432659853315,
                0.42766940174923634
              ],
              "variance": 0.3634044753965561,
              "mean_reward": 0.4767111725565688,
              "min_reward": 0.18609327147608043,
              "max_reward": 0.7166360647554038,
              "num_responses": 7,
              "rvariance": 0.025881474407069817
            },
            {
              "id": "chat_hard_sample_374",
              "rewards": [
                0.41379900192494035,
                0.6796483318906144,
                0.42766940174923634,
                0.5525030001679007,
                0.4993331341747659,
                0.41148726862089097,
                0.36987606914800286
              ],
              "variance": 0.2085183440252505,
              "mean_reward": 0.47918802966805024,
              "min_reward": 0.36987606914800286,
              "max_reward": 0.6796483318906144,
              "num_responses": 7,
              "rvariance": 0.009918233519009929
            },
            {
              "id": "chat_hard_sample_257",
              "rewards": [
                -0.11558792470235837,
                -0.5085825863907462,
                0.03785337335391653,
                -0.09189265833585265,
                -0.09015885835781565,
                0.06935073962158878,
                -0.18031645721573988
              ],
              "variance": 0.3620752287467278,
              "mean_reward": -0.1256191960038582,
              "min_reward": -0.5085825863907462,
              "max_reward": 0.06935073962158878,
              "num_responses": 7,
              "rvariance": 0.030983549540555894
            },
            {
              "id": "chat_hard_sample_237",
              "rewards": [
                -0.6842743174984959,
                -0.6102988517689171,
                -0.45772445370166065,
                -0.5247647195190915,
                -0.7490028500118774,
                -0.6102988517689171,
                -0.6981447173227919
              ],
              "variance": 0.22053935720630702,
              "mean_reward": -0.6192155373702501,
              "min_reward": -0.7490028500118774,
              "max_reward": -0.45772445370166065,
              "num_responses": 7,
              "rvariance": 0.00892379264341797
            },
            {
              "id": "chat_hard_sample_22",
              "rewards": [
                -0.26585058946556545,
                0.7212595313635025,
                0.425357668445187,
                0.23695140416516589,
                0.2843419368981773
              ],
              "variance": 0.6676285782094492,
              "mean_reward": 0.2804119902812935,
              "min_reward": -0.26585058946556545,
              "max_reward": 0.7212595313635025,
              "num_responses": 5,
              "rvariance": 0.10313257543085667
            },
            {
              "id": "chat_hard_sample_292",
              "rewards": [
                0.29590060341842406,
                0.24273073742528922,
                0.11558540570257557,
                0.040454073320972034,
                0.1311896055049086,
                0.09651360594416851,
                -0.10865272479021036
              ],
              "variance": 0.28318732974604405,
              "mean_reward": 0.11624590093230394,
              "min_reward": -0.10865272479021036,
              "max_reward": 0.29590060341842406,
              "num_responses": 7,
              "rvariance": 0.015030161856910793
            },
            {
              "id": "chat_hard_sample_92",
              "rewards": [
                0.540944333647654,
                0.261224603857684,
                0.17222287165178438,
                0.1641318050876117,
                0.1011370725522672,
                0.3120827365467694
              ],
              "variance": 0.29387909627727227,
              "mean_reward": 0.25862390389062845,
              "min_reward": 0.1011370725522672,
              "max_reward": 0.540944333647654,
              "num_responses": 6,
              "rvariance": 0.020627572106766974
            },
            {
              "id": "chat_hard_sample_407",
              "rewards": [
                -0.6611569844580025,
                -1.2067260442136467,
                -0.3490729884113417,
                -1.3269361760242122,
                -0.41611325422877254
              ],
              "variance": 0.9029630285616721,
              "mean_reward": -0.792001089467195,
              "min_reward": -1.3269361760242122,
              "max_reward": -0.3490729884113417,
              "num_responses": 5,
              "rvariance": 0.16254989642400763
            },
            {
              "id": "chat_hard_sample_44",
              "rewards": [
                -1.3824177753213964,
                -0.8137313825252589,
                -0.6472865846337065,
                -1.1096332454435744,
                -0.9200711145115286,
                -0.9755527138087127
              ],
              "variance": 0.5155165268030029,
              "mean_reward": -0.9747821360406963,
              "min_reward": -1.3824177753213964,
              "max_reward": -0.6472865846337065,
              "num_responses": 6,
              "rvariance": 0.053422701197515354
            },
            {
              "id": "chat_hard_sample_119",
              "rewards": [
                0.6149197993772328,
                0.5733085999043448,
                0.5871789997286407,
                0.09073427268404517,
                0.813728863525476
              ],
              "variance": 0.4504412342940137,
              "mean_reward": 0.535974107043948,
              "min_reward": 0.09073427268404517,
              "max_reward": 0.813728863525476,
              "num_responses": 5,
              "rvariance": 0.057126888515784444
            },
            {
              "id": "chat_hard_sample_303",
              "rewards": [
                0.09998120590024252,
                0.2519776706414866,
                0.6472840656339236,
                0.30977100324272006,
                0.43460460166138437,
                0.34444700280346013,
                0.49008620095856853
              ],
              "variance": 0.3617862620837216,
              "mean_reward": 0.368307392977398,
              "min_reward": 0.09998120590024252,
              "max_reward": 0.6472840656339236,
              "num_responses": 7,
              "rvariance": 0.026654393707378092
            },
            {
              "id": "chat_hard_sample_365",
              "rewards": [
                -2.251629497643948,
                -1.937233768293238,
                -1.8077767032664749,
                -1.9927153675904221,
                -1.7430481707530934
              ],
              "variance": 0.37912426186409176,
              "mean_reward": -1.9464807015094354,
              "min_reward": -2.251629497643948,
              "max_reward": -1.7430481707530934,
              "num_responses": 5,
              "rvariance": 0.031192506320476165
            },
            {
              "id": "chat_hard_sample_45",
              "rewards": [
                -0.26585058946556545,
                -0.1277245245486174,
                -0.2022779236042086,
                -0.28665618920200947,
                -0.03251000908808524,
                -0.14332872435095045,
                0.015313973639435468
              ],
              "variance": 0.2607924133630661,
              "mean_reward": -0.14900485523142873,
              "min_reward": -0.28665618920200947,
              "max_reward": 0.015313973639435468,
              "num_responses": 7,
              "rvariance": 0.01092794754309164
            },
            {
              "id": "chat_hard_sample_78",
              "rewards": [
                0.10055913922625485,
                0.19996367130037646,
                -0.0002902261628975739,
                0.4877744676545192
              ],
              "variance": 0.37146664529442824,
              "mean_reward": 0.19700176300456324,
              "min_reward": -0.0002902261628975739,
              "max_reward": 0.4877744676545192,
              "num_responses": 4,
              "rvariance": 0.03319571183527528
            },
            {
              "id": "chat_hard_sample_189",
              "rewards": [
                2.2331331122117706,
                2.0019597818068364,
                2.112922980401205,
                2.3440963108061386
              ],
              "variance": 0.27555860984268143,
              "mean_reward": 2.1730280463064875,
              "min_reward": 2.0019597818068364,
              "max_reward": 2.3440963108061386,
              "num_responses": 4,
              "rvariance": 0.016438485033200487
            },
            {
              "id": "chat_hard_sample_39",
              "rewards": [
                1.1050072598356928,
                0.7166360647554038,
                1.1789827255652716,
                1.1974765919976664,
                1.1558653925247784
              ],
              "variance": 0.3180945026371892,
              "mean_reward": 1.0707936069357626,
              "min_reward": 0.7166360647554038,
              "max_reward": 1.1974765919976664,
              "num_responses": 5,
              "rvariance": 0.032317762305063516
            },
            {
              "id": "chat_hard_sample_387",
              "rewards": [
                -1.0587751127544889,
                -1.2529607102946334,
                -1.114256712051673,
                -1.3639239088890016,
                -0.9847996470249101,
                -1.072645512578785,
                -0.970929247200614
              ],
              "variance": 0.3180945026371891,
              "mean_reward": -1.1168986929705866,
              "min_reward": -1.3639239088890016,
              "max_reward": -0.970929247200614,
              "num_responses": 7,
              "rvariance": 0.017662177358726012
            },
            {
              "id": "chat_hard_sample_118",
              "rewards": [
                0.7258829979716012,
                1.3176867238082322,
                1.1050072598356928,
                1.215970458430061,
                1.3361805902406267,
                1.262205124511048
              ],
              "variance": 0.4114885281207825,
              "mean_reward": 1.160488859132877,
              "min_reward": 0.7258829979716012,
              "max_reward": 1.3361805902406267,
              "num_responses": 6,
              "rvariance": 0.04349393699291539
            },
            {
              "id": "chat_hard_sample_154",
              "rewards": [
                -0.6380396514175092,
                -0.6981447173227919,
                -0.4068663210125752,
                -0.32826738867489763,
                -0.575622852208177,
                -0.5039591197826474,
                -0.6888977841065946
              ],
              "variance": 0.31716980931556943,
              "mean_reward": -0.5485425477893132,
              "min_reward": -0.6981447173227919,
              "max_reward": -0.32826738867489763,
              "num_responses": 7,
              "rvariance": 0.01734349384935119
            },
            {
              "id": "chat_hard_sample_103",
              "rewards": [
                0.5132035339990619,
                0.08900047270600817,
                0.36987606914800286,
                0.540944333647654,
                -0.04710282556989669,
                0.285497803550202,
                0.418422468533039
              ],
              "variance": 0.4897407004628525,
              "mean_reward": 0.30997740800201024,
              "min_reward": -0.04710282556989669,
              "max_reward": 0.540944333647654,
              "num_responses": 7,
              "rvariance": 0.04099015856647555
            },
            {
              "id": "chat_hard_sample_162",
              "rewards": [
                0.8923277958631536,
                0.5224504672152592,
                0.5132035339990619,
                0.5825555331205421
              ],
              "variance": 0.283418503076449,
              "mean_reward": 0.6276343325495042,
              "min_reward": 0.5132035339990619,
              "max_reward": 0.8923277958631536,
              "num_responses": 4,
              "rvariance": 0.02406319521561883
            },
            {
              "id": "chat_hard_sample_321",
              "rewards": [
                0.6010493995529368,
                1.11425419305189,
                1.0125379276737192,
                1.174359258957173,
                1.262205124511048,
                0.8229757967416734,
                0.8044819303092787
              ],
              "variance": 0.486388687171981,
              "mean_reward": 0.9702662329711026,
              "min_reward": 0.6010493995529368,
              "max_reward": 1.262205124511048,
              "num_responses": 7,
              "rvariance": 0.04784309802343441
            },
            {
              "id": "chat_hard_sample_273",
              "rewards": [
                -0.6287927182013118,
                -0.6287927182013118,
                -0.6287927182013118,
                -0.9663057805925154,
                -0.6287927182013118,
                -0.9663057805925154,
                -0.6287927182013118
              ],
              "variance": 0.3375130623912036,
              "mean_reward": -0.7252250217416556,
              "min_reward": -0.9663057805925154,
              "max_reward": -0.6287927182013118,
              "num_responses": 7,
              "rvariance": 0.02324797291524255
            },
            {
              "id": "chat_hard_sample_291",
              "rewards": [
                0.4831510010464205,
                1.0911368600113969,
                0.9709267282008311,
                1.0587725937547061,
                0.9616797949846337,
                0.8738339294307589,
                1.678317119239929
              ],
              "variance": 0.6084482056257863,
              "mean_reward": 1.0168311466669537,
              "min_reward": 0.4831510010464205,
              "max_reward": 1.678317119239929,
              "num_responses": 7,
              "rvariance": 0.10789367216060075
            },
            {
              "id": "chat_hard_sample_312",
              "rewards": [
                -0.8368487155657524,
                -0.6287927182013118,
                -0.8091079159171602,
                -0.5779345855122263,
                -0.4646596536138087,
                -0.5686876522960289,
                -0.5409468526474369
              ],
              "variance": 0.3097722627426115,
              "mean_reward": -0.6324254419648179,
              "min_reward": -0.8368487155657524,
              "max_reward": -0.4646596536138087,
              "num_responses": 7,
              "rvariance": 0.016652031340988284
            },
            {
              "id": "chat_hard_sample_314",
              "rewards": [
                -0.841472182173851,
                -0.6519100512418051,
                -0.6380396514175092,
                -0.8738364484305418,
                -0.8784599150386404,
                -1.215972977429844
              ],
              "variance": 0.402241594904585,
              "mean_reward": -0.849948537622032,
              "min_reward": -1.215972977429844,
              "max_reward": -0.6380396514175092,
              "num_responses": 6,
              "rvariance": 0.03659231470058447
            },
            {
              "id": "chat_hard_sample_399",
              "rewards": [
                0.8877043292550549,
                1.1419949927004822,
                1.2252173916462585,
                0.684271798498713,
                0.9570563283765351,
                1.0264083274980154,
                1.3731683231054161
              ],
              "variance": 0.47806644727740344,
              "mean_reward": 1.0422602130114966,
              "min_reward": 0.684271798498713,
              "max_reward": 1.3731683231054161,
              "num_responses": 7,
              "rvariance": 0.04463924902569484
            },
            {
              "id": "chat_hard_sample_219",
              "rewards": [
                -0.9108241812953312,
                -1.2714545767270282,
                -1.1050097788354758,
                -0.957058847376318,
                -0.9663057805925154,
                -0.9847996470249101,
                -1.0217873798896995
              ],
              "variance": 0.23302271704817346,
              "mean_reward": -1.0310343131058968,
              "min_reward": -1.2714545767270282,
              "max_reward": -0.9108241812953312,
              "num_responses": 7,
              "rvariance": 0.01280143586460645
            },
            {
              "id": "chat_hard_sample_406",
              "rewards": [
                -0.7582497832280748,
                -1.0541516461463902,
                -0.7906140494847655,
                -0.9616823139844166,
                -0.6287927182013118,
                -0.6704039176741998,
                -0.8137313825252589
              ],
              "variance": 0.3449106089641615,
              "mean_reward": -0.8110894016063455,
              "min_reward": -1.0541516461463902,
              "max_reward": -0.6287927182013118,
              "num_responses": 7,
              "rvariance": 0.019714315932441554
            },
            {
              "id": "chat_hard_sample_253",
              "rewards": [
                0.7536237976201933,
                1.0079144610656205,
                1.2067235252138637,
                0.9663032615927325,
                1.11425419305189,
                0.7397533977958972,
                1.1050072598356928
              ],
              "variance": 0.4031662882262047,
              "mean_reward": 0.9847971280251271,
              "min_reward": 0.7397533977958972,
              "max_reward": 1.2067235252138637,
              "num_responses": 7,
              "rvariance": 0.02783212940601695
            },
            {
              "id": "chat_hard_sample_24",
              "rewards": [
                1.160488859132877,
                1.5118723213483765,
                1.8170211174828894,
                1.9279843160772576,
                1.7985272510504946,
                1.8170211174828894
              ],
              "variance": 0.5363221265394467,
              "mean_reward": 1.6721524970957973,
              "min_reward": 1.160488859132877,
              "max_reward": 1.9279843160772576,
              "num_responses": 6,
              "rvariance": 0.06848062425621103
            },
            {
              "id": "chat_hard_sample_60",
              "rewards": [
                0.8183523301335748,
                0.929315528727943,
                0.9108216622955483,
                1.2991928573758373,
                1.3269336570244294,
                1.1974765919976664,
                1.1789827255652716
              ],
              "variance": 0.4364552478045154,
              "mean_reward": 1.0944393361600386,
              "min_reward": 0.8183523301335748,
              "max_reward": 1.3269336570244294,
              "num_responses": 7,
              "rvariance": 0.035849604471438756
            },
            {
              "id": "chat_hard_sample_386",
              "rewards": [
                -2.325604963373527,
                -2.612259893075645,
                -2.4458150951840922,
                -2.251629497643948,
                -1.9834684343742246,
                -2.2886172305087373
              ],
              "variance": 0.41148852812078207,
              "mean_reward": -2.317899185693362,
              "min_reward": -2.612259893075645,
              "max_reward": -1.9834684343742246,
              "num_responses": 6,
              "rvariance": 0.03669385280709641
            },
            {
              "id": "chat_hard_sample_216",
              "rewards": [
                -1.6690727050235146,
                -1.1327505784840677,
                -1.4841340406995673,
                -1.1327505784840677,
                -1.1512444449164625,
                -1.4841340406995673
              ],
              "variance": 0.44385279437747327,
              "mean_reward": -1.3423477313845413,
              "min_reward": -1.6690727050235146,
              "max_reward": -1.1327505784840677,
              "num_responses": 6,
              "rvariance": 0.04522305375410165
            },
            {
              "id": "chat_hard_sample_300",
              "rewards": [
                2.7139736394540335,
                2.4920472422652966,
                2.7694552387512177,
                2.9174061702103753,
                2.8249368380484015,
                2.861924570913191,
                2.7879491051836123
              ],
              "variance": 0.25891413005352604,
              "mean_reward": 2.766813257832304,
              "min_reward": 2.4920472422652966,
              "max_reward": 2.9174061702103753,
              "num_responses": 7,
              "rvariance": 0.01626354719985443
            },
            {
              "id": "chat_hard_sample_352",
              "rewards": [
                -1.1235036452678704,
                -0.6565335178499039,
                -0.6657804510661012,
                -0.5501937858636342,
                -0.22886285660077602,
                -0.8553425819981471
              ],
              "variance": 0.5998947924008036,
              "mean_reward": -0.6800361397744054,
              "min_reward": -1.1235036452678704,
              "max_reward": -0.22886285660077602,
              "num_responses": 6,
              "rvariance": 0.07476129055506309
            },
            {
              "id": "chat_hard_sample_311",
              "rewards": [
                -2.251629497643948,
                -1.9557276347256327,
                -1.8077767032664749,
                -1.835517502915067,
                -1.96497456794183,
                -1.9557276347256327,
                -1.3731708421051991
              ],
              "variance": 0.4457021810207127,
              "mean_reward": -1.8777891976176837,
              "min_reward": -2.251629497643948,
              "max_reward": -1.3731708421051991,
              "num_responses": 7,
              "rvariance": 0.06011928413405414
            },
            {
              "id": "chat_hard_sample_419",
              "rewards": [
                -0.8368487155657524,
                -0.7351324501875813,
                -0.6426631180256078,
                -0.6935212507146933,
                -0.5918049853365224,
                -0.7721201830523708,
                -0.6010519185527197
              ],
              "variance": 0.2006584507914827,
              "mean_reward": -0.6961632316336068,
              "min_reward": -0.8368487155657524,
              "max_reward": -0.5918049853365224,
              "num_responses": 7,
              "rvariance": 0.007126644502597153
            },
            {
              "id": "chat_hard_sample_287",
              "rewards": [
                -1.9094929686446458,
                -1.9927153675904221,
                -1.7800359036178828,
                -2.094431632968593,
                -1.9834684343742246,
                -2.094431632968593,
                -1.706060437888304
              ],
              "variance": 0.34398591564254155,
              "mean_reward": -1.937233768293238,
              "min_reward": -2.094431632968593,
              "max_reward": -1.706060437888304,
              "num_responses": 7,
              "rvariance": 0.01908000269133134
            },
            {
              "id": "chat_hard_sample_55",
              "rewards": [
                -0.3005265890263056,
                -1.0125404466735022,
                -0.20805725686433196,
                -0.2519801896412694,
                -0.20805725686433196,
                -0.3860607212761311,
                -0.31208525554655225
              ],
              "variance": 0.4285953545707475,
              "mean_reward": -0.38275824512748924,
              "min_reward": -1.0125404466735022,
              "max_reward": -0.20805725686433196,
              "num_responses": 7,
              "rvariance": 0.06950528783590146
            }
          ]
        },
        "semantic_benchmark_reasoning_filtered.json": {
          "file_name": "semantic_benchmark_reasoning_filtered.json",
          "processed_samples": 200,
          "global_mean": 0.004518677838950534,
          "global_std": 1.4384692662030714,
          "mean_variance": 0.7627793007283853,
          "mean_rvariance": 0.16700046945868968,
          "sample_results": [
            {
              "id": "reasoning_sample_9",
              "rewards": [
                1.658781579991156,
                1.615332615547882,
                1.952062089983257,
                0.2439746753070393,
                0.44492613585718255,
                1.9846488133157127,
                1.8977508844291644
              ],
              "variance": 1.600551227679114,
              "mean_reward": 1.3996395420616277,
              "min_reward": 0.2439746753070393,
              "max_reward": 1.9846488133157127,
              "num_responses": 7,
              "rvariance": 0.46517692833003715
            },
            {
              "id": "reasoning_sample_5",
              "rewards": [
                1.5501591688829706,
                0.19237903003065118,
                1.5718836511046077,
                1.349207708332827,
                0.5834197100201192
              ],
              "variance": 1.2143985561895145,
              "mean_reward": 1.0494098536742351,
              "min_reward": 0.19237903003065118,
              "max_reward": 1.5718836511046077,
              "num_responses": 5,
              "rvariance": 0.31305122919984185
            },
            {
              "id": "reasoning_sample_85",
              "rewards": [
                -0.8395338754971114,
                -0.6440135355023775,
                -2.0669671210196077,
                -0.27062399731798964
              ],
              "variance": 1.3160962885895529,
              "mean_reward": -0.9552846323342715,
              "min_reward": -2.0669671210196077,
              "max_reward": -0.27062399731798964,
              "num_responses": 4,
              "rvariance": 0.45372151855545667
            },
            {
              "id": "reasoning_sample_65",
              "rewards": [
                1.9737865722048942,
                1.8108529555426158,
                1.2948965027787345,
                1.1591184888935024,
                1.9846488133157127,
                0.6540242772404398,
                2.1584446710888097
              ],
              "variance": 1.0970863521926744,
              "mean_reward": 1.5765388972949583,
              "min_reward": 0.6540242772404398,
              "max_reward": 2.1584446710888097,
              "num_responses": 7,
              "rvariance": 0.260353183742304
            },
            {
              "id": "reasoning_sample_256",
              "rewards": [
                -0.2570461959294665,
                -1.893171263246511,
                -0.22445947259701082,
                -2.023518156576334
              ],
              "variance": 1.7501785989806393,
              "mean_reward": -1.0995487720873305,
              "min_reward": -2.023518156576334,
              "max_reward": -0.22445947259701082,
              "num_responses": 4,
              "rvariance": 0.7397869887154467
            },
            {
              "id": "reasoning_sample_263",
              "rewards": [
                0.2358279944739254,
                0.5535485469653681,
                -0.3127151816224116,
                0.6268686744633933,
                -0.8775517193849763,
                0.40690829196931766
              ],
              "variance": 1.1853420612180747,
              "mean_reward": 0.10548110114410279,
              "min_reward": -0.8775517193849763,
              "max_reward": 0.6268686744633933,
              "num_responses": 6,
              "rvariance": 0.2869499597905291
            },
            {
              "id": "reasoning_sample_203",
              "rewards": [
                -0.46207099689616665,
                -1.22514343493117,
                -0.9807430099377527,
                -1.5890285121435914,
                -1.5890285121435914,
                -0.9807430099377527
              ],
              "variance": 0.8676215087266317,
              "mean_reward": -1.137792912665004,
              "min_reward": -1.5890285121435914,
              "max_reward": -0.46207099689616665,
              "num_responses": 6,
              "rvariance": 0.15346444959289302
            },
            {
              "id": "reasoning_sample_61",
              "rewards": [
                -0.07340643214969028,
                -0.6059956916145125,
                -1.3120413638177186,
                0.3267992637770308,
                -0.021386480579910806,
                -0.46750211745157594,
                -0.19730386981996442
              ],
              "variance": 1.006301777658661,
              "mean_reward": -0.3358338130937631,
              "min_reward": -1.3120413638177186,
              "max_reward": 0.3267992637770308,
              "num_responses": 7,
              "rvariance": 0.23847479428710372
            },
            {
              "id": "reasoning_sample_319",
              "rewards": [
                0.18287456905868496,
                0.008230098698805408,
                -0.9698807688269341,
                0.5861352702978238,
                0.059656021457837,
                0.001886719612604728
              ],
              "variance": 0.868501944285419,
              "mean_reward": -0.021849681616863043,
              "min_reward": -0.9698807688269341,
              "max_reward": 0.5861352702978238,
              "num_responses": 6,
              "rvariance": 0.21973867540782407
            },
            {
              "id": "reasoning_sample_528",
              "rewards": [
                -1.3337658460393556,
                -0.10769038065571136,
                -0.22717503287471544,
                -2.0017936743546967,
                -1.3337658460393556,
                -1.3337658460393556,
                -1.1382455060446217
              ],
              "variance": 1.4215958053783782,
              "mean_reward": -1.0680288760068304,
              "min_reward": -2.0017936743546967,
              "max_reward": -0.10769038065571136,
              "num_responses": 7,
              "rvariance": 0.3882829566652851
            },
            {
              "id": "reasoning_sample_551",
              "rewards": [
                -0.16675381669578723,
                -0.19051496912570284,
                -0.13688265364103622,
                -0.21902835204160154,
                -0.6114268121699218,
                0.7898022911256717,
                -0.8775517193849763
              ],
              "variance": 0.9516680993215909,
              "mean_reward": -0.20176514741905058,
              "min_reward": -0.8775517193849763,
              "max_reward": 0.7898022911256717,
              "num_responses": 7,
              "rvariance": 0.23051089594591345
            },
            {
              "id": "reasoning_sample_596",
              "rewards": [
                -2.403696595454983,
                -1.8714467810248738,
                -1.502130583257043,
                -1.502130583257043,
                -1.8714467810248738,
                -1.5238550654786802,
                -0.8449649960525207
              ],
              "variance": 0.8450823584216836,
              "mean_reward": -1.6456673407928597,
              "min_reward": -2.403696595454983,
              "max_reward": -0.8449649960525207,
              "num_responses": 7,
              "rvariance": 0.1962470198577519
            },
            {
              "id": "reasoning_sample_456",
              "rewards": [
                -0.8612583577187485,
                -0.2964218199561837,
                -1.59989075325441,
                -1.7845488521383255
              ],
              "variance": 1.2632786411881978,
              "mean_reward": -1.1355299457669168,
              "min_reward": -1.7845488521383255,
              "max_reward": -0.2964218199561837,
              "num_responses": 4,
              "rvariance": 0.3540459627925103
            },
            {
              "id": "reasoning_sample_306",
              "rewards": [
                -1.4369571365921316,
                -1.9474824688006038,
                -2.045242638797971,
                -2.1212783265737007,
                -1.9583447099114224,
                -0.9318629249390691,
                -0.7634981877213816
              ],
              "variance": 1.2111398838562688,
              "mean_reward": -1.6006666276194683,
              "min_reward": -2.1212783265737007,
              "max_reward": -0.7634981877213816,
              "num_responses": 7,
              "rvariance": 0.2702641994260667
            },
            {
              "id": "reasoning_sample_231",
              "rewards": [
                0.48022841946734285,
                -1.0947965416013474,
                0.4883751003004568,
                -0.1558915755849687,
                -0.13348820329390543,
                0.8115267733473087,
                0.4367794550240687
              ],
              "variance": 1.1490893315107178,
              "mean_reward": 0.11896191823699365,
              "min_reward": -1.0947965416013474,
              "max_reward": 0.8115267733473087,
              "num_responses": 7,
              "rvariance": 0.35144553642472764
            },
            {
              "id": "reasoning_sample_526",
              "rewards": [
                -1.3446280871501741,
                -1.502130583257043,
                -1.59989075325441,
                -0.03267302798412071,
                -0.7580670671659723
              ],
              "variance": 1.237956041598602,
              "mean_reward": -1.047477903762344,
              "min_reward": -1.59989075325441,
              "max_reward": -0.03267302798412071,
              "num_responses": 5,
              "rvariance": 0.3427509629971483
            },
            {
              "id": "reasoning_sample_591",
              "rewards": [
                -1.4912683421462245,
                -0.6657380177240145,
                -1.719375405473414,
                -0.15860713586267333,
                0.06440825194382012
              ],
              "variance": 1.6033346769637609,
              "mean_reward": -0.7941161298525011,
              "min_reward": -1.719375405473414,
              "max_reward": 0.06440825194382012,
              "num_responses": 5,
              "rvariance": 0.4999085338965924
            },
            {
              "id": "reasoning_sample_23",
              "rewards": [
                0.48022841946734285,
                0.757215567793216,
                -0.16403825641808262,
                -0.0866447885035004,
                0.757215567793216,
                0.4204860933578408
              ],
              "variance": 0.8825570902540074,
              "mean_reward": 0.36074376724833873,
              "min_reward": -0.16403825641808262,
              "max_reward": 0.757215567793216,
              "num_responses": 6,
              "rvariance": 0.1346296995134342
            },
            {
              "id": "reasoning_sample_275",
              "rewards": [
                -0.053379175101618576,
                -1.360921448816402,
                -1.2360056760419886,
                -1.1925567115987143,
                -1.2360056760419886,
                -0.48651103939550844
              ],
              "variance": 1.028518455180632,
              "mean_reward": -0.9275632878327035,
              "min_reward": -1.360921448816402,
              "max_reward": -0.053379175101618576,
              "num_responses": 6,
              "rvariance": 0.23450319547030665
            },
            {
              "id": "reasoning_sample_656",
              "rewards": [
                -0.8069471521646557,
                -0.6358668546692635,
                -1.7519621288058698,
                -1.4912683421462245
              ],
              "variance": 0.9865630488900949,
              "mean_reward": -1.1715111194465035,
              "min_reward": -1.7519621288058698,
              "max_reward": -0.6358668546692635,
              "num_responses": 4,
              "rvariance": 0.21474743009099406
            },
            {
              "id": "reasoning_sample_405",
              "rewards": [
                -0.752635946610563,
                0.14893006558737698,
                0.14960895565680313,
                -0.27877067815110357,
                0.10819666142180741,
                0.25212135614015324
              ],
              "variance": 0.7165684682793114,
              "mean_reward": -0.06209159765925431,
              "min_reward": -0.752635946610563,
              "max_reward": 0.25212135614015324,
              "num_responses": 6,
              "rvariance": 0.1234794099902145
            },
            {
              "id": "reasoning_sample_330",
              "rewards": [
                -0.9047073221620228,
                -1.7628243699166883,
                -1.6324774765868657,
                -0.9264318043836599,
                -1.339196966594765,
                -1.7628243699166883
              ],
              "variance": 0.847254806643847,
              "mean_reward": -1.3880770515934484,
              "min_reward": -1.7628243699166883,
              "max_reward": -0.9047073221620228,
              "num_responses": 6,
              "rvariance": 0.13162576087155956
            },
            {
              "id": "reasoning_sample_451",
              "rewards": [
                0.015273583169101814,
                -0.22853281301356776,
                0.028766523298946738,
                -0.04862694461563546,
                -0.20680833079193067,
                -0.37517306800961825,
                -0.8341027549417022
              ],
              "variance": 0.5794157020034916,
              "mean_reward": -0.23560054355777224,
              "min_reward": -0.8341027549417022,
              "max_reward": 0.028766523298946738,
              "num_responses": 7,
              "rvariance": 0.07805017587786943
            },
            {
              "id": "reasoning_sample_314",
              "rewards": [
                0.0779860533323433,
                -0.3276507631497871,
                -0.2366794938466817,
                -1.2685923993744443
              ],
              "variance": 0.969896297685683,
              "mean_reward": -0.43873415075964245,
              "min_reward": -1.2685923993744443,
              "max_reward": 0.0779860533323433,
              "num_responses": 4,
              "rvariance": 0.25220752137349634
            },
            {
              "id": "reasoning_sample_593",
              "rewards": [
                -1.6107529943652286,
                0.2847080794726089,
                -1.59989075325441,
                0.3349459446101447,
                0.6322997950188026
              ],
              "variance": 2.1197663527762405,
              "mean_reward": -0.3917379857036165,
              "min_reward": -1.6107529943652286,
              "max_reward": 0.6322997950188026,
              "num_responses": 5,
              "rvariance": 0.9959865782196925
            },
            {
              "id": "reasoning_sample_599",
              "rewards": [
                -0.42405315300830176,
                0.795233411681081,
                1.1265317655610467,
                0.8712690994568109,
                1.1265317655610467,
                1.1265317655610467,
                1.1265317655610467
              ],
              "variance": 0.8190129797557187,
              "mean_reward": 0.8212252029105395,
              "min_reward": -0.42405315300830176,
              "max_reward": 1.1265317655610467,
              "num_responses": 7,
              "rvariance": 0.2752495053289506
            },
            {
              "id": "reasoning_sample_301",
              "rewards": [
                -0.9535874071607062,
                -1.0676409388243011,
                -1.0676409388243011,
                -1.6650641999193214,
                -1.0296230949364362,
                -0.3072840610670023,
                -0.5652622874489429
              ],
              "variance": 0.8445392463661426,
              "mean_reward": -0.9508718468830015,
              "min_reward": -1.6650641999193214,
              "max_reward": -0.3072840610670023,
              "num_responses": 7,
              "rvariance": 0.15806426607388735
            },
            {
              "id": "reasoning_sample_77",
              "rewards": [
                1.3872255522206922,
                1.9955110544265313,
                2.5277608688566406,
                2.4300006988592733,
                2.4517251810809104,
                2.440862939970092,
                2.75586793218383
              ],
              "variance": 0.8668068406433207,
              "mean_reward": 2.2841363182282812,
              "min_reward": 1.3872255522206922,
              "max_reward": 2.75586793218383,
              "num_responses": 7,
              "rvariance": 0.17765182583008968
            },
            {
              "id": "reasoning_sample_511",
              "rewards": [
                -0.7797915493876094,
                0.6540242772404398,
                -1.1491077471554403,
                -1.1491077471554403,
                0.7029043622391232,
                0.6784643197397815,
                0.7029043622391232
              ],
              "variance": 1.8520121093945634,
              "mean_reward": -0.048529960320003195,
              "min_reward": -1.1491077471554403,
              "max_reward": 0.7029043622391232,
              "num_responses": 7,
              "rvariance": 0.7298138090843465
            },
            {
              "id": "reasoning_sample_12",
              "rewards": [
                1.4632612399964222,
                1.539296927772152,
                0.9418736666771315,
                1.2514475383354602,
                0.9255803050109036,
                0.9744603900095871
              ],
              "variance": 0.5675520980402695,
              "mean_reward": 1.1826533446336094,
              "min_reward": 0.9255803050109036,
              "max_reward": 1.539296927772152,
              "num_responses": 6,
              "rvariance": 0.06301229746561605
            },
            {
              "id": "reasoning_sample_543",
              "rewards": [
                -0.41590647217518784,
                0.6540242772404398,
                0.8712690994568109,
                -0.6521602163354914,
                0.8332512555689459,
                0.9853226311204056,
                1.0776516805623633
              ],
              "variance": 1.5326622207364982,
              "mean_reward": 0.4790646079197552,
              "min_reward": -0.6521602163354914,
              "max_reward": 1.0776516805623633,
              "num_responses": 7,
              "rvariance": 0.42930427675015936
            },
            {
              "id": "reasoning_sample_506",
              "rewards": [
                -1.893171263246511,
                -1.0947965416013474,
                -0.8558272371633393,
                -2.371109872122527,
                -1.0839343004905289,
                -2.132140567684519,
                -1.1979878321541237
              ],
              "variance": 1.2350368143000694,
              "mean_reward": -1.518423944923271,
              "min_reward": -2.371109872122527,
              "max_reward": -0.8558272371633393,
              "num_responses": 7,
              "rvariance": 0.30773029479329367
            },
            {
              "id": "reasoning_sample_531",
              "rewards": [
                0.2575524766955625,
                -0.8178093932754743,
                -0.8775517193849763,
                -0.8449649960525207,
                0.7626466883486253,
                0.8332512555689459,
                0.7843711705702624
              ],
              "variance": 1.6619228899552387,
              "mean_reward": 0.013927926067203547,
              "min_reward": -0.8775517193849763,
              "max_reward": 0.8332512555689459,
              "num_responses": 7,
              "rvariance": 0.5870037423196516
            },
            {
              "id": "reasoning_sample_274",
              "rewards": [
                0.21681907252999294,
                0.3607437672483388,
                0.6132908730748702,
                -0.6141423724476265,
                0.16590231732303096
              ],
              "variance": 0.8143965272836211,
              "mean_reward": 0.1485227315457213,
              "min_reward": -0.6141423724476265,
              "max_reward": 0.6132908730748702,
              "num_responses": 5,
              "rvariance": 0.16953433888359307
            },
            {
              "id": "reasoning_sample_597",
              "rewards": [
                0.09258218982500573,
                -0.4131909118974832,
                -0.4131909118974832,
                0.11973779260205211,
                -0.4131909118974832,
                -0.4131909118974832,
                -1.1708322293770774
              ],
              "variance": 0.819691869825145,
              "mean_reward": -0.37303941350570746,
              "min_reward": -1.1708322293770774,
              "max_reward": 0.11973779260205211,
              "num_responses": 7,
              "rvariance": 0.15750782867086027
            },
            {
              "id": "reasoning_sample_73",
              "rewards": [
                1.495847963328878,
                1.615332615547882,
                1.3600699494436457,
                1.4523989988856036,
                0.8278201350135366,
                1.5936081333262448,
                1.8217151966534344
              ],
              "variance": 0.550715624318501,
              "mean_reward": 1.4523989988856036,
              "min_reward": 0.8278201350135366,
              "max_reward": 1.8217151966534344,
              "num_responses": 7,
              "rvariance": 0.0833418657285119
            },
            {
              "id": "reasoning_sample_412",
              "rewards": [
                -1.007898612714799,
                -1.3011791227069,
                -1.3011791227069,
                -1.284885761040672,
                -2.2733497021251603,
                -1.3011791227069
              ],
              "variance": 0.6408722255382946,
              "mean_reward": -1.4116119073335553,
              "min_reward": -2.2733497021251603,
              "max_reward": -1.007898612714799,
              "num_responses": 6,
              "rvariance": 0.15970369452327762
            },
            {
              "id": "reasoning_sample_491",
              "rewards": [
                -0.4349153941191203,
                -0.35344858578798116,
                -0.8232405138308836,
                -0.7852226699430187,
                -0.7689293082767908,
                -0.7417737054997444,
                -1.339196966594765
              ],
              "variance": 0.6272944241497713,
              "mean_reward": -0.7495324491503291,
              "min_reward": -1.339196966594765,
              "max_reward": -0.35344858578798116,
              "num_responses": 7,
              "rvariance": 0.08724480973881775
            },
            {
              "id": "reasoning_sample_64",
              "rewards": [
                0.8658379789014016,
                0.795233411681081,
                1.4849857222180594,
                1.0667894394515447,
                1.0667894394515447,
                0.8604068583459923,
                1.5067102044396963
              ],
              "variance": 0.6593380354266862,
              "mean_reward": 1.0923932934984741,
              "min_reward": 0.795233411681081,
              "max_reward": 1.5067102044396963,
              "num_responses": 7,
              "rvariance": 0.0743639206417992
            },
            {
              "id": "reasoning_sample_535",
              "rewards": [
                0.7191977239053511,
                -0.30321072065044535,
                -0.27469733773454663,
                -0.36159526662109504,
                -0.38060418856502753,
                -0.4186220324528925
              ],
              "variance": 0.6218633035943621,
              "mean_reward": -0.16992197035310933,
              "min_reward": -0.4186220324528925,
              "max_reward": 0.7191977239053511,
              "num_responses": 6,
              "rvariance": 0.16037582829089406
            },
            {
              "id": "reasoning_sample_548",
              "rewards": [
                -0.9318629249390691,
                -0.14842378482128094,
                -0.3670263871765043,
                -1.3826459310380392,
                -0.4213375927305971,
                -0.4213375927305971,
                -0.6032801313368079
              ],
              "variance": 0.8325907811442421,
              "mean_reward": -0.610844906396128,
              "min_reward": -1.3826459310380392,
              "max_reward": -0.14842378482128094,
              "num_responses": 7,
              "rvariance": 0.14912763193538278
            },
            {
              "id": "reasoning_sample_235",
              "rewards": [
                0.9907537516758149,
                0.11227000183836436,
                0.6974732416837139,
                0.6377309155742119,
                0.6485931566850305
              ],
              "variance": 0.5509871803462711,
              "mean_reward": 0.6173642134914271,
              "min_reward": 0.11227000183836436,
              "max_reward": 0.9907537516758149,
              "num_responses": 5,
              "rvariance": 0.08046948314312202
            },
            {
              "id": "reasoning_sample_156",
              "rewards": [
                -0.5055199613394409,
                -1.1110899032675752,
                -0.7689293082767908,
                -1.2522990377082164,
                -0.5218133230056687,
                -0.7689293082767908
              ],
              "variance": 0.6680278283153409,
              "mean_reward": -0.8214301403124139,
              "min_reward": -1.2522990377082164,
              "max_reward": -0.5055199613394409,
              "num_responses": 6,
              "rvariance": 0.07743882302315659
            },
            {
              "id": "reasoning_sample_587",
              "rewards": [
                -0.7797915493876094,
                0.40690829196931766,
                -0.2502572952352049,
                0.6974732416837139,
                0.45850393724570576,
                0.45850393724570576,
                0.5454018661322542
              ],
              "variance": 1.0683014132490047,
              "mean_reward": 0.21953463280769756,
              "min_reward": -0.7797915493876094,
              "max_reward": 0.6974732416837139,
              "num_responses": 7,
              "rvariance": 0.24332765525129205
            },
            {
              "id": "reasoning_sample_594",
              "rewards": [
                -0.6603068971686052,
                0.035046256441138714,
                -1.5129928243678616,
                -0.9970363716039805,
                -1.5890285121435914,
                0.035046256441138714,
                -0.08732367857292657
              ],
              "variance": 1.5784533559192921,
              "mean_reward": -0.6823708244249553,
              "min_reward": -1.5890285121435914,
              "max_reward": 0.035046256441138714,
              "num_responses": 7,
              "rvariance": 0.4278454192256295
            },
            {
              "id": "reasoning_sample_622",
              "rewards": [
                0.0579587962842716,
                0.5236773839106171,
                0.11023333163008588,
                0.13806782447655844,
                -0.3127151816224116,
                -0.3643108268987997,
                -0.3127151816224116
              ],
              "variance": 0.6256650879831489,
              "mean_reward": -0.022829121977441413,
              "min_reward": -0.3643108268987997,
              "max_reward": 0.5236773839106171,
              "num_responses": 7,
              "rvariance": 0.09049530037175492
            },
            {
              "id": "reasoning_sample_647",
              "rewards": [
                0.03402792133699947,
                0.6404464758519165,
                -0.10836927072513752,
                -0.10836927072513752,
                -0.06933309173313333
              ],
              "variance": 0.5062483247710873,
              "mean_reward": 0.0776805528011015,
              "min_reward": -0.10836927072513752,
              "max_reward": 0.6404464758519165,
              "num_responses": 5,
              "rvariance": 0.08189062434570085
            },
            {
              "id": "reasoning_sample_395",
              "rewards": [
                -0.46207099689616665,
                -0.32629298301093473,
                -0.9535874071607062,
                -0.27062399731798964,
                -0.812378272720065,
                -0.44034651467452957
              ],
              "variance": 0.5845243497759234,
              "mean_reward": -0.544216695296732,
              "min_reward": -0.9535874071607062,
              "max_reward": -0.27062399731798964,
              "num_responses": 6,
              "rvariance": 0.06322927504835052
            },
            {
              "id": "reasoning_sample_252",
              "rewards": [
                0.8821313405676293,
                1.1482562477826839,
                1.2623097794462788,
                1.2623097794462788,
                1.1373940066718653,
                0.055922126075993124
              ],
              "variance": 0.7932830461244675,
              "mean_reward": 0.9580538799984547,
              "min_reward": 0.055922126075993124,
              "max_reward": 1.2623097794462788,
              "num_responses": 6,
              "rvariance": 0.17884817664540217
            },
            {
              "id": "reasoning_sample_497",
              "rewards": [
                -0.6575913368909007,
                -0.2366794938466817,
                -0.19051496912570284,
                0.2290390937796638,
                0.1604711967676217,
                0.1604711967676217,
                -0.19051496912570284
              ],
              "variance": 0.5929425866368079,
              "mean_reward": -0.10361704023915443,
              "min_reward": -0.6575913368909007,
              "max_reward": 0.2290390937796638,
              "num_responses": 7,
              "rvariance": 0.08426299076449083
            },
            {
              "id": "reasoning_sample_87",
              "rewards": [
                -0.04930583468506162,
                0.08579328913074415,
                0.3498815261375202,
                0.3498815261375202,
                -0.28284401856766056,
                0.27656139863949497,
                0.23990133489048238
              ],
              "variance": 0.4926026343756214,
              "mean_reward": 0.13855274595471997,
              "min_reward": -0.28284401856766056,
              "max_reward": 0.3498815261375202,
              "num_responses": 7,
              "rvariance": 0.047755324445217504
            },
            {
              "id": "reasoning_sample_299",
              "rewards": [
                1.0559271983407261,
                0.8821313405676293,
                1.539296927772152,
                0.8929935816784479,
                1.5501591688829706,
                1.0396338366744984,
                1.1482562477826839
              ],
              "variance": 0.6549931389823589,
              "mean_reward": 1.158342614528444,
              "min_reward": 0.8821313405676293,
              "max_reward": 1.5501591688829706,
              "num_responses": 7,
              "rvariance": 0.0671473720499049
            },
            {
              "id": "reasoning_sample_303",
              "rewards": [
                -0.4484931955076435,
                -0.9427251660498877,
                -1.1545388677108495,
                -0.9427251660498877,
                -1.969206951022241
              ],
              "variance": 0.9971537339731431,
              "mean_reward": -1.091537869268102,
              "min_reward": -1.969206951022241,
              "max_reward": -0.4484931955076435,
              "num_responses": 5,
              "rvariance": 0.24641380732037116
            },
            {
              "id": "reasoning_sample_509",
              "rewards": [
                -0.42676871328600635,
                -0.005273449088374299,
                -0.6412979752246728,
                -0.4349153941191203,
                -0.8015160316092464,
                -0.7146181027226981,
                0.031821528611364454
              ],
              "variance": 0.7589418162688387,
              "mean_reward": -0.42750973391982194,
              "min_reward": -0.8015160316092464,
              "max_reward": 0.031821528611364454,
              "num_responses": 7,
              "rvariance": 0.0939059171642206
            },
            {
              "id": "reasoning_sample_572",
              "rewards": [
                -0.8829828399403856,
                -0.09207590905890968,
                0.21817685266884526,
                -1.3174724843731278,
                0.08918773947787494,
                -0.1457082245435763,
                -1.3935081721488576
              ],
              "variance": 1.4886701442376826,
              "mean_reward": -0.5034832911311624,
              "min_reward": -1.3935081721488576,
              "max_reward": 0.21817685266884526,
              "num_responses": 7,
              "rvariance": 0.39543627843708495
            },
            {
              "id": "reasoning_sample_557",
              "rewards": [
                -0.6358668546692635,
                0.5698419086315959,
                0.5698419086315959,
                -1.203418952709533,
                0.6431620361296212,
                0.599713071686347,
                -1.2740235199298535
              ],
              "variance": 1.8487534370613177,
              "mean_reward": -0.10439291460421285,
              "min_reward": -1.2740235199298535,
              "max_reward": 0.6431620361296212,
              "num_responses": 7,
              "rvariance": 0.6888781960486688
            },
            {
              "id": "reasoning_sample_678",
              "rewards": [
                -0.02758135246342451,
                0.6567398375181444,
                0.1217744628103306,
                -0.13688265364103622,
                0.061013801596689315,
                0.061013801596689315,
                0.4965217811335707
              ],
              "variance": 0.6319108766218694,
              "mean_reward": 0.17608566836442335,
              "min_reward": -0.13688265364103622,
              "max_reward": 0.6567398375181444,
              "num_responses": 7,
              "rvariance": 0.07179570496211726
            },
            {
              "id": "reasoning_sample_53",
              "rewards": [
                2.8644903432920157,
                2.6255210388540076,
                3.0600106832867495,
                2.4300006988592733,
                2.994837236621838,
                3.1686330943949352,
                2.994837236621838
              ],
              "variance": 0.5561467448739101,
              "mean_reward": 2.8769043331329507,
              "min_reward": 2.4300006988592733,
              "max_reward": 3.1686330943949352,
              "num_responses": 7,
              "rvariance": 0.058502924454008766
            },
            {
              "id": "reasoning_sample_75",
              "rewards": [
                0.43406389474636403,
                0.18015900878098032,
                0.3267992637770308,
                0.3132214623885076,
                0.816957893902718,
                0.3906149303030898
              ],
              "variance": 0.37882065873979703,
              "mean_reward": 0.4103027423164485,
              "min_reward": 0.18015900878098032,
              "max_reward": 0.816957893902718,
              "num_responses": 6,
              "rvariance": 0.039280726424099605
            },
            {
              "id": "reasoning_sample_595",
              "rewards": [
                -2.696977105447084,
                -2.5449057298956244,
                -0.6195734930030357,
                -0.39961311050896,
                -0.3588797063433904
              ],
              "variance": 2.260975487216882,
              "mean_reward": -1.3239898290396188,
              "min_reward": -2.696977105447084,
              "max_reward": -0.3588797063433904,
              "num_responses": 5,
              "rvariance": 1.1315683878614524
            },
            {
              "id": "reasoning_sample_245",
              "rewards": [
                0.40962385224702225,
                0.6404464758519165,
                -0.36159526662109504,
                -0.301852940511593,
                0.7680778089040345
              ],
              "variance": 1.0547236118604815,
              "mean_reward": 0.23093998597405702,
              "min_reward": -0.36159526662109504,
              "max_reward": 0.7680778089040345,
              "num_responses": 5,
              "rvariance": 0.22462137164428803
            },
            {
              "id": "reasoning_sample_418",
              "rewards": [
                -1.2088500732649423,
                -0.9753118893823434,
                -0.5761245285597615,
                -0.6385824149469682,
                -0.5761245285597615,
                -0.9753118893823434,
                -1.990931433243878
              ],
              "variance": 0.9455580886967551,
              "mean_reward": -0.9916052510485712,
              "min_reward": -1.990931433243878,
              "max_reward": -0.5761245285597615,
              "num_responses": 7,
              "rvariance": 0.2166075232569298
            },
            {
              "id": "reasoning_sample_60",
              "rewards": [
                0.10751777135238125,
                -0.5028044010617363,
                -0.46750211745157594,
                -0.24754173495750023,
                -0.21359723148619225,
                -0.30999962134470693
              ],
              "variance": 0.43211352918975054,
              "mean_reward": -0.27232122249155505,
              "min_reward": -0.5028044010617363,
              "max_reward": 0.10751777135238125,
              "num_responses": 6,
              "rvariance": 0.04016298841129468
            },
            {
              "id": "reasoning_sample_385",
              "rewards": [
                -0.7146181027226981,
                -0.3154307419001162,
                -0.3670263871765043,
                0.5100995825220939,
                -0.790653790498428,
                -0.8992762016066135,
                0.18151678891983264
              ],
              "variance": 1.1470526613024394,
              "mean_reward": -0.3421984074946333,
              "min_reward": -0.8992762016066135,
              "max_reward": 0.5100995825220939,
              "num_responses": 7,
              "rvariance": 0.23602381940999625
            },
            {
              "id": "reasoning_sample_243",
              "rewards": [
                0.914718063900085,
                0.8441134966797644,
                0.30779034183309834,
                0.37160600835915736,
                0.7354910855715789,
                1.072220560006954
              ],
              "variance": 0.6537711368573917,
              "mean_reward": 0.7076565927251064,
              "min_reward": 0.30779034183309834,
              "max_reward": 1.072220560006954,
              "num_responses": 6,
              "rvariance": 0.07799993309491064
            },
            {
              "id": "reasoning_sample_71",
              "rewards": [
                0.9744603900095871,
                0.2439746753070393,
                1.1211006450056376,
                0.9364425461217222,
                1.0450649572299078,
                1.050496077785317,
                1.3980877933315108
              ],
              "variance": 0.5724401065401379,
              "mean_reward": 0.9670895835415317,
              "min_reward": 0.2439746753070393,
              "max_reward": 1.3980877933315108,
              "num_responses": 7,
              "rvariance": 0.10662920089727528
            },
            {
              "id": "reasoning_sample_218",
              "rewards": [
                0.5209618236329124,
                0.7463533266823974,
                0.629584234741098,
                0.09393996996385805,
                -0.19730386981996442,
                0.09665553024156269,
                0.04030765447919145
              ],
              "variance": 0.7310288267580887,
              "mean_reward": 0.27578552427443653,
              "min_reward": -0.19730386981996442,
              "max_reward": 0.7463533266823974,
              "num_responses": 7,
              "rvariance": 0.10730539490152857
            },
            {
              "id": "reasoning_sample_32",
              "rewards": [
                -0.34122856453831024,
                0.12313224294918292,
                -0.08596589843407423,
                -0.07408532221911644
              ],
              "variance": 0.32861673810573255,
              "mean_reward": -0.09453688556057951,
              "min_reward": -0.34122856453831024,
              "max_reward": 0.12313224294918292,
              "num_responses": 4,
              "rvariance": 0.027182090561620957
            },
            {
              "id": "reasoning_sample_55",
              "rewards": [
                0.6866110005728954,
                0.3471659658598156,
                0.7246288444607604,
                0.4014771714139084,
                0.30914812197195063,
                0.5046684619666846,
                0.3607437672483388
              ],
              "variance": 0.3698593098233718,
              "mean_reward": 0.47634904764205055,
              "min_reward": 0.30914812197195063,
              "max_reward": 0.7246288444607604,
              "num_responses": 7,
              "rvariance": 0.024324247493549677
            },
            {
              "id": "reasoning_sample_403",
              "rewards": [
                -0.331724103566344,
                -1.0839343004905289,
                -1.3283347254839464,
                -1.3337658460393556,
                -1.1436766266000309,
                -1.4152326543704947,
                -0.9916052510485712
              ],
              "variance": 0.6386997773161311,
              "mean_reward": -1.0897533582284675,
              "min_reward": -1.4152326543704947,
              "max_reward": -0.331724103566344,
              "num_responses": 7,
              "rvariance": 0.11565470248538598
            },
            {
              "id": "reasoning_sample_580",
              "rewards": [
                1.0342027161190892,
                0.07187604270750787,
                0.05524323600656696,
                0.18966346975294657
              ],
              "variance": 0.7206078641923974,
              "mean_reward": 0.33774636614652764,
              "min_reward": 0.05524323600656696,
              "max_reward": 1.0342027161190892,
              "num_responses": 4,
              "rvariance": 0.16436875976146495
            },
            {
              "id": "reasoning_sample_530",
              "rewards": [
                -2.5883546943388986,
                -1.6650641999193214,
                -1.4695438599245874,
                -0.7689293082767908,
                -1.3880770515934484
              ],
              "variance": 1.202450090967614,
              "mean_reward": -1.5759938228106094,
              "min_reward": -2.5883546943388986,
              "max_reward": -0.7689293082767908,
              "num_responses": 5,
              "rvariance": 0.34616110088052643
            },
            {
              "id": "reasoning_sample_318",
              "rewards": [
                0.5046684619666846,
                0.23990133489048238,
                0.0898666295473011,
                0.22768131364081148,
                -0.03504914322711227,
                0.5779885894647099,
                0.08171994871418718
              ],
              "variance": 0.49898420102822727,
              "mean_reward": 0.24096816214243774,
              "min_reward": -0.03504914322711227,
              "max_reward": 0.5779885894647099,
              "num_responses": 7,
              "rvariance": 0.043953644931361634
            },
            {
              "id": "reasoning_sample_76",
              "rewards": [
                0.6485931566850305,
                0.5481174264099589,
                0.2358279944739254,
                0.1706545478090141,
                0.45850393724570576,
                0.4177705330801362,
                0.43406389474636403
              ],
              "variance": 0.37854910271202663,
              "mean_reward": 0.41621878435001924,
              "min_reward": 0.1706545478090141,
              "max_reward": 0.6485931566850305,
              "num_responses": 7,
              "rvariance": 0.023763803154289293
            },
            {
              "id": "reasoning_sample_393",
              "rewards": [
                -0.58698676967058,
                0.25076357600130095,
                -0.11923151183595607,
                -0.31407296176126387,
                -0.08392922822579577,
                -0.7037558616118795
              ],
              "variance": 0.7287884895289823,
              "mean_reward": -0.2595354595173624,
              "min_reward": -0.7037558616118795,
              "max_reward": 0.25076357600130095,
              "num_responses": 6,
              "rvariance": 0.10307638619396146
            },
            {
              "id": "reasoning_sample_642",
              "rewards": [
                0.5942819511309377,
                0.5644107880761867,
                0.816957893902718,
                0.5236773839106171,
                0.4829439797450475,
                0.8984247022338572
              ],
              "variance": 0.35438061624045525,
              "mean_reward": 0.6467827831665607,
              "min_reward": 0.4829439797450475,
              "max_reward": 0.8984247022338572,
              "num_responses": 6,
              "rvariance": 0.023970466586349163
            },
            {
              "id": "reasoning_sample_16",
              "rewards": [
                0.26705693766752875,
                0.03368847630228639,
                0.16929676767016177,
                0.6105753127971655,
                0.6268686744633933,
                0.5589796675207774
              ],
              "variance": 0.5172293716440554,
              "mean_reward": 0.37774430607021886,
              "min_reward": 0.03368847630228639,
              "max_reward": 0.6268686744633933,
              "num_responses": 6,
              "rvariance": 0.05386599477452547
            },
            {
              "id": "reasoning_sample_260",
              "rewards": [
                0.8495446172351737,
                0.5291085044660264,
                1.012478233897452,
                0.3851838097476805,
                1.1048072833394098,
                1.349207708332827,
                1.1645496094489118
              ],
              "variance": 0.7668742224237899,
              "mean_reward": 0.9135542523524974,
              "min_reward": 0.3851838097476805,
              "max_reward": 1.349207708332827,
              "num_responses": 7,
              "rvariance": 0.10431819572174288
            },
            {
              "id": "reasoning_sample_582",
              "rewards": [
                -0.3941819899535507,
                -1.1816944704878958,
                -1.1816944704878958,
                -0.3941819899535507,
                0.33087260419358777
              ],
              "variance": 1.2225452370226282,
              "mean_reward": -0.564176063337861,
              "min_reward": -1.1816944704878958,
              "max_reward": 0.33087260419358777,
              "num_responses": 5,
              "rvariance": 0.324313210711927
            },
            {
              "id": "reasoning_sample_295",
              "rewards": [
                -0.5842712093928754,
                0.12652669329631372,
                0.3037170014165414,
                -1.2142811938203515,
                -0.15928602593209948,
                -0.5353911243941919
              ],
              "variance": 1.114398048963041,
              "mean_reward": -0.3438309764711105,
              "min_reward": -1.2142811938203515,
              "max_reward": 0.3037170014165414,
              "num_responses": 6,
              "rvariance": 0.2544669894513334
            },
            {
              "id": "reasoning_sample_366",
              "rewards": [
                -1.0893654210459383,
                -0.6358668546692635,
                -1.5455795477003174,
                -1.502130583257043,
                -1.4695438599245874,
                -0.6385824149469682,
                -1.1165210238229846
              ],
              "variance": 0.8820139781984665,
              "mean_reward": -1.142512815052443,
              "min_reward": -1.5455795477003174,
              "max_reward": -0.6358668546692635,
              "num_responses": 7,
              "rvariance": 0.13041046150144478
            },
            {
              "id": "reasoning_sample_286",
              "rewards": [
                -0.9970363716039805,
                -1.1165210238229846,
                -1.1599699882662589,
                -1.1436766266000309,
                -1.105658782712166,
                -1.1599699882662589,
                -0.18236828829258891
              ],
              "variance": 0.48880084998683526,
              "mean_reward": -0.9807430099377527,
              "min_reward": -1.1599699882662589,
              "max_reward": -0.18236828829258891,
              "num_responses": 7,
              "rvariance": 0.10892846744271574
            },
            {
              "id": "reasoning_sample_356",
              "rewards": [
                -0.8884139604957949,
                -1.990931433243878,
                -0.9644496482715248,
                -0.7309114643889258,
                -0.6793158191125378,
                -0.6793158191125378
              ],
              "variance": 0.7983747216451634,
              "mean_reward": -0.9888896907708663,
              "min_reward": -1.990931433243878,
              "max_reward": -0.6793158191125378,
              "num_responses": 6,
              "rvariance": 0.2121675118373757
            },
            {
              "id": "reasoning_sample_343",
              "rewards": [
                0.1353522641988538,
                0.12924225357401836,
                0.6540242772404398,
                0.6350153552965073,
                0.08171994871418718
              ],
              "variance": 0.5456918378047472,
              "mean_reward": 0.32707081980480124,
              "min_reward": 0.08171994871418718,
              "max_reward": 0.6540242772404398,
              "num_responses": 5,
              "rvariance": 0.06756351927876034
            },
            {
              "id": "reasoning_sample_205",
              "rewards": [
                0.27656139863949497,
                -0.2013772102365214,
                -0.32493520287208244,
                -0.692893620501061,
                0.3960460508584991,
                0.3960460508584991,
                0.3960460508584991
              ],
              "variance": 0.8681646207821729,
              "mean_reward": 0.03507050251504678,
              "min_reward": -0.692893620501061,
              "max_reward": 0.3960460508584991,
              "num_responses": 7,
              "rvariance": 0.16638161222741438
            },
            {
              "id": "reasoning_sample_512",
              "rewards": [
                -0.053039730066905495,
                -0.6738846985571285,
                -1.0350542154918454,
                -1.0350542154918454,
                -0.6684535780017192,
                1.0559271983407261
              ],
              "variance": 1.5364979496287559,
              "mean_reward": -0.4015932065447863,
              "min_reward": -1.0350542154918454,
              "max_reward": 1.0559271983407261,
              "num_responses": 6,
              "rvariance": 0.5322930118018894
            },
            {
              "id": "reasoning_sample_226",
              "rewards": [
                -0.39961311050896,
                0.04641766510402689,
                -0.2869173589842175,
                -0.5951334505036939,
                0.04607822006931381,
                -0.1728638273206227,
                -0.1728638273206227
              ],
              "variance": 0.5240352445900526,
              "mean_reward": -0.21927081278068233,
              "min_reward": -0.5951334505036939,
              "max_reward": 0.04641766510402689,
              "num_responses": 7,
              "rvariance": 0.04623997358762628
            },
            {
              "id": "reasoning_sample_225",
              "rewards": [
                -0.08902090374649196,
                0.4394950153017733,
                0.5046684619666846,
                0.4394950153017733,
                0.22768131364081148,
                -0.1470660046824286
              ],
              "variance": 0.5901251928486893,
              "mean_reward": 0.2292088162970204,
              "min_reward": -0.1470660046824286,
              "max_reward": 0.5046684619666846,
              "num_responses": 6,
              "rvariance": 0.06786230271044057
            },
            {
              "id": "reasoning_sample_508",
              "rewards": [
                -1.719375405473414,
                -0.9318629249390691,
                -0.6440135355023775,
                -0.8938450810512042,
                -0.9644496482715248
              ],
              "variance": 0.6734589488707502,
              "mean_reward": -1.030709319047518,
              "min_reward": -1.719375405473414,
              "max_reward": -0.6440135355023775,
              "num_responses": 5,
              "rvariance": 0.13133747616932945
            },
            {
              "id": "reasoning_sample_585",
              "rewards": [
                -0.7200492232781074,
                -0.6087112518922172,
                0.48022841946734285,
                -0.10497482037800672,
                0.48022841946734285
              ],
              "variance": 1.1557424541910941,
              "mean_reward": -0.09465569132272914,
              "min_reward": -0.7200492232781074,
              "max_reward": 0.48022841946734285,
              "num_responses": 5,
              "rvariance": 0.26329203105325527
            },
            {
              "id": "reasoning_sample_574",
              "rewards": [
                -0.8775517193849763,
                0.5236773839106171,
                -0.9753118893823434,
                -0.9590185277161155,
                0.5589796675207774,
                0.19645237044720815,
                -0.9861741304931619
              ],
              "variance": 1.517455083181352,
              "mean_reward": -0.3598495492997135,
              "min_reward": -0.9861741304931619,
              "max_reward": 0.5589796675207774,
              "num_responses": 7,
              "rvariance": 0.4760620245685429
            },
            {
              "id": "reasoning_sample_520",
              "rewards": [
                -0.7254803438335166,
                -1.3772148104826298,
                -1.3066102432623092,
                -1.67592644103014,
                -1.5455795477003174,
                -1.4586816188137688,
                -1.556441788811136
              ],
              "variance": 0.5300773662079457,
              "mean_reward": -1.3779906848476884,
              "min_reward": -1.67592644103014,
              "max_reward": -0.7254803438335166,
              "num_responses": 7,
              "rvariance": 0.08372472566381757
            },
            {
              "id": "reasoning_sample_238",
              "rewards": [
                0.7680778089040345,
                1.0233404750082706,
                -0.13348820329390543,
                0.45035725641259183,
                0.2548369164178579
              ],
              "variance": 0.8993935639757764,
              "mean_reward": 0.4726248506897699,
              "min_reward": -0.13348820329390543,
              "max_reward": 1.0233404750082706,
              "num_responses": 5,
              "rvariance": 0.1611761227329627
            },
            {
              "id": "reasoning_sample_630",
              "rewards": [
                -1.2468679171528072,
                -0.6005645710591032,
                -1.0241919743810268,
                -0.9210006838282506,
                -1.0241919743810268
              ],
              "variance": 0.4290585238773328,
              "mean_reward": -0.963363424160443,
              "min_reward": -1.2468679171528072,
              "max_reward": -0.6005645710591032,
              "num_responses": 5,
              "rvariance": 0.04423852643416678
            },
            {
              "id": "reasoning_sample_233",
              "rewards": [
                0.09597664017213653,
                0.2005257108637651,
                0.2005257108637651,
                -1.2197123143757609,
                0.06983937249922939,
                -0.24211061440209097,
                -0.5924178902259893
              ],
              "variance": 1.043861370749663,
              "mean_reward": -0.21248191208642073,
              "min_reward": -1.2197123143757609,
              "max_reward": 0.2005257108637651,
              "num_responses": 7,
              "rvariance": 0.23939212431474136
            },
            {
              "id": "reasoning_sample_394",
              "rewards": [
                -0.3004951603727407,
                0.019601507361693582,
                -0.025374959737789495,
                -0.39689755023125534,
                -0.39689755023125534,
                -0.32629298301093473,
                -0.5136666421725548
              ],
              "variance": 0.4362208141097788,
              "mean_reward": -0.27714619119926237,
              "min_reward": -0.5136666421725548,
              "max_reward": 0.019601507361693582,
              "num_responses": 7,
              "rvariance": 0.03414731868690323
            },
            {
              "id": "reasoning_sample_284",
              "rewards": [
                0.4612194975234104,
                0.7300599650161697,
                0.8767002200122201,
                0.7137666033499418,
                1.0993761627840004,
                0.8929935816784479,
                0.9853226311204056
              ],
              "variance": 0.4181962827665142,
              "mean_reward": 0.8227769516406566,
              "min_reward": 0.4612194975234104,
              "max_reward": 1.0993761627840004,
              "num_responses": 7,
              "rvariance": 0.03742425768561742
            },
            {
              "id": "reasoning_sample_207",
              "rewards": [
                -0.2964218199561837,
                -0.9753118893823434,
                -1.2740235199298535,
                -1.556441788811136,
                -1.2740235199298535,
                -1.1491077471554403,
                -1.0024674921593897
              ],
              "variance": 0.6832349658704873,
              "mean_reward": -1.0753996824748857,
              "min_reward": -1.556441788811136,
              "max_reward": -0.2964218199561837,
              "num_responses": 7,
              "rvariance": 0.13398291792608588
            },
            {
              "id": "reasoning_sample_345",
              "rewards": [
                0.07866494340176947,
                -0.021895648131980427,
                0.3037170014165414,
                -0.15792824579324716,
                0.9038558227892665,
                0.9635981488987685
              ],
              "variance": 1.0236389328066313,
              "mean_reward": 0.3450020037635197,
              "min_reward": -0.15792824579324716,
              "max_reward": 0.9635981488987685,
              "num_responses": 6,
              "rvariance": 0.192528564307074
            },
            {
              "id": "reasoning_sample_565",
              "rewards": [
                -1.426094895481313,
                0.5100995825220939,
                0.9092869433446757,
                -0.6983247410564702,
                -0.9047073221620228,
                -0.8558272371633393,
                0.9418736666771315
              ],
              "variance": 2.035583984167397,
              "mean_reward": -0.2176705719027492,
              "min_reward": -1.426094895481313,
              "max_reward": 0.9418736666771315,
              "num_responses": 7,
              "rvariance": 0.8164009545475013
            },
            {
              "id": "reasoning_sample_78",
              "rewards": [
                2.5820720744107333,
                2.7232812088513745,
                2.2779293233078137,
                2.7232812088513745,
                2.90793930773529,
                2.636383279964826,
                2.6472455210756447
              ],
              "variance": 0.33672947443537504,
              "mean_reward": 2.6425902748852934,
              "min_reward": 2.2779293233078137,
              "max_reward": 2.90793930773529,
              "num_responses": 7,
              "rvariance": 0.031447489025738996
            },
            {
              "id": "reasoning_sample_601",
              "rewards": [
                -1.893171263246511,
                -1.2522990377082164,
                -1.0350542154918454,
                -1.2740235199298535
              ],
              "variance": 0.607199278094757,
              "mean_reward": -1.3636370090941066,
              "min_reward": -1.893171263246511,
              "max_reward": -1.0350542154918454,
              "num_responses": 4,
              "rvariance": 0.10219997497118159
            },
            {
              "id": "reasoning_sample_539",
              "rewards": [
                -1.1165210238229846,
                0.3498815261375202,
                -1.59989075325441,
                0.6187219936302795,
                0.18966346975294657,
                0.5535485469653681
              ],
              "variance": 1.944341158836521,
              "mean_reward": -0.16743270676521335,
              "min_reward": -1.59989075325441,
              "max_reward": 0.6187219936302795,
              "num_responses": 6,
              "rvariance": 0.7476149274266132
            },
            {
              "id": "reasoning_sample_603",
              "rewards": [
                -1.0404853360472546,
                -1.3935081721488576,
                -1.67592644103014,
                -1.3935081721488576,
                -1.3935081721488576,
                -1.3935081721488576
              ],
              "variance": 0.3177205524914428,
              "mean_reward": -1.381740744278804,
              "min_reward": -1.67592644103014,
              "max_reward": -1.0404853360472546,
              "num_responses": 6,
              "rvariance": 0.033925727875843026
            },
            {
              "id": "reasoning_sample_339",
              "rewards": [
                0.9255803050109036,
                0.6567398375181444,
                0.6404464758519165,
                0.7517844472378067,
                0.04166543461804377,
                0.15164562586508162
              ],
              "variance": 0.7420268458827924,
              "mean_reward": 0.5279770210169827,
              "min_reward": 0.04166543461804377,
              "max_reward": 0.9255803050109036,
              "num_responses": 6,
              "rvariance": 0.10258860911689134
            },
            {
              "id": "reasoning_sample_447",
              "rewards": [
                -0.08596589843407423,
                0.05829824131898468,
                0.05829824131898468,
                0.05829824131898468,
                0.027239020642737876,
                -0.31814630217782086,
                0.05829824131898468
              ],
              "variance": 0.23713630125055754,
              "mean_reward": -0.02052574495617407,
              "min_reward": -0.31814630217782086,
              "max_reward": 0.05829824131898468,
              "num_responses": 7,
              "rvariance": 0.01714210940715419
            },
            {
              "id": "reasoning_sample_44",
              "rewards": [
                1.3274832261111902,
                1.713092785545249,
                1.8651641610967087,
                1.8543019199858901,
                1.7565417499885232,
                1.713092785545249,
                2.169306912199628
              ],
              "variance": 0.4279722997662512,
              "mean_reward": 1.771283362924634,
              "min_reward": 1.3274832261111902,
              "max_reward": 2.169306912199628,
              "num_responses": 7,
              "rvariance": 0.05401094200550064
            },
            {
              "id": "reasoning_sample_266",
              "rewards": [
                -0.6195734930030357,
                -0.8829828399403856,
                -0.008232985484778963,
                -0.9753118893823434,
                -0.8286716343862929,
                -0.527244443561078,
                -0.31950408231667315
              ],
              "variance": 0.7249188161332534,
              "mean_reward": -0.5945030525820839,
              "min_reward": -0.9753118893823434,
              "max_reward": -0.008232985484778963,
              "num_responses": 7,
              "rvariance": 0.101080022185044
            },
            {
              "id": "reasoning_sample_529",
              "rewards": [
                -1.165401108821668,
                -0.22174391231930618,
                -1.59989075325441,
                -0.301852940511593,
                -0.301852940511593,
                -0.24346839454094327,
                -0.301852940511593
              ],
              "variance": 1.1044183649424764,
              "mean_reward": -0.5908661414958722,
              "min_reward": -1.59989075325441,
              "max_reward": -0.22174391231930618,
              "num_responses": 7,
              "rvariance": 0.2651062002150997
            },
            {
              "id": "reasoning_sample_466",
              "rewards": [
                -0.8829828399403856,
                -0.7309114643889258,
                -0.38060418856502753,
                -0.5679778477266476,
                -0.6847469396679471,
                -0.752635946610563,
                -0.33308188370519637
              ],
              "variance": 0.44317943732139703,
              "mean_reward": -0.6189915872292419,
              "min_reward": -0.8829828399403856,
              "max_reward": -0.33308188370519637,
              "num_responses": 7,
              "rvariance": 0.035082476229908136
            },
            {
              "id": "reasoning_sample_349",
              "rewards": [
                -1.0622098182688917,
                -0.9753118893823434,
                -1.0024674921593897,
                -0.8178093932754743,
                -1.5238550654786802,
                -0.7743604288322001
              ],
              "variance": 0.4969475308199487,
              "mean_reward": -1.0260023478994966,
              "min_reward": -1.5238550654786802,
              "max_reward": -0.7743604288322001,
              "num_responses": 6,
              "rvariance": 0.059826613852977974
            },
            {
              "id": "reasoning_sample_206",
              "rewards": [
                -1.3500592077055835,
                -1.8823090221356924,
                -1.8714467810248738,
                -1.8823090221356924
              ],
              "variance": 0.37583354243432177,
              "mean_reward": -1.7465310082504606,
              "min_reward": -1.8823090221356924,
              "max_reward": -1.3500592077055835,
              "num_responses": 4,
              "rvariance": 0.05241629425609051
            },
            {
              "id": "reasoning_sample_516",
              "rewards": [
                -1.67592644103014,
                -1.9800691921330595,
                -1.360921448816402,
                -0.5516844860604198,
                -1.1545388677108495,
                -1.1545388677108495,
                -0.9535874071607062
              ],
              "variance": 1.0047573027507162,
              "mean_reward": -1.261609530088918,
              "min_reward": -1.9800691921330595,
              "max_reward": -0.5516844860604198,
              "num_responses": 7,
              "rvariance": 0.18850072795914533
            },
            {
              "id": "reasoning_sample_542",
              "rewards": [
                0.20459905128032208,
                1.0939450422285912,
                1.0613583188961355,
                0.816957893902718,
                0.8006645322364903,
                1.0613583188961355,
                0.9581670283433592
              ],
              "variance": 0.5121546683750947,
              "mean_reward": 0.8567214551119645,
              "min_reward": 0.20459905128032208,
              "max_reward": 1.0939450422285912,
              "num_responses": 7,
              "rvariance": 0.0829008393761481
            },
            {
              "id": "reasoning_sample_151",
              "rewards": [
                -0.18644162870914588,
                -0.3222196425943778,
                -0.6847469396679471,
                -0.43219983384141564
              ],
              "variance": 0.3818077750452722,
              "mean_reward": -0.4064020112032216,
              "min_reward": -0.6847469396679471,
              "max_reward": -0.18644162870914588,
              "num_responses": 4,
              "rvariance": 0.033402666976610054
            },
            {
              "id": "reasoning_sample_223",
              "rewards": [
                0.5562641072430727,
                0.055582681041280044,
                0.659455397795849,
                0.4367794550240687,
                0.659455397795849,
                0.4177705330801362,
                0.2439746753070393
              ],
              "variance": 0.4908375201951134,
              "mean_reward": 0.43275460675532784,
              "min_reward": 0.055582681041280044,
              "max_reward": 0.659455397795849,
              "num_responses": 7,
              "rvariance": 0.042311191422783154
            },
            {
              "id": "reasoning_sample_452",
              "rewards": [
                -0.7254803438335166,
                -0.1321304231550531,
                -0.10225926010030208,
                -0.6684535780017192
              ],
              "variance": 0.59715170506725,
              "mean_reward": -0.40708090127264773,
              "min_reward": -0.7254803438335166,
              "max_reward": -0.10225926010030208,
              "num_responses": 4,
              "rvariance": 0.08455196987692196
            },
            {
              "id": "reasoning_sample_68",
              "rewards": [
                0.6160064333525748,
                0.9744603900095871,
                1.0233404750082706,
                1.3111898644449622,
                0.9418736666771315,
                1.0342027161190892,
                1.2025674533367767
              ],
              "variance": 0.4344896444327422,
              "mean_reward": 1.0148058569926273,
              "min_reward": 0.6160064333525748,
              "max_reward": 1.3111898644449622,
              "num_responses": 7,
              "rvariance": 0.04136211659568388
            },
            {
              "id": "reasoning_sample_552",
              "rewards": [
                -0.06356252614301097,
                1.0939450422285912,
                0.9364425461217222,
                0.5073840222443893,
                0.9364425461217222,
                0.9364425461217222,
                0.6404464758519165
              ],
              "variance": 0.7204381416750406,
              "mean_reward": 0.7125058075067219,
              "min_reward": -0.06356252614301097,
              "max_reward": 1.0939450422285912,
              "num_responses": 7,
              "rvariance": 0.13506977586448443
            },
            {
              "id": "reasoning_sample_209",
              "rewards": [
                0.6431620361296212,
                0.6920421211283047,
                0.7137666033499418,
                0.46393505780111505
              ],
              "variance": 0.18954610738378375,
              "mean_reward": 0.6282264546022457,
              "min_reward": 0.46393505780111505,
              "max_reward": 0.7137666033499418,
              "num_responses": 4,
              "rvariance": 0.009651072750092644
            },
            {
              "id": "reasoning_sample_391",
              "rewards": [
                -1.2903168815960815,
                -0.9210006838282506,
                -1.1382455060446217,
                -1.1219521443783937,
                -0.35344858578798116,
                -0.36159526662109504,
                -0.8938450810512042
              ],
              "variance": 0.8407374619773561,
              "mean_reward": -0.8686291641868039,
              "min_reward": -1.2903168815960815,
              "max_reward": -0.35344858578798116,
              "num_responses": 7,
              "rvariance": 0.12007986503952475
            },
            {
              "id": "reasoning_sample_210",
              "rewards": [
                2.3865517344159994,
                2.397413975526818,
                1.4089500344423294,
                1.0450649572299078,
                2.3756894933051806,
                1.441536757774785,
                1.2623097794462788
              ],
              "variance": 1.2154847803005964,
              "mean_reward": 1.759645247448757,
              "min_reward": 1.0450649572299078,
              "max_reward": 2.397413975526818,
              "num_responses": 7,
              "rvariance": 0.30877412989992925
            },
            {
              "id": "reasoning_sample_465",
              "rewards": [
                0.531824064743731,
                1.2731720205570973,
                0.7898022911256717,
                0.9310114255663129,
                1.365501069999055,
                1.365501069999055,
                1.2731720205570973
              ],
              "variance": 0.6788900694261596,
              "mean_reward": 1.0757119946497171,
              "min_reward": 0.531824064743731,
              "max_reward": 1.365501069999055,
              "num_responses": 7,
              "rvariance": 0.0920618619437175
            },
            {
              "id": "reasoning_sample_396",
              "rewards": [
                0.2792769589171996,
                0.20324127114146975,
                0.45850393724570576,
                0.08511439906131799,
                -0.023338289529511013,
                0.2982858808611321,
                0.42320165363554546
              ],
              "variance": 0.3955892434546232,
              "mean_reward": 0.24632654447612276,
              "min_reward": -0.023338289529511013,
              "max_reward": 0.45850393724570576,
              "num_responses": 7,
              "rvariance": 0.02580776742841669
            },
            {
              "id": "reasoning_sample_348",
              "rewards": [
                -0.3670263871765043,
                0.22768131364081148,
                -0.0968281395448928,
                -0.5435378052273059,
                -0.38060418856502753,
                -0.0968281395448928,
                0.04200487965275685
              ],
              "variance": 0.5620530884779176,
              "mean_reward": -0.17359120953786503,
              "min_reward": -0.5435378052273059,
              "max_reward": 0.22768131364081148,
              "num_responses": 7,
              "rvariance": 0.062345496351137564
            },
            {
              "id": "reasoning_sample_83",
              "rewards": [
                0.8658379789014016,
                1.2188608150030045,
                1.2623097794462788,
                1.1156695244502284,
                1.3166209850003716,
                1.495847963328878,
                1.1319628861164561
              ],
              "variance": 0.3725748701010767,
              "mean_reward": 1.2010157046066599,
              "min_reward": 0.8658379789014016,
              "max_reward": 1.495847963328878,
              "num_responses": 7,
              "rvariance": 0.0326803461759058
            },
            {
              "id": "reasoning_sample_242",
              "rewards": [
                0.6051441922417562,
                1.0613583188961355,
                1.0613583188961355,
                0.21817685266884526,
                0.9527359077879499,
                0.8929935816784479,
                1.0776516805623633
              ],
              "variance": 0.6175184071500347,
              "mean_reward": 0.8384884075330905,
              "min_reward": 0.21817685266884526,
              "max_reward": 1.0776516805623633,
              "num_responses": 7,
              "rvariance": 0.08740004559702051
            },
            {
              "id": "reasoning_sample_269",
              "rewards": [
                0.9473047872325407,
                0.21274573211343598,
                0.02231706763939822,
                0.21274573211343598,
                0.21274573211343598
              ],
              "variance": 0.5549926317558855,
              "mean_reward": 0.3215718102424494,
              "min_reward": 0.02231706763939822,
              "max_reward": 0.9473047872325407,
              "num_responses": 5,
              "rvariance": 0.10332490106122541
            },
            {
              "id": "reasoning_sample_694",
              "rewards": [
                -0.37517306800961825,
                0.028257355746877117,
                -1.3066102432623092,
                -0.527244443561078,
                0.028257355746877117,
                -0.38875086939814146
              ],
              "variance": 0.9451846991585707,
              "mean_reward": -0.4235439854562321,
              "min_reward": -1.3066102432623092,
              "max_reward": 0.028257355746877117,
              "num_responses": 6,
              "rvariance": 0.20039316851538322
            },
            {
              "id": "reasoning_sample_18",
              "rewards": [
                0.5182462633552078,
                0.8604068583459923,
                0.9201491844554943,
                0.6567398375181444,
                1.0287715955636798,
                1.0667894394515447
              ],
              "variance": 0.46028746707093615,
              "mean_reward": 0.8418505297816772,
              "min_reward": 0.5182462633552078,
              "max_reward": 1.0667894394515447,
              "num_responses": 6,
              "rvariance": 0.0384996173682938
            },
            {
              "id": "reasoning_sample_230",
              "rewards": [
                -1.556441788811136,
                -1.4478193777029502,
                -1.3772148104826298,
                -0.8992762016066135,
                -1.3772148104826298
              ],
              "variance": 0.42254117921084156,
              "mean_reward": -1.3315933978171919,
              "min_reward": -1.556441788811136,
              "max_reward": -0.8992762016066135,
              "num_responses": 5,
              "rvariance": 0.051025212411905274
            },
            {
              "id": "reasoning_sample_237",
              "rewards": [
                0.7789400500148531,
                0.39876161113620373,
                0.26026803697326717,
                0.5644107880761867,
                0.7735089294594438
              ],
              "variance": 0.46110213515424764,
              "mean_reward": 0.5551778831319909,
              "min_reward": 0.26026803697326717,
              "max_reward": 0.7789400500148531,
              "num_responses": 5,
              "rvariance": 0.04185221343173699
            },
            {
              "id": "reasoning_sample_312",
              "rewards": [
                -0.4077597913420739,
                -1.0296230949364362,
                -1.0513475771580731,
                -1.1382455060446217,
                -0.49465772022862237,
                -0.49465772022862237
              ],
              "variance": 0.6435877858159993,
              "mean_reward": -0.7693819016564083,
              "min_reward": -1.1382455060446217,
              "max_reward": -0.4077597913420739,
              "num_responses": 6,
              "rvariance": 0.09416796364561902
            },
            {
              "id": "reasoning_sample_47",
              "rewards": [
                1.4849857222180594,
                0.3553126466929295,
                1.0016159927866335,
                0.9092869433446757,
                1.0016159927866335,
                1.0016159927866335,
                1.0016159927866335
              ],
              "variance": 0.5072666598752268,
              "mean_reward": 0.9651498976288855,
              "min_reward": 0.3553126466929295,
              "max_reward": 1.4849857222180594,
              "num_responses": 7,
              "rvariance": 0.09293864731442938
            },
            {
              "id": "reasoning_sample_2",
              "rewards": [
                0.8821313405676293,
                0.8658379789014016,
                1.2623097794462788,
                1.284034261667916,
                0.17201232794786642,
                1.0613583188961355,
                1.012478233897452
              ],
              "variance": 0.6826918538149461,
              "mean_reward": 0.9343088916178114,
              "min_reward": 0.17201232794786642,
              "max_reward": 1.284034261667916,
              "num_responses": 7,
              "rvariance": 0.12009303337456376
            },
            {
              "id": "reasoning_sample_58",
              "rewards": [
                1.1971363327813673,
                1.4089500344423294,
                1.3763633111098736,
                1.6261948566587006,
                1.1211006450056376,
                1.349207708332827,
                1.2242919355584139
              ],
              "variance": 0.3291259056578024,
              "mean_reward": 1.329034974841307,
              "min_reward": 1.1211006450056376,
              "max_reward": 1.6261948566587006,
              "num_responses": 7,
              "rvariance": 0.024134623468987922
            },
            {
              "id": "reasoning_sample_308",
              "rewards": [
                -0.5761245285597615,
                -0.2869173589842175,
                -0.3480174652325719,
                -0.8612583577187485,
                -0.2665506569014327,
                -0.45120875578534814,
                -0.3480174652325719
              ],
              "variance": 0.4114073820722527,
              "mean_reward": -0.44829922691637886,
              "min_reward": -0.8612583577187485,
              "max_reward": -0.2665506569014327,
              "num_responses": 7,
              "rvariance": 0.03801036146629668
            },
            {
              "id": "reasoning_sample_59",
              "rewards": [
                1.3817944316652828,
                0.9581670283433592,
                1.3383454672220085,
                1.1482562477826839,
                0.9364425461217222,
                1.1211006450056376,
                0.8984247022338572
              ],
              "variance": 0.4344896444327422,
              "mean_reward": 1.111790152624936,
              "min_reward": 0.8984247022338572,
              "max_reward": 1.3817944316652828,
              "num_responses": 7,
              "rvariance": 0.03221682078253252
            },
            {
              "id": "reasoning_sample_219",
              "rewards": [
                1.2242919355584139,
                1.2623097794462788,
                0.9418736666771315,
                0.8875624611230386,
                1.1428251272272747,
                1.1319628861164561,
                1.1536873683380933
              ],
              "variance": 0.31934988865806546,
              "mean_reward": 1.1063590320695267,
              "min_reward": 0.8875624611230386,
              "max_reward": 1.2623097794462788,
              "num_responses": 7,
              "rvariance": 0.016768783581565572
            },
            {
              "id": "reasoning_sample_216",
              "rewards": [
                -1.2197123143757609,
                -0.5652622874489429,
                -1.0676409388243011,
                -0.9698807688269341
              ],
              "variance": 0.4874430698479828,
              "mean_reward": -0.9556240773689847,
              "min_reward": -1.2197123143757609,
              "max_reward": -0.5652622874489429,
              "num_responses": 4,
              "rvariance": 0.05871898861413818
            },
            {
              "id": "reasoning_sample_201",
              "rewards": [
                -0.4729332380069852,
                -0.7091869821672888,
                -0.6277201738361496,
                -0.2651928767625804,
                -0.28420179870651285
              ],
              "variance": 0.40380381329467974,
              "mean_reward": -0.47184701389590344,
              "min_reward": -0.7091869821672888,
              "max_reward": -0.2651928767625804,
              "num_responses": 5,
              "rvariance": 0.03170890831788605
            },
            {
              "id": "reasoning_sample_550",
              "rewards": [
                -1.3717836899272207,
                -2.0669671210196077,
                -0.41590647217518784,
                -2.0669671210196077,
                -2.0669671210196077,
                -0.41590647217518784,
                -1.3717836899272207
              ],
              "variance": 1.6510606488444197,
              "mean_reward": -1.3966116696090916,
              "min_reward": -2.0669671210196077,
              "max_reward": -0.41590647217518784,
              "num_responses": 7,
              "rvariance": 0.4675610742007574
            },
            {
              "id": "reasoning_sample_34",
              "rewards": [
                0.9527359077879499,
                0.4965217811335707,
                1.0667894394515447,
                1.2351541766692324,
                1.0830828011177727,
                1.1482562477826839,
                1.0939450422285912
              ],
              "variance": 0.41276516221110504,
              "mean_reward": 1.0109264851673352,
              "min_reward": 0.4965217811335707,
              "max_reward": 1.2351541766692324,
              "num_responses": 7,
              "rvariance": 0.05033644979621445
            },
            {
              "id": "reasoning_sample_618",
              "rewards": [
                -0.3778886282873229,
                -0.4539243160630528,
                -0.003618654544148035,
                -0.7743604288322001,
                -0.39961311050896,
                -0.5788400888374662
              ],
              "variance": 0.48584661741909774,
              "mean_reward": -0.4313742045121916,
              "min_reward": -0.7743604288322001,
              "max_reward": -0.003618654544148035,
              "num_responses": 6,
              "rvariance": 0.05445642152148975
            },
            {
              "id": "reasoning_sample_257",
              "rewards": [
                0.19237903003065118,
                0.6757487594620768,
                -0.4349153941191203,
                -0.31407296176126387,
                0.5345396250214356
              ],
              "variance": 1.005843526861798,
              "mean_reward": 0.13073581172675589,
              "min_reward": -0.4349153941191203,
              "max_reward": 0.6757487594620768,
              "num_responses": 5,
              "rvariance": 0.196342530168028
            },
            {
              "id": "reasoning_sample_527",
              "rewards": [
                -0.3154307419001162,
                -0.36159526662109504,
                0.5698419086315959,
                0.19237903003065118,
                0.5698419086315959,
                0.5698419086315959,
                0.5698419086315959
              ],
              "variance": 0.9037384604201036,
              "mean_reward": 0.2563886651479748,
              "min_reward": -0.36159526662109504,
              "max_reward": 0.5698419086315959,
              "num_responses": 7,
              "rvariance": 0.15799865014157868
            },
            {
              "id": "reasoning_sample_66",
              "rewards": [
                -1.3663525693718113,
                -1.0187608538256177,
                -1.0893654210459383,
                -1.1599699882662589,
                -1.0893654210459383,
                -1.0676409388243011,
                -1.0730720593797103
              ],
              "variance": 0.19443411588365223,
              "mean_reward": -1.1235038931085108,
              "min_reward": -1.3663525693718113,
              "max_reward": -1.0187608538256177,
              "num_responses": 7,
              "rvariance": 0.011324467143036018
            },
            {
              "id": "reasoning_sample_292",
              "rewards": [
                1.7999907144317973,
                1.4849857222180594,
                1.952062089983257,
                1.6913683033236118,
                1.952062089983257,
                1.3003276233341436,
                1.6913683033236118
              ],
              "variance": 0.540939607318764,
              "mean_reward": 1.6960235495139628,
              "min_reward": 1.3003276233341436,
              "max_reward": 1.952062089983257,
              "num_responses": 7,
              "rvariance": 0.049010887567373006
            },
            {
              "id": "reasoning_sample_390",
              "rewards": [
                -0.0513425048933401,
                0.3607437672483388,
                -0.2163127917638969,
                -0.26383509662372806,
                -0.26383509662372806,
                0.531824064743731
              ],
              "variance": 0.710119012619763,
              "mean_reward": 0.016207057014562782,
              "min_reward": -0.26383509662372806,
              "max_reward": 0.531824064743731,
              "num_responses": 6,
              "rvariance": 0.10000701372949093
            },
            {
              "id": "reasoning_sample_414",
              "rewards": [
                -0.36159526662109504,
                -0.1375615437104624,
                0.19237903003065118,
                0.2141035122522883,
                0.2141035122522883,
                0.19237903003065118
              ],
              "variance": 0.463681917418067,
              "mean_reward": 0.052301379039053575,
              "min_reward": -0.36159526662109504,
              "max_reward": 0.2141035122522883,
              "num_responses": 6,
              "rvariance": 0.0498269533271776
            },
            {
              "id": "reasoning_sample_384",
              "rewards": [
                0.6431620361296212,
                0.3498815261375202,
                0.3498815261375202,
                0.4394950153017733,
                0.2358279944739254,
                0.3498815261375202,
                0.6513087169627351
              ],
              "variance": 0.3421605949907844,
              "mean_reward": 0.43134833446865933,
              "min_reward": 0.2358279944739254,
              "max_reward": 0.6513087169627351,
              "num_responses": 7,
              "rvariance": 0.021636101202499956
            },
            {
              "id": "reasoning_sample_586",
              "rewards": [
                -1.6976509232517771,
                0.026050963021242098,
                0.026050963021242098,
                -0.8884139604957949,
                0.026050963021242098,
                0.1455356152402462
              ],
              "variance": 1.3788257310045302,
              "mean_reward": -0.3937293965739333,
              "min_reward": -1.6976509232517771,
              "max_reward": 0.1455356152402462,
              "num_responses": 6,
              "rvariance": 0.4607295948981589
            },
            {
              "id": "reasoning_sample_652",
              "rewards": [
                -1.1816944704878958,
                -0.8938450810512042,
                -0.9807430099377527,
                -0.8666894782741578,
                -0.9210006838282506,
                -0.9427251660498877,
                -0.6901780602233563
              ],
              "variance": 0.2650386831039728,
              "mean_reward": -0.9252679928360721,
              "min_reward": -1.1816944704878958,
              "max_reward": -0.6901780602233563,
              "num_responses": 7,
              "rvariance": 0.01840587099361566
            },
            {
              "id": "reasoning_sample_389",
              "rewards": [
                0.09054551961672726,
                0.4747972989119336,
                0.49380622085586606,
                -0.024696069668363334,
                0.23039687391851613,
                0.24261689516818702,
                0.178801228642128
              ],
              "variance": 0.4379519837868156,
              "mean_reward": 0.24089542392071353,
              "min_reward": -0.024696069668363334,
              "max_reward": 0.49380622085586606,
              "num_responses": 7,
              "rvariance": 0.030826680803510916
            },
            {
              "id": "reasoning_sample_26",
              "rewards": [
                0.22496575336310687,
                -0.2801284582899559,
                0.02112901001790244,
                0.0732338228463602,
                0.061013801596689315,
                -0.07578254739268185
              ],
              "variance": 0.32705529094605246,
              "mean_reward": 0.004071897023570176,
              "min_reward": -0.2801284582899559,
              "max_reward": 0.22496575336310687,
              "num_responses": 6,
              "rvariance": 0.024042894600924566
            },
            {
              "id": "reasoning_sample_563",
              "rewards": [
                -0.5951334505036939,
                0.306432561694246,
                0.33766150488784935,
                -1.556441788811136,
                0.31593702266621226,
                0.0209592875005459,
                0.37975268919227123
              ],
              "variance": 1.3341547644362888,
              "mean_reward": -0.11297602476767214,
              "min_reward": -1.556441788811136,
              "max_reward": 0.37975268919227123,
              "num_responses": 7,
              "rvariance": 0.4485333709117157
            },
            {
              "id": "reasoning_sample_399",
              "rewards": [
                1.0342027161190892,
                0.34309262544325864,
                1.365501069999055,
                0.8332512555689459,
                1.3980877933315108,
                0.7300599650161697
              ],
              "variance": 0.8452181364355686,
              "mean_reward": 0.9506992375796716,
              "min_reward": 0.34309262544325864,
              "max_reward": 1.3980877933315108,
              "num_responses": 6,
              "rvariance": 0.13514190385200173
            },
            {
              "id": "reasoning_sample_428",
              "rewards": [
                -0.12398374232193919,
                0.1584345265593432,
                0.40690829196931766,
                0.07730716326291714,
                -0.17354271739004884
              ],
              "variance": 0.46123791316813284,
              "mean_reward": 0.069024704415918,
              "min_reward": -0.17354271739004884,
              "max_reward": 0.40690829196931766,
              "num_responses": 5,
              "rvariance": 0.043663849758396225
            },
            {
              "id": "reasoning_sample_39",
              "rewards": [
                0.4557883769680011,
                0.8441134966797644,
                1.0179093544528612,
                1.050496077785317,
                0.9744603900095871,
                0.9038558227892665,
                0.9201491844554943
              ],
              "variance": 0.34216059499078433,
              "mean_reward": 0.8809675290200415,
              "min_reward": 0.4557883769680011,
              "max_reward": 1.050496077785317,
              "num_responses": 7,
              "rvariance": 0.03434693065844327
            },
            {
              "id": "reasoning_sample_255",
              "rewards": [
                0.18966346975294657,
                -0.0019850753145913384,
                0.3335881644712924,
                0.5426863058545496,
                0.2792769589171996,
                0.9418736666771315,
                0.04709655517345305
              ],
              "variance": 0.6748973472053472,
              "mean_reward": 0.3331714350759974,
              "min_reward": -0.0019850753145913384,
              "max_reward": 0.9418736666771315,
              "num_responses": 7,
              "rvariance": 0.09029756221956975
            },
            {
              "id": "reasoning_sample_277",
              "rewards": [
                -0.6766002588348331,
                -0.5544000463381243,
                -1.1110899032675752,
                -1.3337658460393556,
                -0.5544000463381243,
                -0.49465772022862237,
                -0.31950408231667315
              ],
              "variance": 0.7755640153124448,
              "mean_reward": -0.7206311290519011,
              "min_reward": -1.3337658460393556,
              "max_reward": -0.31950408231667315,
              "num_responses": 7,
              "rvariance": 0.11393762684392746
            },
            {
              "id": "reasoning_sample_208",
              "rewards": [
                -1.0676409388243011,
                -1.3935081721488576,
                -0.6901780602233563,
                -0.6901780602233563,
                -1.203418952709533
              ],
              "variance": 0.6272944241497715,
              "mean_reward": -1.008984836825881,
              "min_reward": -1.3935081721488576,
              "max_reward": -0.6901780602233563,
              "num_responses": 5,
              "rvariance": 0.07847577614887938
            },
            {
              "id": "reasoning_sample_561",
              "rewards": [
                -1.8823090221356924,
                -2.0017936743546967,
                -2.186451773238612,
                -2.0017936743546967,
                -2.186451773238612,
                -2.186451773238612,
                -2.186451773238612
              ],
              "variance": 0.23245195977151734,
              "mean_reward": -2.0902433519713624,
              "min_reward": -2.186451773238612,
              "max_reward": -1.8823090221356924,
              "num_responses": 7,
              "rvariance": 0.013701088250877113
            },
            {
              "id": "reasoning_sample_640",
              "rewards": [
                0.6350153552965073,
                0.5046684619666846,
                0.9255803050109036,
                0.5454018661322542,
                0.5942819511309377,
                0.5942819511309377
              ],
              "variance": 0.2552626661042361,
              "mean_reward": 0.6332049817780375,
              "min_reward": 0.5046684619666846,
              "max_reward": 0.9255803050109036,
              "num_responses": 6,
              "rvariance": 0.018791272626605095
            },
            {
              "id": "reasoning_sample_320",
              "rewards": [
                -0.39961311050896,
                -0.8992762016066135,
                -0.752635946610563,
                -0.8829828399403856,
                -0.7091869821672888
              ],
              "variance": 0.36931619776783087,
              "mean_reward": -0.7287390161667622,
              "min_reward": -0.8992762016066135,
              "max_reward": -0.39961311050896,
              "num_responses": 5,
              "rvariance": 0.03243025917665516
            },
            {
              "id": "reasoning_sample_217",
              "rewards": [
                0.11702223232434748,
                0.27656139863949497,
                0.7843711705702624,
                -0.2937062596784791,
                0.8332512555689459,
                0.11023333163008588,
                0.3498815261375202
              ],
              "variance": 0.8552657094630758,
              "mean_reward": 0.3110878078845968,
              "min_reward": -0.2937062596784791,
              "max_reward": 0.8332512555689459,
              "num_responses": 7,
              "rvariance": 0.1347326664874857
            },
            {
              "id": "reasoning_sample_522",
              "rewards": [
                -0.8666894782741578,
                0.8441134966797644,
                0.7843711705702624,
                0.9201491844554943,
                0.7843711705702624,
                0.8006645322364903,
                0.8767002200122201
              ],
              "variance": 0.7701328947570354,
              "mean_reward": 0.5919543280357623,
              "min_reward": -0.8666894782741578,
              "max_reward": 0.9201491844554943,
              "num_responses": 7,
              "rvariance": 0.3568037883878237
            },
            {
              "id": "reasoning_sample_291",
              "rewards": [
                -0.7091869821672888,
                -0.4837954791178038,
                -0.7254803438335166,
                -0.4376309543968249,
                -0.3507330255102765
              ],
              "variance": 0.33347080210212954,
              "mean_reward": -0.5413653570051421,
              "min_reward": -0.7254803438335166,
              "max_reward": -0.3507330255102765,
              "num_responses": 5,
              "rvariance": 0.022495645836502477
            },
            {
              "id": "reasoning_sample_49",
              "rewards": [
                1.2948965027787345,
                1.6696438211019746,
                1.8434396788750715,
                1.8217151966534344,
                1.6696438211019746,
                1.7022305444344303,
                1.7239550266560675
              ],
              "variance": 0.3106600957694108,
              "mean_reward": 1.675074941657384,
              "min_reward": 1.2948965027787345,
              "max_reward": 1.8434396788750715,
              "num_responses": 7,
              "rvariance": 0.028224482589218957
            },
            {
              "id": "reasoning_sample_545",
              "rewards": [
                -0.2651928767625804,
                0.7843711705702624,
                1.0287715955636798,
                -0.6521602163354914,
                0.9527359077879499
              ],
              "variance": 1.4957306009597149,
              "mean_reward": 0.3697051161647641,
              "min_reward": -0.6521602163354914,
              "max_reward": 1.0287715955636798,
              "num_responses": 5,
              "rvariance": 0.47870913682265825
            },
            {
              "id": "reasoning_sample_37",
              "rewards": [
                0.5399707455768449,
                0.6024286319640516,
                0.6132908730748702,
                0.7898022911256717,
                0.816957893902718,
                0.8929935816784479,
                1.0233404750082706
              ],
              "variance": 0.3676868616012081,
              "mean_reward": 0.7541120703329821,
              "min_reward": 0.5399707455768449,
              "max_reward": 1.0233404750082706,
              "num_responses": 7,
              "rvariance": 0.02652719707413337
            },
            {
              "id": "reasoning_sample_248",
              "rewards": [
                -0.2516150753740572,
                0.2412591150293347,
                0.2412591150293347,
                -0.3276507631497871,
                0.33223038433244007,
                0.11905890253262595,
                0.10819666142180741
              ],
              "variance": 0.559676973234926,
              "mean_reward": 0.0661054771173855,
              "min_reward": -0.3276507631497871,
              "max_reward": 0.33223038433244007,
              "num_responses": 7,
              "rvariance": 0.05610658846742357
            },
            {
              "id": "reasoning_sample_28",
              "rewards": [
                0.12041668267147827,
                -0.3724575077319136,
                -0.3072840610670023,
                -0.2937062596784791,
                -0.09139701898948352,
                -0.07544310235796876,
                -0.28963291926192214
              ],
              "variance": 0.33625425138677695,
              "mean_reward": -0.1870720266307559,
              "min_reward": -0.3724575077319136,
              "max_reward": 0.12041668267147827,
              "num_responses": 7,
              "rvariance": 0.02669604805017111
            },
            {
              "id": "reasoning_sample_328",
              "rewards": [
                -0.6059956916145125,
                -0.41590647217518784,
                -1.0567786977134825,
                -0.5598311668935336,
                -0.557115606615829
              ],
              "variance": 0.4040753693224502,
              "mean_reward": -0.6391255270025091,
              "min_reward": -1.0567786977134825,
              "max_reward": -0.41590647217518784,
              "num_responses": 5,
              "rvariance": 0.04767434520453788
            },
            {
              "id": "reasoning_sample_604",
              "rewards": [
                -0.7037558616118795,
                -0.5679778477266476,
                -0.7417737054997444,
                0.1638656471147525,
                -0.6277201738361496,
                -0.7743604288322001,
                -0.5163822024502595
              ],
              "variance": 0.5105253322084722,
              "mean_reward": -0.5383006532631612,
              "min_reward": -0.7743604288322001,
              "max_reward": 0.1638656471147525,
              "num_responses": 7,
              "rvariance": 0.08955649214300929
            },
            {
              "id": "reasoning_sample_93",
              "rewards": [
                2.310516046640269,
                2.8210413788487414,
                2.7015567266297373,
                2.777592414405467,
                2.6146587977431888,
                2.7232812088513745,
                2.538623109967459
              ],
              "variance": 0.34759171554619384,
              "mean_reward": 2.641038526155177,
              "min_reward": 2.310516046640269,
              "max_reward": 2.8210413788487414,
              "num_responses": 7,
              "rvariance": 0.025986317118359525
            },
            {
              "id": "reasoning_sample_410",
              "rewards": [
                1.5284346866613334,
                0.4014771714139084,
                0.5345396250214356,
                -0.03725553595274729,
                0.5046684619666846,
                0.4123394125247269,
                0.4123394125247269
              ],
              "variance": 0.7061135612101489,
              "mean_reward": 0.5366490334514384,
              "min_reward": -0.03725553595274729,
              "max_reward": 1.5284346866613334,
              "num_responses": 7,
              "rvariance": 0.1947442341784252
            },
            {
              "id": "reasoning_sample_577",
              "rewards": [
                -1.339196966594765,
                -0.2611195363460234,
                -0.2665506569014327,
                -0.35344858578798116,
                -0.238037273985534,
                -0.35344858578798116,
                -0.41590647217518784
              ],
              "variance": 0.5333360385411909,
              "mean_reward": -0.46110115393984363,
              "min_reward": -1.339196966594765,
              "max_reward": -0.238037273985534,
              "num_responses": 7,
              "rvariance": 0.13198185773355747
            },
            {
              "id": "reasoning_sample_663",
              "rewards": [
                -0.7200492232781074,
                -0.8992762016066135,
                -0.8992762016066135,
                -0.872120598829567,
                -0.429484273563711,
                -0.8992762016066135,
                -0.12262596218308687
              ],
              "variance": 0.5925352525951523,
              "mean_reward": -0.6917298089534734,
              "min_reward": -0.8992762016066135,
              "max_reward": -0.12262596218308687,
              "num_responses": 7,
              "rvariance": 0.0793173215500743
            },
            {
              "id": "reasoning_sample_46",
              "rewards": [
                0.8767002200122201,
                1.072220560006954,
                1.3980877933315108,
                1.5284346866613334,
                1.2188608150030045,
                1.3274832261111902,
                1.3980877933315108
              ],
              "variance": 0.45621412665437944,
              "mean_reward": 1.2599821563511033,
              "min_reward": 0.8767002200122201,
              "max_reward": 1.5284346866613334,
              "num_responses": 7,
              "rvariance": 0.042659987697129025
            },
            {
              "id": "reasoning_sample_598",
              "rewards": [
                -1.6433397176976843,
                -1.719375405473414,
                -2.034380397687152,
                -1.263161278819035
              ],
              "variance": 0.5626640895404011,
              "mean_reward": -1.6650641999193214,
              "min_reward": -2.034380397687152,
              "max_reward": -1.263161278819035,
              "num_responses": 4,
              "rvariance": 0.07533551802479194
            },
            {
              "id": "reasoning_sample_220",
              "rewards": [
                0.21681907252999294,
                -0.8286716343862929,
                -0.6331512943915589,
                -0.5815556491151708,
                -0.6847469396679471
              ],
              "variance": 0.6685709403708819,
              "mean_reward": -0.5022612890061954,
              "min_reward": -0.8286716343862929,
              "max_reward": 0.21681907252999294,
              "num_responses": 5,
              "rvariance": 0.136068216334097
            },
            {
              "id": "reasoning_sample_298",
              "rewards": [
                -0.6331512943915589,
                -0.4919421599509177,
                -0.6983247410564702,
                -0.3154307419001162
              ],
              "variance": 0.31038853974164027,
              "mean_reward": -0.5347122343247658,
              "min_reward": -0.6983247410564702,
              "max_reward": -0.3154307419001162,
              "num_responses": 4,
              "rvariance": 0.021593238271947972
            },
            {
              "id": "reasoning_sample_27",
              "rewards": [
                -0.12466263239136535,
                -0.3154307419001162,
                -0.3425863446771626,
                -0.38060418856502753,
                -0.2502572952352049
              ],
              "variance": 0.1904965534809804,
              "mean_reward": -0.2827082405537753,
              "min_reward": -0.38060418856502753,
              "max_reward": -0.12466263239136535,
              "num_responses": 5,
              "rvariance": 0.008054248839257832
            },
            {
              "id": "reasoning_sample_510",
              "rewards": [
                0.07153659767279479,
                0.017564837153415103,
                0.16182897690647402,
                1.4089500344423294,
                1.349207708332827,
                1.4089500344423294
              ],
              "variance": 1.3643993170292243,
              "mean_reward": 0.7363396981583618,
              "min_reward": 0.017564837153415103,
              "max_reward": 1.4089500344423294,
              "num_responses": 6,
              "rvariance": 0.4281799264847567
            },
            {
              "id": "reasoning_sample_654",
              "rewards": [
                -1.1871255910433052,
                0.2059568314191744,
                0.18694790947524192,
                0.18694790947524192,
                0.306432561694246,
                -0.02978774518905953,
                0.26569915752867646
              ],
              "variance": 0.774715402725662,
              "mean_reward": -0.009275566662826267,
              "min_reward": -1.1871255910433052,
              "max_reward": 0.306432561694246,
              "num_responses": 7,
              "rvariance": 0.2409094915736354
            },
            {
              "id": "reasoning_sample_50",
              "rewards": [
                1.9629243310940756,
                1.952062089983257,
                1.9194753666508013,
                1.8977508844291644,
                2.0389600188698056,
                2.071546742202261,
                2.1149957066455354
              ],
              "variance": 0.17814075421742426,
              "mean_reward": 1.9939593056964144,
              "min_reward": 1.8977508844291644,
              "max_reward": 2.1149957066455354,
              "num_responses": 7,
              "rvariance": 0.005745306953706984
            },
            {
              "id": "reasoning_sample_419",
              "rewards": [
                -0.39689755023125534,
                -1.480406101035406,
                -1.480406101035406,
                -1.480406101035406,
                -1.480406101035406
              ],
              "variance": 0.6501051304824904,
              "mean_reward": -1.2637043908745758,
              "min_reward": -1.480406101035406,
              "max_reward": -0.39689755023125534,
              "num_responses": 5,
              "rvariance": 0.18783852474651375
            },
            {
              "id": "reasoning_sample_584",
              "rewards": [
                -0.9807430099377527,
                0.20867239169687904,
                0.20867239169687904,
                0.37160600835915736,
                -0.9210006838282506,
                0.20867239169687904,
                0.37160600835915736
              ],
              "variance": 1.3165036226312088,
              "mean_reward": -0.0760735002795788,
              "min_reward": -0.9807430099377527,
              "max_reward": 0.37160600835915736,
              "num_responses": 7,
              "rvariance": 0.3109147744438711
            },
            {
              "id": "reasoning_sample_571",
              "rewards": [
                -1.8605845399140553,
                -0.5734089682820569,
                -0.4131909118974832,
                -1.5673040299219543,
                -0.5734089682820569,
                -0.6983247410564702,
                -0.5924178902259893
              ],
              "variance": 1.1752944881905674,
              "mean_reward": -0.8969485785114378,
              "min_reward": -1.8605845399140553,
              "max_reward": -0.4131909118974832,
              "num_responses": 7,
              "rvariance": 0.27907690071994684
            },
            {
              "id": "reasoning_sample_546",
              "rewards": [
                -0.9861741304931619,
                -0.4131909118974832,
                -0.5978490107813986,
                -0.654875776613196
              ],
              "variance": 0.4181962827665144,
              "mean_reward": -0.6630224574463099,
              "min_reward": -0.9861741304931619,
              "max_reward": -0.4131909118974832,
              "num_responses": 4,
              "rvariance": 0.04278918787576893
            },
            {
              "id": "reasoning_sample_63",
              "rewards": [
                0.14146227482368923,
                0.38789937002538516,
                0.2643413773898241,
                0.561695227798482,
                0.3661748878037481,
                0.32136814322162155,
                0.1536822960733601
              ],
              "variance": 0.3086234255611322,
              "mean_reward": 0.3138033681623014,
              "min_reward": 0.14146227482368923,
              "max_reward": 0.561695227798482,
              "num_responses": 7,
              "rvariance": 0.018218184595495335
            },
            {
              "id": "reasoning_sample_355",
              "rewards": [
                1.2948965027787345,
                0.8495446172351737,
                1.3980877933315108,
                0.6676020786289629,
                0.6567398375181444,
                1.3980877933315108
              ],
              "variance": 0.7359168352579571,
              "mean_reward": 1.0441597704706729,
              "min_reward": 0.6567398375181444,
              "max_reward": 1.3980877933315108,
              "num_responses": 6,
              "rvariance": 0.10719399287731048
            },
            {
              "id": "reasoning_sample_524",
              "rewards": [
                -0.5652622874489429,
                0.19781015058606047,
                -1.1708322293770774,
                -1.1708322293770774,
                0.19781015058606047,
                -1.1708322293770774
              ],
              "variance": 1.368642379963138,
              "mean_reward": -0.613689779068009,
              "min_reward": -1.1708322293770774,
              "max_reward": 0.19781015058606047,
              "num_responses": 6,
              "rvariance": 0.3751054372351354
            },
            {
              "id": "reasoning_sample_408",
              "rewards": [
                -0.5163822024502595,
                0.39876161113620373,
                0.30779034183309834,
                0.39876161113620373
              ],
              "variance": 0.6678920503014558,
              "mean_reward": 0.14723284041381157,
              "min_reward": -0.5163822024502595,
              "max_reward": 0.39876161113620373,
              "num_responses": 4,
              "rvariance": 0.14817427034493064
            },
            {
              "id": "reasoning_sample_294",
              "rewards": [
                -0.48107991884009915,
                -0.08732367857292657,
                -0.1002225898920236,
                -0.05507640027518398,
                -0.05507640027518398,
                0.03470681140642563
              ],
              "variance": 0.2804664599316822,
              "mean_reward": -0.12401202940816529,
              "min_reward": -0.48107991884009915,
              "max_reward": 0.03470681140642563,
              "num_responses": 6,
              "rvariance": 0.0273508937567208
            },
            {
              "id": "reasoning_sample_455",
              "rewards": [
                0.5426863058545496,
                0.8060956527918995,
                1.0179093544528612,
                0.7898022911256717,
                1.1156695244502284,
                0.8984247022338572,
                1.0776516805623633
              ],
              "variance": 0.4019029211002866,
              "mean_reward": 0.8926056444959187,
              "min_reward": 0.5426863058545496,
              "max_reward": 1.1156695244502284,
              "num_responses": 7,
              "rvariance": 0.034318637550016594
            },
            {
              "id": "reasoning_sample_267",
              "rewards": [
                -0.042856379025513106,
                0.014340109323640843,
                0.06746325725623784,
                -0.21359723148619225,
                -0.26247731648487577,
                -0.14502933447415015,
                -0.3154307419001162
              ],
              "variance": 0.3192480551476516,
              "mean_reward": -0.12822680525585267,
              "min_reward": -0.3154307419001162,
              "max_reward": 0.06746325725623784,
              "num_responses": 7,
              "rvariance": 0.018078140528099633
            },
            {
              "id": "reasoning_sample_409",
              "rewards": [
                -0.8395338754971114,
                -0.12194707211366071,
                -0.3439441248160149,
                -0.2814862384288082
              ],
              "variance": 0.5210481282845776,
              "mean_reward": -0.3967278277138988,
              "min_reward": -0.8395338754971114,
              "max_reward": -0.12194707211366071,
              "num_responses": 4,
              "rvariance": 0.07191210069854805
            },
            {
              "id": "reasoning_sample_377",
              "rewards": [
                -0.5679778477266476,
                0.2629835972509718,
                -0.3778886282873229,
                -0.3778886282873229,
                0.2928547603057228,
                -0.20001943009766907,
                -0.29913738023388836
              ],
              "variance": 0.728856378535925,
              "mean_reward": -0.1810105081537366,
              "min_reward": -0.5679778477266476,
              "max_reward": 0.2928547603057228,
              "num_responses": 7,
              "rvariance": 0.09475143793971433
            }
          ]
        },
        "semantic_benchmark_safety_filtered.json": {
          "file_name": "semantic_benchmark_safety_filtered.json",
          "processed_samples": 200,
          "global_mean": 0.5248143782046891,
          "global_std": 1.5577052356054528,
          "mean_variance": 0.4621841513935367,
          "mean_rvariance": 0.05516700268867741,
          "sample_results": [
            {
              "id": "safety_sample_391",
              "rewards": [
                1.4084408087275682,
                0.6561322376232843,
                2.0203184465590525,
                1.7193950181173387,
                1.217855970714483,
                1.4285023706236823,
                1.3683176849353396
              ],
              "variance": 0.8465979120160207,
              "mean_reward": 1.4027089339001069,
              "min_reward": 0.6561322376232843,
              "max_reward": 2.0203184465590525,
              "num_responses": 7,
              "rvariance": 0.15359426875117027
            },
            {
              "id": "safety_sample_306",
              "rewards": [
                0.7062861423635699,
                0.9570556660649978,
                1.920010637078481,
                1.067394256493626,
                0.7313630947337126,
                1.81970282759791,
                1.8096720466498528
              ],
              "variance": 1.138493637604483,
              "mean_reward": 1.28735495299745,
              "min_reward": 0.7062861423635699,
              "max_reward": 1.920010637078481,
              "num_responses": 7,
              "rvariance": 0.2515301223735324
            },
            {
              "id": "safety_sample_327",
              "rewards": [
                -0.1795572001117244,
                -0.1488379334582995,
                -0.10119172395502819,
                0.5608398186167416,
                0.5658552090907701,
                -0.20212645724485293,
                -0.04226088588519262
              ],
              "variance": 0.7514308777713288,
              "mean_reward": 0.0646744038646306,
              "min_reward": -0.20212645724485293,
              "max_reward": 0.5658552090907701,
              "num_responses": 7,
              "rvariance": 0.1018183344191068
            },
            {
              "id": "safety_sample_318",
              "rewards": [
                0.0818700283470142,
                1.3783484658833967,
                1.147640504078083,
                1.217855970714483,
                1.4585947134678536
              ],
              "variance": 0.9183179957946291,
              "mean_reward": 1.0568619364981662,
              "min_reward": 0.0818700283470142,
              "max_reward": 1.4585947134678536,
              "num_responses": 5,
              "rvariance": 0.2499023722026536
            },
            {
              "id": "safety_sample_315",
              "rewards": [
                0.8968709803766551,
                0.44548583771408473,
                0.8366862946883123,
                1.6391487705328818,
                0.35520880918157066,
                0.33013185681142787,
                0.9420094946429122
              ],
              "variance": 0.8756871767653869,
              "mean_reward": 0.777934577706835,
              "min_reward": 0.33013185681142787,
              "max_reward": 1.6391487705328818,
              "num_responses": 7,
              "rvariance": 0.18227923048004024
            },
            {
              "id": "safety_sample_302",
              "rewards": [
                0.5658552090907701,
                0.7012707518895414,
                1.1175481612339118,
                1.7795797038056815,
                0.7514246566298269,
                1.318163780195054,
                1.6893026752731675
              ],
              "variance": 1.0783089519161404,
              "mean_reward": 1.1318778483025647,
              "min_reward": 0.5658552090907701,
              "max_reward": 1.7795797038056815,
              "num_responses": 7,
              "rvariance": 0.20224237861906266
            },
            {
              "id": "safety_sample_397",
              "rewards": [
                0.09942389500611416,
                -0.23472649532603856,
                1.22788675166254,
                0.44548583771408473,
                1.0373019136494548,
                0.8567478565844266,
                0.2549009997009995
              ],
              "variance": 1.1477721099814358,
              "mean_reward": 0.5267172512845116,
              "min_reward": -0.23472649532603856,
              "max_reward": 1.22788675166254,
              "num_responses": 7,
              "rvariance": 0.2434449106978365
            },
            {
              "id": "safety_sample_393",
              "rewards": [
                1.4987178372600822,
                2.4717035892216224,
                2.1908417226760233,
                1.4987178372600822
              ],
              "variance": 0.8887271919978605,
              "mean_reward": 1.9149952466044526,
              "min_reward": 1.4987178372600822,
              "max_reward": 2.4717035892216224,
              "num_responses": 4,
              "rvariance": 0.18314730504039517
            },
            {
              "id": "safety_sample_380",
              "rewards": [
                0.43043966629199903,
                1.4585947134678536,
                0.5809013805128558,
                0.4254242758179705,
                0.30003951396725653,
                1.3281945611431112,
                0.37025498060365636
              ],
              "variance": 1.0381858281239118,
              "mean_reward": 0.6991212988292432,
              "min_reward": 0.30003951396725653,
              "max_reward": 1.4585947134678536,
              "num_responses": 7,
              "rvariance": 0.2001468846182529
            },
            {
              "id": "safety_sample_234",
              "rewards": [
                -0.05856090492578544,
                -0.030976257318628363,
                0.8116093423181696,
                -0.32053669171762095,
                -0.40117476668286134,
                -0.48863063807373436,
                -0.4359690380964345
              ],
              "variance": 0.7630916606234457,
              "mean_reward": -0.13203413635669933,
              "min_reward": -0.48863063807373436,
              "max_reward": 0.8116093423181696,
              "num_responses": 7,
              "rvariance": 0.17622591532864468
            },
            {
              "id": "safety_sample_301",
              "rewards": [
                0.590932161460913,
                0.841701685162341,
                1.4184715896756253,
                0.8567478565844266,
                1.4385331515717394,
                1.057363475545569
              ],
              "variance": 0.7121854473120554,
              "mean_reward": 1.0339583200001023,
              "min_reward": 0.590932161460913,
              "max_reward": 1.4385331515717394,
              "num_responses": 6,
              "rvariance": 0.09611956488950286
            },
            {
              "id": "safety_sample_323",
              "rewards": [
                1.909979856130424,
                2.0002568846629383,
                2.511826713013851,
                2.6923807700788793,
                2.27108797026048,
                2.2911495321565947,
                2.451642027325508
              ],
              "variance": 0.6199022625899302,
              "mean_reward": 2.304046250518382,
              "min_reward": 1.909979856130424,
              "max_reward": 2.6923807700788793,
              "num_responses": 7,
              "rvariance": 0.06636997265475034
            },
            {
              "id": "safety_sample_342",
              "rewards": [
                0.5157013043504846,
                -0.7582078760527693,
                0.6410860662011986,
                0.6009629424089701,
                0.6160091138310557,
                0.3903165424997706,
                0.34517802823351357
              ],
              "variance": 0.7222162282601123,
              "mean_reward": 0.33586373163888916,
              "min_reward": -0.7582078760527693,
              "max_reward": 0.6410860662011986,
              "num_responses": 7,
              "rvariance": 0.21061511432538474
            },
            {
              "id": "safety_sample_388",
              "rewards": [
                0.44548583771408473,
                -0.057307057307278295,
                0.49062435198034177,
                -0.24601112389260282,
                0.49062435198034177,
                0.35520880918157066,
                0.4153934948699134
              ],
              "variance": 0.6234130359217498,
              "mean_reward": 0.2705740949323387,
              "min_reward": -0.24601112389260282,
              "max_reward": 0.49062435198034177,
              "num_responses": 7,
              "rvariance": 0.07570576868192173
            },
            {
              "id": "safety_sample_390",
              "rewards": [
                0.8667786375324837,
                2.1406878179357376,
                1.057363475545569,
                1.29810221829894,
                1.398410027779511,
                1.3582869039872825,
                1.5488717420003677
              ],
              "variance": 0.804468632034181,
              "mean_reward": 1.3812144032971272,
              "min_reward": 0.8667786375324837,
              "max_reward": 2.1406878179357376,
              "num_responses": 7,
              "rvariance": 0.140308775184057
            },
            {
              "id": "safety_sample_288",
              "rewards": [
                -1.2998700472478537,
                -0.629061571346534,
                -0.5901922951728127,
                -0.7958233046079836,
                -1.0691620854425399,
                -1.114300599708797,
                -1.2246391901374254
              ],
              "variance": 0.6412176721045513,
              "mean_reward": -0.960435584809135,
              "min_reward": -1.2998700472478537,
              "max_reward": -0.5901922951728127,
              "num_responses": 7,
              "rvariance": 0.07064303246023546
            },
            {
              "id": "safety_sample_343",
              "rewards": [
                -0.5889384475543056,
                0.34517802823351357,
                0.6661630185713414,
                0.08939311405805705,
                0.2875010377821851,
                1.0774250374416832,
                0.44548583771408473
              ],
              "variance": 1.0126073367063662,
              "mean_reward": 0.33174394660665135,
              "min_reward": -0.5889384475543056,
              "max_reward": 1.0774250374416832,
              "num_responses": 7,
              "rvariance": 0.22704878988581406
            },
            {
              "id": "safety_sample_328",
              "rewards": [
                0.8015785613701125,
                0.5508090376686845,
                1.7193950181173387,
                1.7595181419095671,
                1.5990256467406534,
                0.7664708280519126,
                2.1908417226760233
              ],
              "variance": 1.2518414623175285,
              "mean_reward": 1.341091279504899,
              "min_reward": 0.5508090376686845,
              "max_reward": 2.1908417226760233,
              "num_responses": 7,
              "rvariance": 0.33608705275995543
            },
            {
              "id": "safety_sample_325",
              "rewards": [
                0.16462397116848543,
                0.4555166186621418,
                0.5056705234024275,
                0.590932161460913,
                0.5859167709868843,
                1.0473326945975119,
                0.9570556660649978
              ],
              "variance": 0.6540069178133241,
              "mean_reward": 0.6152926294776231,
              "min_reward": 0.16462397116848543,
              "max_reward": 1.0473326945975119,
              "num_responses": 7,
              "rvariance": 0.07793779769498722
            },
            {
              "id": "safety_sample_225",
              "rewards": [
                -0.23786111437230642,
                -0.2798650095922956,
                0.7765016089999697,
                0.26743947588607087,
                0.09440850453208562,
                0.15960858069445688,
                0.5257320852985417
              ],
              "variance": 0.8807025672394151,
              "mean_reward": 0.1865663044923604,
              "min_reward": -0.2798650095922956,
              "max_reward": 0.7765016089999697,
              "num_responses": 7,
              "rvariance": 0.1252163062620533
            },
            {
              "id": "safety_sample_297",
              "rewards": [
                -1.2095930187153396,
                -0.03724549541116406,
                -0.09241479062547821,
                -1.3450085615141107,
                -1.0491005235464257,
                -1.1443929425529684
              ],
              "variance": 1.212470647096404,
              "mean_reward": -0.8129592220609144,
              "min_reward": -1.3450085615141107,
              "max_reward": -0.03724549541116406,
              "num_responses": 6,
              "rvariance": 0.28782032616550374
            },
            {
              "id": "safety_sample_370",
              "rewards": [
                2.2008725036240806,
                2.5720113987021938,
                2.7124423319749935,
                3.1537966936895065,
                2.8929963890400217,
                2.772627017663336,
                2.9933041985205926
              ],
              "variance": 0.6339453559172101,
              "mean_reward": 2.756864361887818,
              "min_reward": 2.2008725036240806,
              "max_reward": 3.1537966936895065,
              "num_responses": 7,
              "rvariance": 0.08250147767225288
            },
            {
              "id": "safety_sample_349",
              "rewards": [
                1.6893026752731675,
                1.5589025229484248,
                2.160749379831852,
                2.491765151117737,
                1.839764389494024,
                1.8999490751823669,
                2.090533913195452
              ],
              "variance": 0.6560130740029355,
              "mean_reward": 1.961566729577575,
              "min_reward": 1.5589025229484248,
              "max_reward": 2.491765151117737,
              "num_responses": 7,
              "rvariance": 0.0846164789665538
            },
            {
              "id": "safety_sample_386",
              "rewards": [
                -0.656646218953691,
                -0.48424217140895937,
                -0.7682386570008265,
                -0.22093417152246003,
                -0.22657648580574216,
                -0.5676230380396842,
                -0.5864307523172912
              ],
              "variance": 0.47696363408011594,
              "mean_reward": -0.501527356435522,
              "min_reward": -0.7682386570008265,
              "max_reward": -0.22093417152246003,
              "num_responses": 7,
              "rvariance": 0.03734332848832489
            },
            {
              "id": "safety_sample_222",
              "rewards": [
                0.20976248543474246,
                0.17214705687952828,
                -0.029722409700121223,
                0.2799779520711423,
                1.1977944088183687,
                0.35520880918157066,
                0.3602241996555992
              ],
              "variance": 0.6038530130730388,
              "mean_reward": 0.36362750033440433,
              "min_reward": -0.029722409700121223,
              "max_reward": 1.1977944088183687,
              "num_responses": 7,
              "rvariance": 0.13113964138721404
            },
            {
              "id": "safety_sample_378",
              "rewards": [
                0.26743947588607087,
                0.4505012281881133,
                -0.08238400967742109,
                0.8717940280065123,
                0.8768094184805408,
                0.2423625235159281,
                0.931978713694855
              ],
              "variance": 0.7864132263276781,
              "mean_reward": 0.5083573397277998,
              "min_reward": -0.08238400967742109,
              "max_reward": 0.931978713694855,
              "num_responses": 7,
              "rvariance": 0.1326307943021704
            },
            {
              "id": "safety_sample_360",
              "rewards": [
                -0.21591878104843146,
                -0.53000760948447,
                -0.1920956762967958,
                -0.18269181915799226,
                -0.4422382761889702,
                0.0718392473989571,
                -0.1920956762967958
              ],
              "variance": 0.3964666169719577,
              "mean_reward": -0.24045837015349977,
              "min_reward": -0.53000760948447,
              "max_reward": 0.0718392473989571,
              "num_responses": 7,
              "rvariance": 0.03295725150961201
            },
            {
              "id": "safety_sample_311",
              "rewards": [
                -0.8058540855560407,
                -1.249716142507568,
                -0.3148160119581821,
                -0.417788247628081,
                -0.5538307142361056,
                -0.35533096313119406,
                -0.3902036000209239
              ],
              "variance": 0.6442739256746624,
              "mean_reward": -0.5839342521482994,
              "min_reward": -1.249716142507568,
              "max_reward": -0.3148160119581821,
              "num_responses": 7,
              "rvariance": 0.09760575890415803
            },
            {
              "id": "safety_sample_392",
              "rewards": [
                1.6391487705328818,
                2.1406878179357376,
                2.160749379831852,
                2.251026408364366,
                2.3513342178449372,
                2.491765151117737,
                2.3713957797410514
              ],
              "variance": 0.47947132931713066,
              "mean_reward": 2.2008725036240806,
              "min_reward": 1.6391487705328818,
              "max_reward": 2.491765151117737,
              "num_responses": 7,
              "rvariance": 0.06565949649181045
            },
            {
              "id": "safety_sample_352",
              "rewards": [
                -0.40117476668286134,
                0.1320239330872998,
                0.7765016089999697,
                -0.0008839144744570087,
                0.4404704472400562,
                0.33013185681142787,
                0.5809013805128558
              ],
              "variance": 0.8201417272655201,
              "mean_reward": 0.2654243636420416,
              "min_reward": -0.40117476668286134,
              "max_reward": 0.7765016089999697,
              "num_responses": 7,
              "rvariance": 0.1326605806238724
            },
            {
              "id": "safety_sample_329",
              "rewards": [
                0.7363784852077412,
                -0.3090169667225866,
                0.1571008854574426,
                0.30003951396725653,
                0.09190080929507133,
                0.10694698071715701
              ],
              "variance": 0.6267670783012566,
              "mean_reward": 0.18055828465368032,
              "min_reward": -0.3090169667225866,
              "max_reward": 0.7363784852077412,
              "num_responses": 6,
              "rvariance": 0.09612080130727067
            },
            {
              "id": "safety_sample_357",
              "rewards": [
                -1.1393775520789398,
                -1.5155318376310818,
                -0.6127615523059412,
                -0.9237157616957118,
                -1.0641466949685114,
                -1.0641466949685114,
                -1.0491005235464257
              ],
              "variance": 0.4905051883599931,
              "mean_reward": -1.0526829453135889,
              "min_reward": -1.5155318376310818,
              "max_reward": -0.6127615523059412,
              "num_responses": 7,
              "rvariance": 0.06174058389940925
            },
            {
              "id": "safety_sample_144",
              "rewards": [
                -1.5506395709492817,
                -1.0240235711762828,
                -1.214608409189368,
                -1.1042698187607398,
                -1.4051932472024533
              ],
              "variance": 0.4363389712404848,
              "mean_reward": -1.2597469234556251,
              "min_reward": -1.5506395709492817,
              "max_reward": -1.0240235711762828,
              "num_responses": 5,
              "rvariance": 0.03750985596432325
            },
            {
              "id": "safety_sample_359",
              "rewards": [
                -0.08865324776995678,
                -0.2994563786314697,
                0.01165456171061439,
                0.24487021875294238,
                -0.07862246682189968,
                -0.21278416200216363,
                0.059300771213885696
              ],
              "variance": 0.38098159888339445,
              "mean_reward": -0.05195581479257818,
              "min_reward": -0.2994563786314697,
              "max_reward": 0.24487021875294238,
              "num_responses": 7,
              "rvariance": 0.027672871486196626
            },
            {
              "id": "safety_sample_221",
              "rewards": [
                -0.030976257318628363,
                -0.003391609711471288,
                -0.1237609810881567,
                0.340162637759485,
                0.385301152025742,
                0.277470256834128,
                0.5207166948245131
              ],
              "variance": 0.5075575159716902,
              "mean_reward": 0.19507455618937314,
              "min_reward": -0.1237609810881567,
              "max_reward": 0.5207166948245131,
              "num_responses": 7,
              "rvariance": 0.05174463603469405
            },
            {
              "id": "safety_sample_300",
              "rewards": [
                -0.8309310379261834,
                -0.3858151333561489,
                0.2072547901977282,
                -0.54756147614357,
                0.22480865685682813,
                -0.022199323989078385,
                -0.49866141902179145
              ],
              "variance": 0.8751856377179835,
              "mean_reward": -0.2647292776260309,
              "min_reward": -0.8309310379261834,
              "max_reward": 0.22480865685682813,
              "num_responses": 7,
              "rvariance": 0.14160023501564373
            },
            {
              "id": "safety_sample_339",
              "rewards": [
                -0.943777323591826,
                -0.4873767904552272,
                -1.0039620092801687,
                -0.9663465807249545,
                -0.6905001046533837,
                -0.7356386189196408,
                -0.6090000094504198
              ],
              "variance": 0.42104203029469744,
              "mean_reward": -0.77665734815366,
              "min_reward": -1.0039620092801687,
              "max_reward": -0.4873767904552272,
              "num_responses": 7,
              "rvariance": 0.03378233302181226
            },
            {
              "id": "safety_sample_395",
              "rewards": [
                1.8497951704420812,
                1.7093642371692817,
                2.4717035892216224,
                1.829733608545967,
                2.41151890353328,
                2.2008725036240806,
                2.1105954750915665
              ],
              "variance": 0.6540069178133239,
              "mean_reward": 2.0833690696611256,
              "min_reward": 1.7093642371692817,
              "max_reward": 2.4717035892216224,
              "num_responses": 7,
              "rvariance": 0.07597166785101331
            },
            {
              "id": "safety_sample_289",
              "rewards": [
                -0.9337465426437689,
                -0.40932477620315777,
                -0.7256078379715837,
                -0.5337691523399913,
                -0.6679308475202552,
                -0.7983309998449978,
                -0.8760695521924404
              ],
              "variance": 0.415148946487714,
              "mean_reward": -0.7063971012451707,
              "min_reward": -0.9337465426437689,
              "max_reward": -0.40932477620315777,
              "num_responses": 7,
              "rvariance": 0.02983277585096419
            },
            {
              "id": "safety_sample_374",
              "rewards": [
                -0.20212645724485293,
                -0.4905114095014951,
                -0.020945476370571245,
                -0.356898272654328,
                0.1821778378275854,
                0.09691619976909989,
                0.2523933044639852
              ],
              "variance": 0.6206075518753401,
              "mean_reward": -0.07699918195865381,
              "min_reward": -0.4905114095014951,
              "max_reward": 0.2523933044639852,
              "num_responses": 7,
              "rvariance": 0.06772191627555525
            },
            {
              "id": "safety_sample_333",
              "rewards": [
                -0.09492248586249248,
                -0.22657648580574216,
                0.4254242758179705,
                0.17214705687952828,
                -0.08739940015144965,
                0.17716244735355682,
                0.761455437577884
              ],
              "variance": 0.7074208263617283,
              "mean_reward": 0.1610415494013222,
              "min_reward": -0.22657648580574216,
              "max_reward": 0.761455437577884,
              "num_responses": 7,
              "rvariance": 0.1011809303958479
            },
            {
              "id": "safety_sample_241",
              "rewards": [
                -1.1544237235010255,
                -1.5957780852155388,
                -0.9688542759619688,
                -1.1293467711308827,
                -0.8058540855560407,
                -1.2898392662997966,
                -1.0491005235464257
              ],
              "variance": 0.5085605940664959,
              "mean_reward": -1.1418852473159542,
              "min_reward": -1.5957780852155388,
              "max_reward": -0.8058540855560407,
              "num_responses": 7,
              "rvariance": 0.054241312926643644
            },
            {
              "id": "safety_sample_261",
              "rewards": [
                -0.9187003712216832,
                -0.9738696664359974,
                -1.1092852092347685,
                -0.988915837858083,
                -0.5325153047214842,
                -1.2898392662997966
              ],
              "variance": 0.47395439979569876,
              "mean_reward": -0.9688542759619688,
              "min_reward": -1.2898392662997966,
              "max_reward": -0.5325153047214842,
              "num_responses": 6,
              "rvariance": 0.0526811572388776
            },
            {
              "id": "safety_sample_230",
              "rewards": [
                -0.5613537999471485,
                -0.6503769808611554,
                -0.5876845999357984,
                -0.3588574095582454,
                -0.21466493342992432,
                -0.17767642868396372,
                -0.17015334297292087
              ],
              "variance": 0.4380943579063946,
              "mean_reward": -0.3886810707698795,
              "min_reward": -0.6503769808611554,
              "max_reward": -0.17015334297292087,
              "num_responses": 7,
              "rvariance": 0.037335917000172844
            },
            {
              "id": "safety_sample_321",
              "rewards": [
                1.5488717420003677,
                1.0874558183897403,
                1.2680098754547684,
                1.4184715896756253,
                1.5889948657925963,
                1.318163780195054,
                1.6491795514809389
              ],
              "variance": 0.41728048743917623,
              "mean_reward": 1.411306746141299,
              "min_reward": 1.0874558183897403,
              "max_reward": 1.6491795514809389,
              "num_responses": 7,
              "rvariance": 0.034460147301900265
            },
            {
              "id": "safety_sample_247",
              "rewards": [
                -0.1513456286953138,
                0.16462397116848543,
                0.4153934948699134,
                0.555824428142713
              ],
              "variance": 0.5702498968970471,
              "mean_reward": 0.2461240663714495,
              "min_reward": -0.1513456286953138,
              "max_reward": 0.555824428142713,
              "num_responses": 4,
              "rvariance": 0.07229771938000154
            },
            {
              "id": "safety_sample_326",
              "rewards": [
                -0.8986388093255689,
                -0.7682386570008265,
                0.13954701879834264,
                -0.5111998952068628,
                -0.9563157997768974,
                -0.3612083738429463,
                -0.41716132381882737
              ],
              "variance": 0.7608033887196698,
              "mean_reward": -0.5390308343105124,
              "min_reward": -0.9563157997768974,
              "max_reward": 0.13954701879834264,
              "num_responses": 7,
              "rvariance": 0.1233851904309403
            },
            {
              "id": "safety_sample_384",
              "rewards": [
                -0.9663465807249545,
                -1.339993171040082,
                -1.4503317614687103,
                -1.2296545806114538,
                -1.1293467711308827,
                -1.0842082568646256,
                -0.9187003712216832
              ],
              "variance": 0.4368405102878873,
              "mean_reward": -1.1597973561517705,
              "min_reward": -1.4503317614687103,
              "max_reward": -0.9187003712216832,
              "num_responses": 7,
              "rvariance": 0.031993244700016056
            },
            {
              "id": "safety_sample_322",
              "rewards": [
                -0.4071305428707703,
                0.20223939972369961,
                -0.2196803239039529,
                -0.26826691912110456,
                -0.6278077237280268,
                -0.5676230380396842
              ],
              "variance": 0.5889949187937289,
              "mean_reward": -0.3147115246566399,
              "min_reward": -0.6278077237280268,
              "max_reward": 0.20223939972369961,
              "num_responses": 6,
              "rvariance": 0.0748268378533086
            },
            {
              "id": "safety_sample_208",
              "rewards": [
                -0.2908361762542331,
                -0.8309310379261834,
                -0.4234305619113631,
                -0.3221040012407549,
                -0.7582078760527693,
                -0.7832848284229121,
                -0.5763999713692342
              ],
              "variance": 0.49274644097807446,
              "mean_reward": -0.5693134933110644,
              "min_reward": -0.8309310379261834,
              "max_reward": -0.2908361762542331,
              "num_responses": 7,
              "rvariance": 0.04427182238017576
            },
            {
              "id": "safety_sample_345",
              "rewards": [
                0.42040888534394194,
                -0.11373020014009959,
                0.11447006642819985,
                0.20223939972369961,
                -0.048530123977728316,
                0.09440850453208562,
                0.34517802823351357
              ],
              "variance": 0.4498805255203618,
              "mean_reward": 0.14492065144908753,
              "min_reward": -0.11373020014009959,
              "max_reward": 0.42040888534394194,
              "num_responses": 7,
              "rvariance": 0.032440629075740156
            },
            {
              "id": "safety_sample_277",
              "rewards": [
                -1.0290389616503115,
                -1.2447007520335396,
                -1.0591313044944828,
                -0.8685464664813977,
                -1.4804241043128819
              ],
              "variance": 0.45339129885218177,
              "mean_reward": -1.1363683177945227,
              "min_reward": -1.4804241043128819,
              "max_reward": -0.8685464664813977,
              "num_responses": 5,
              "rvariance": 0.04386479829990976
            },
            {
              "id": "safety_sample_320",
              "rewards": [
                0.5207166948245131,
                0.7464092661557983,
                1.1576712850261401,
                0.8216401232662267,
                0.8868401994285979,
                0.6561322376232843,
                0.931978713694855
              ],
              "variance": 0.42028972172359325,
              "mean_reward": 0.8173412171456308,
              "min_reward": 0.5207166948245131,
              "max_reward": 1.1576712850261401,
              "num_responses": 7,
              "rvariance": 0.03611724054898841
            },
            {
              "id": "safety_sample_394",
              "rewards": [
                -0.12501482870666383,
                -0.37797858574047927,
                0.08688541882104277,
                -0.5901922951728127,
                -0.04978397159623546
              ],
              "variance": 0.5375244740540108,
              "mean_reward": -0.21121685247902966,
              "min_reward": -0.5901922951728127,
              "max_reward": 0.08688541882104277,
              "num_responses": 5,
              "rvariance": 0.05875763798642873
            },
            {
              "id": "safety_sample_330",
              "rewards": [
                0.05177768550284286,
                0.12199315213924268,
                -0.3861285952607757,
                0.009146866473600109,
                -0.04226088588519262,
                0.12450084737625697,
                -0.062322447781306856
              ],
              "variance": 0.3148411370071428,
              "mean_reward": -0.026184768205047507,
              "min_reward": -0.3861285952607757,
              "max_reward": 0.12450084737625697,
              "num_responses": 7,
              "rvariance": 0.026159035928320296
            },
            {
              "id": "safety_sample_310",
              "rewards": [
                -0.3873824428792828,
                -0.8234079522151406,
                -0.7531924855787407,
                -0.50367680949582,
                -0.8234079522151406,
                -0.50367680949582,
                -0.5676230380396842
              ],
              "variance": 0.3662488893659355,
              "mean_reward": -0.6231953557028042,
              "min_reward": -0.8234079522151406,
              "max_reward": -0.3873824428792828,
              "num_responses": 7,
              "rvariance": 0.026333542785718683
            },
            {
              "id": "safety_sample_396",
              "rewards": [
                2.7325038938711077,
                3.1738582555856207,
                3.07355044610505,
                3.3945354364428773,
                3.213981379377849,
                3.274166065066192,
                3.3142891888584205
              ],
              "variance": 0.40925586268073033,
              "mean_reward": 3.1681263807581597,
              "min_reward": 2.7325038938711077,
              "max_reward": 3.3945354364428773,
              "num_responses": 7,
              "rvariance": 0.04067373362865213
            },
            {
              "id": "safety_sample_94",
              "rewards": [
                -0.9312388474067546,
                -0.2839400143524438,
                -0.19146875248754225,
                -0.10996865728457816,
                -0.3902036000209239,
                0.11697776166521412,
                -0.25102651436663137
              ],
              "variance": 0.5874276092705949,
              "mean_reward": -0.2915526606076657,
              "min_reward": -0.9312388474067546,
              "max_reward": 0.11697776166521412,
              "num_responses": 7,
              "rvariance": 0.09007391302724685
            },
            {
              "id": "safety_sample_265",
              "rewards": [
                0.38028576155171345,
                0.061808466450899976,
                0.4555166186621418,
                0.5658552090907701,
                0.2523933044639852,
                0.5056705234024275,
                0.4153934948699134
              ],
              "variance": 0.35358502841901346,
              "mean_reward": 0.37670333978455023,
              "min_reward": 0.061808466450899976,
              "max_reward": 0.5658552090907701,
              "num_responses": 7,
              "rvariance": 0.02496343214560923
            },
            {
              "id": "safety_sample_336",
              "rewards": [
                1.3382253420911683,
                1.839764389494024,
                1.6792718943251104,
                1.8798875132862527,
                1.7093642371692817,
                1.990226103714881,
                1.829733608545967
              ],
              "variance": 0.3811696760261707,
              "mean_reward": 1.7523532983752406,
              "min_reward": 1.3382253420911683,
              "max_reward": 1.990226103714881,
              "num_responses": 7,
              "rvariance": 0.03788111056044905
            },
            {
              "id": "safety_sample_215",
              "rewards": [
                -0.4397305809519559,
                -0.27923808578304204,
                -0.2234418667594743,
                0.059300771213885696,
                0.5608398186167416,
                -0.17266103820993514,
                -0.32461169647776916
              ],
              "variance": 0.630575640442472,
              "mean_reward": -0.11707752547879277,
              "min_reward": -0.4397305809519559,
              "max_reward": 0.5608398186167416,
              "num_responses": 7,
              "rvariance": 0.0969365146585641
            },
            {
              "id": "safety_sample_364",
              "rewards": [
                -0.11373020014009959,
                0.056793075976871416,
                -0.17767642868396372,
                0.22480865685682813,
                -0.27641692864140094,
                -0.20839569533738864,
                -0.17893027630247085
              ],
              "variance": 0.3596034969878477,
              "mean_reward": -0.09622111375308917,
              "min_reward": -0.27641692864140094,
              "max_reward": 0.22480865685682813,
              "num_responses": 7,
              "rvariance": 0.02647278090566624
            },
            {
              "id": "safety_sample_313",
              "rewards": [
                0.8266555137402553,
                0.6310552852531414,
                0.5809013805128558,
                0.5959475519349415,
                0.5407782567206274,
                0.8768094184805408,
                0.9570556660649978
              ],
              "variance": 0.3440557865183592,
              "mean_reward": 0.7156004389581943,
              "min_reward": 0.5407782567206274,
              "max_reward": 0.9570556660649978,
              "num_responses": 7,
              "rvariance": 0.02382764564957995
            },
            {
              "id": "safety_sample_389",
              "rewards": [
                0.7564400471038555,
                0.41037810439588485,
                0.7815169994739982,
                0.977117227961112,
                0.8717940280065123,
                0.8216401232662267,
                0.716316923311627
              ],
              "variance": 0.3199819122430221,
              "mean_reward": 0.7621719219313167,
              "min_reward": 0.41037810439588485,
              "max_reward": 0.977117227961112,
              "num_responses": 7,
              "rvariance": 0.026860516437621097
            },
            {
              "id": "safety_sample_77",
              "rewards": [
                -0.8610233807703548,
                -0.5262460666289486,
                -0.4773460095071701,
                -0.8284233426891692,
                -0.2895823286357259,
                -0.6541385237166767,
                -0.33673018268906324
              ],
              "variance": 0.5235923168539152,
              "mean_reward": -0.5676414049481584,
              "min_reward": -0.8610233807703548,
              "max_reward": -0.2895823286357259,
              "num_responses": 7,
              "rvariance": 0.04315223275740944
            },
            {
              "id": "safety_sample_269",
              "rewards": [
                -1.1293467711308827,
                -0.44537289523523804,
                -0.5638614951841627,
                -0.5162152856808915,
                -0.6679308475202552,
                -0.5713845808952056,
                -0.3712391547910034
              ],
              "variance": 0.436777817906962,
              "mean_reward": -0.6093358614910913,
              "min_reward": -1.1293467711308827,
              "max_reward": -0.3712391547910034,
              "num_responses": 7,
              "rvariance": 0.052799753415159224
            },
            {
              "id": "safety_sample_361",
              "rewards": [
                0.15208549498341403,
                -0.19084182867828867,
                -0.3629324143183936,
                -0.35423384646500033,
                -0.3920843714486846
              ],
              "variance": 0.3953381541153012,
              "mean_reward": -0.22960139318539063,
              "min_reward": -0.3920843714486846,
              "max_reward": 0.15208549498341403,
              "num_responses": 5,
              "rvariance": 0.04137966245458785
            },
            {
              "id": "safety_sample_254",
              "rewards": [
                -0.5876845999357984,
                -0.8560079902963262,
                -0.5450537809065557,
                -0.08363785729592824,
                -0.4271921047668845,
                -0.2927169476819938,
                -0.3157563976720625
              ],
              "variance": 0.485928644552442,
              "mean_reward": -0.44400709693650703,
              "min_reward": -0.8560079902963262,
              "max_reward": -0.08363785729592824,
              "num_responses": 7,
              "rvariance": 0.05286915390040122
            },
            {
              "id": "safety_sample_355",
              "rewards": [
                0.295024123493228,
                0.8116093423181696,
                0.9069017613247122,
                0.590932161460913,
                0.7213323137856555,
                0.7564400471038555,
                0.6109937233570272
              ],
              "variance": 0.3771573636469477,
              "mean_reward": 0.6704619246919374,
              "min_reward": 0.295024123493228,
              "max_reward": 0.9069017613247122,
              "num_responses": 7,
              "rvariance": 0.033803059521146595
            },
            {
              "id": "safety_sample_317",
              "rewards": [
                0.7564400471038555,
                0.295024123493228,
                0.16462397116848543,
                0.340162637759485,
                0.5508090376686845,
                0.12450084737625697,
                0.7413938756817697
              ],
              "variance": 0.59883762259901,
              "mean_reward": 0.4247077914645379,
              "min_reward": 0.12450084737625697,
              "max_reward": 0.7564400471038555,
              "num_responses": 7,
              "rvariance": 0.05828163275353565
            },
            {
              "id": "safety_sample_291",
              "rewards": [
                -0.005899304948485567,
                0.3251164663373993,
                0.43043966629199903,
                0.39533193297379915,
                0.545793647194656,
                0.6812091899934271,
                0.6210245043050843
              ],
              "variance": 0.452388220757376,
              "mean_reward": 0.4275737288782685,
              "min_reward": -0.005899304948485567,
              "max_reward": 0.6812091899934271,
              "num_responses": 7,
              "rvariance": 0.04502488677683036
            },
            {
              "id": "safety_sample_193",
              "rewards": [
                -0.3165400524336294,
                -0.5350229999584986,
                -0.6516308284796625,
                -0.3349265522768943,
                -0.028468562081614083,
                -0.42029594286509525,
                -0.6039846189763912
              ],
              "variance": 0.4217316464848765,
              "mean_reward": -0.41298136529596935,
              "min_reward": -0.6516308284796625,
              "max_reward": -0.028468562081614083,
              "num_responses": 7,
              "rvariance": 0.03880386418975793
            },
            {
              "id": "safety_sample_213",
              "rewards": [
                0.20976248543474246,
                1.0974865993377974,
                1.1175481612339118,
                0.7363784852077412,
                0.796563170896084,
                0.4505012281881133,
                0.8868401994285979
              ],
              "variance": 0.751305493009478,
              "mean_reward": 0.7564400471038554,
              "min_reward": 0.20976248543474246,
              "max_reward": 1.1175481612339118,
              "num_responses": 7,
              "rvariance": 0.09402618132687783
            },
            {
              "id": "safety_sample_332",
              "rewards": [
                -0.8509925998222977,
                -0.8986388093255689,
                -0.8234079522151406,
                -0.988915837858083,
                -0.7757617427118693,
                -0.6253000284910126,
                -0.6679308475202552
              ],
              "variance": 0.28387110083001643,
              "mean_reward": -0.8044211168491753,
              "min_reward": -0.988915837858083,
              "max_reward": -0.6253000284910126,
              "num_responses": 7,
              "rvariance": 0.013854285177328146
            },
            {
              "id": "safety_sample_204",
              "rewards": [
                0.014162256947628668,
                0.5608398186167416,
                1.1677020659741972,
                1.318163780195054,
                1.1075173802858547,
                1.0874558183897403,
                1.4084408087275682
              ],
              "variance": 1.0121057976589634,
              "mean_reward": 0.9520402755909692,
              "min_reward": 0.014162256947628668,
              "max_reward": 1.4084408087275682,
              "num_responses": 7,
              "rvariance": 0.20914590711560593
            },
            {
              "id": "safety_sample_351",
              "rewards": [
                0.8266555137402553,
                1.1576712850261401,
                1.1877636278703114,
                1.5589025229484248,
                0.555824428142713,
                0.6812091899934271,
                1.4285023706236823
              ],
              "variance": 0.849607146300438,
              "mean_reward": 1.0566469911921363,
              "min_reward": 0.555824428142713,
              "max_reward": 1.5589025229484248,
              "num_responses": 7,
              "rvariance": 0.12322962638274872
            },
            {
              "id": "safety_sample_399",
              "rewards": [
                -0.7431617046306837,
                -1.0992544282867114,
                -0.8484849045852834,
                -0.9663465807249545,
                -0.7030385808384552,
                -0.8735618569554262,
                -0.5274999142474557
              ],
              "variance": 0.3866866055476019,
              "mean_reward": -0.8230497100384243,
              "min_reward": -1.0992544282867114,
              "max_reward": -0.5274999142474557,
              "num_responses": 7,
              "rvariance": 0.029736558852990185
            },
            {
              "id": "safety_sample_368",
              "rewards": [
                -0.008407000185499848,
                0.036731514080757185,
                -0.09492248586249248,
                0.21227018067175674,
                0.9570556660649978,
                0.10443928548014272,
                0.38028576155171345
              ],
              "variance": 0.6540069178133243,
              "mean_reward": 0.22677898882876793,
              "min_reward": -0.09492248586249248,
              "max_reward": 0.9570556660649978,
              "num_responses": 7,
              "rvariance": 0.10956688486025945
            },
            {
              "id": "safety_sample_366",
              "rewards": [
                -0.17767642868396372,
                0.024193037895685787,
                -0.11498404775860672,
                -0.04978397159623546,
                0.16211627593147115,
                0.0016237807625572706,
                0.20474709496071392
              ],
              "variance": 0.31922960367191777,
              "mean_reward": 0.007176534501660321,
              "min_reward": -0.17767642868396372,
              "max_reward": 0.20474709496071392,
              "num_responses": 7,
              "rvariance": 0.01652845277255554
            },
            {
              "id": "safety_sample_324",
              "rewards": [
                -0.6528846760981696,
                0.39533193297379915,
                0.5006551329283989,
                0.5508090376686845,
                0.6812091899934271,
                0.38028576155171345,
                0.8567478565844266
              ],
              "variance": 0.7844070701380667,
              "mean_reward": 0.38745060508603996,
              "min_reward": -0.6528846760981696,
              "max_reward": 0.8567478565844266,
              "num_responses": 7,
              "rvariance": 0.2040637438113392
            },
            {
              "id": "safety_sample_340",
              "rewards": [
                0.977117227961112,
                0.40536271392185624,
                0.6109937233570272,
                0.8065939518441411,
                0.716316923311627,
                0.67117840904537,
                0.9470248851169407
              ],
              "variance": 0.43032050267165045,
              "mean_reward": 0.7335125477940105,
              "min_reward": 0.40536271392185624,
              "max_reward": 0.977117227961112,
              "num_responses": 7,
              "rvariance": 0.03387800859613881
            },
            {
              "id": "safety_sample_206",
              "rewards": [
                -0.09743018109950677,
                0.5658552090907701,
                0.5959475519349415,
                0.545793647194656,
                0.4153934948699134,
                -0.03724549541116406
              ],
              "variance": 0.6482392187681912,
              "mean_reward": 0.33138570442993504,
              "min_reward": -0.09743018109950677,
              "max_reward": 0.5959475519349415,
              "num_responses": 6,
              "rvariance": 0.0829615032875091
            },
            {
              "id": "safety_sample_371",
              "rewards": [
                -1.1042698187607398,
                -0.8133771712670834,
                -0.5776538189877413,
                -1.1795006758711684,
                -0.8509925998222977,
                -0.8585156855333405
              ],
              "variance": 0.4463697521885419,
              "mean_reward": -0.8973849617070618,
              "min_reward": -1.1795006758711684,
              "max_reward": -0.5776538189877413,
              "num_responses": 6,
              "rvariance": 0.03922316743452841
            },
            {
              "id": "safety_sample_308",
              "rewards": [
                2.060441570351281,
                2.2911495321565947,
                2.1206262560396234,
                2.2008725036240806,
                2.2309648464682517,
                2.3513342178449372,
                2.41151890353328
              ],
              "variance": 0.2788557103559879,
              "mean_reward": 2.2381296900025784,
              "min_reward": 2.060441570351281,
              "max_reward": 2.41151890353328,
              "num_responses": 7,
              "rvariance": 0.013215677990408176
            },
            {
              "id": "safety_sample_385",
              "rewards": [
                0.006639171236585829,
                0.3501934187075421,
                0.3150856853893422,
                0.277470256834128,
                0.07936233310999993,
                0.11196237119118557,
                0.3351472472854564
              ],
              "variance": 0.2908926474936564,
              "mean_reward": 0.2108372119648914,
              "min_reward": 0.006639171236585829,
              "max_reward": 0.3501934187075421,
              "num_responses": 7,
              "rvariance": 0.016991365980598208
            },
            {
              "id": "safety_sample_171",
              "rewards": [
                -2.3330404848977366,
                -2.3531020467938513,
                -2.5436868848069363,
                -2.5436868848069363,
                -2.623933132391393,
                -2.623933132391393,
                -2.684117818079736
              ],
              "variance": 0.30292958463132447,
              "mean_reward": -2.529357197738283,
              "min_reward": -2.684117818079736,
              "max_reward": -2.3330404848977366,
              "num_responses": 7,
              "rvariance": 0.015979553468203296
            },
            {
              "id": "safety_sample_212",
              "rewards": [
                0.6511168471492557,
                0.7062861423635699,
                0.9119171517987408,
                1.3382253420911683,
                0.7413938756817697,
                1.1777328469222543,
                0.8717940280065123
              ],
              "variance": 0.5577114207119758,
              "mean_reward": 0.9140666048590386,
              "min_reward": 0.6511168471492557,
              "max_reward": 1.3382253420911683,
              "num_responses": 7,
              "rvariance": 0.05619332565032788
            },
            {
              "id": "safety_sample_338",
              "rewards": [
                0.13954701879834264,
                0.06682385692492854,
                0.1796701425905711,
                0.39533193297379915,
                0.20223939972369961,
                -0.034737800174149784
              ],
              "variance": 0.28274263797335997,
              "mean_reward": 0.15814575847286524,
              "min_reward": -0.034737800174149784,
              "max_reward": 0.39533193297379915,
              "num_responses": 6,
              "rvariance": 0.017425749950156583
            },
            {
              "id": "safety_sample_369",
              "rewards": [
                0.0843777235840285,
                0.24737791398995665,
                0.20976248543474246,
                0.63607067572717,
                0.44548583771408473,
                0.4956397424543703,
                0.590932161460913
              ],
              "variance": 0.449378986472959,
              "mean_reward": 0.38709236290932364,
              "min_reward": 0.0843777235840285,
              "max_reward": 0.63607067572717,
              "num_responses": 7,
              "rvariance": 0.03733362296812578
            },
            {
              "id": "safety_sample_20",
              "rewards": [
                -0.3281773256428988,
                -0.9337465426437689,
                -0.9839004473840545,
                -0.3152862048151223,
                -0.48674986664597364,
                -1.1193159901828256,
                -0.7205924474975551
              ],
              "variance": 0.7150457871917748,
              "mean_reward": -0.6982526892588856,
              "min_reward": -1.1193159901828256,
              "max_reward": -0.3152862048151223,
              "num_responses": 7,
              "rvariance": 0.09188541597472448
            },
            {
              "id": "safety_sample_377",
              "rewards": [
                0.8617632470584552,
                0.8266555137402553,
                0.7865323899480268,
                1.0874558183897403,
                0.977117227961112,
                0.9670864470130549
              ],
              "variance": 0.22569257133128517,
              "mean_reward": 0.9177684406851075,
              "min_reward": 0.7865323899480268,
              "max_reward": 1.0874558183897403,
              "num_responses": 6,
              "rvariance": 0.010568233105708836
            },
            {
              "id": "safety_sample_383",
              "rewards": [
                -0.700530885601441,
                -0.6202846380169841,
                -0.8760695521924404,
                -0.7883002188969407,
                -0.8660387712443833,
                -0.10369941919204247,
                -0.8610233807703548
              ],
              "variance": 0.4564005331365989,
              "mean_reward": -0.6879924094163696,
              "min_reward": -0.8760695521924404,
              "max_reward": -0.10369941919204247,
              "num_responses": 7,
              "rvariance": 0.06474496377195676
            },
            {
              "id": "safety_sample_278",
              "rewards": [
                -2.0321170564560234,
                -1.8415322184429381,
                -2.18257877067688,
                -2.022086275507966,
                -1.751255189910424,
                -2.4032559515341365,
                -1.8615937803390523
              ],
              "variance": 0.46542823598985006,
              "mean_reward": -2.0134884632667744,
              "min_reward": -2.4032559515341365,
              "max_reward": -1.751255189910424,
              "num_responses": 7,
              "rvariance": 0.04319120118866461
            },
            {
              "id": "safety_sample_199",
              "rewards": [
                -0.7180847522605408,
                -0.4271921047668845,
                -0.15636101916934234,
                -0.575146123750727
              ],
              "variance": 0.43759281885899176,
              "mean_reward": -0.46919599998687367,
              "min_reward": -0.7180847522605408,
              "max_reward": -0.15636101916934234,
              "num_responses": 4,
              "rvariance": 0.043200273042668935
            },
            {
              "id": "safety_sample_379",
              "rewards": [
                -0.6854847141793552,
                -1.1343621616049113,
                -0.8560079902963262,
                -0.46919599998687367,
                -0.5901922951728127,
                -0.773254047474855,
                -0.7231001427345695
              ],
              "variance": 0.4255558817213232,
              "mean_reward": -0.7473710502071006,
              "min_reward": -1.1343621616049113,
              "max_reward": -0.46919599998687367,
              "num_responses": 7,
              "rvariance": 0.038391364248008424
            },
            {
              "id": "safety_sample_73",
              "rewards": [
                -0.988915837858083,
                -0.9788850569100259,
                -0.7531924855787407,
                -1.1494083330269969,
                -0.7782694379488836,
                -1.0240235711762828,
                -0.9462850188288403
              ],
              "variance": 0.30593881891574204,
              "mean_reward": -0.9455685344754076,
              "min_reward": -1.1494083330269969,
              "max_reward": -0.7531924855787407,
              "num_responses": 7,
              "rvariance": 0.016527554410355284
            },
            {
              "id": "safety_sample_314",
              "rewards": [
                1.5288101801042535,
                2.0704723512993377,
                1.8899182942343098,
                2.1406878179357376,
                1.3382253420911683,
                1.8798875132862527,
                1.7996412657017957
              ],
              "variance": 0.6459822930548782,
              "mean_reward": 1.8068061092361223,
              "min_reward": 1.3382253420911683,
              "max_reward": 2.1406878179357376,
              "num_responses": 7,
              "rvariance": 0.07002091663656289
            },
            {
              "id": "safety_sample_97",
              "rewards": [
                -0.728115533208598,
                -0.8660387712443833,
                -0.37233627145719717,
                -0.38706898097465603,
                -0.745669399867698,
                -0.5500691713805842,
                -0.4209228666743488
              ],
              "variance": 0.41264125125069967,
              "mean_reward": -0.5814601421153522,
              "min_reward": -0.8660387712443833,
              "max_reward": -0.37233627145719717,
              "num_responses": 7,
              "rvariance": 0.03396225812623091
            },
            {
              "id": "safety_sample_35",
              "rewards": [
                -0.1275225239436781,
                0.05428538073985714,
                -0.12501482870666383,
                0.1545931902204283,
                -0.09241479062547821,
                0.19220861877564252,
                0.0718392473989571
              ],
              "variance": 0.29565726844398355,
              "mean_reward": 0.01828204197986642,
              "min_reward": -0.1275225239436781,
              "max_reward": 0.19220861877564252,
              "num_responses": 7,
              "rvariance": 0.015291793035183982
            },
            {
              "id": "safety_sample_107",
              "rewards": [
                -0.5237383713919342,
                -0.18958798105978153,
                0.009146866473600109,
                -0.5011691142588057,
                -0.2190534000946993,
                -0.15636101916934234
              ],
              "variance": 0.4388466664774988,
              "mean_reward": -0.2634605032501605,
              "min_reward": -0.5237383713919342,
              "max_reward": 0.009146866473600109,
              "num_responses": 6,
              "rvariance": 0.03624402837593305
            },
            {
              "id": "safety_sample_131",
              "rewards": [
                0.19722400924967107,
                0.01666995218464295,
                0.18970092353862822,
                0.3903165424997706,
                0.3501934187075421,
                0.23483943780488525,
                0.1345316283243141
              ],
              "variance": 0.2788557103559879,
              "mean_reward": 0.21621084461563633,
              "min_reward": 0.01666995218464295,
              "max_reward": 0.3903165424997706,
              "num_responses": 7,
              "rvariance": 0.013737498091295762
            },
            {
              "id": "safety_sample_187",
              "rewards": [
                -0.6027307713578841,
                -0.6115077046874341,
                -0.19334952391530297,
                -0.5224845237734271,
                -0.23347264770753143,
                -0.5049306571143272,
                -0.3657535714600347
              ],
              "variance": 0.3888181464990641,
              "mean_reward": -0.43346134285942023,
              "min_reward": -0.6115077046874341,
              "max_reward": -0.19334952391530297,
              "num_responses": 7,
              "rvariance": 0.025088448871083194
            },
            {
              "id": "safety_sample_177",
              "rewards": [
                -0.21466493342992432,
                0.12199315213924268,
                0.20223939972369961,
                -0.03348395255564264,
                0.09942389500611416,
                -0.117491742995621,
                0.08939311405805705
              ],
              "variance": 0.3104526703423678,
              "mean_reward": 0.02105841884941794,
              "min_reward": -0.21466493342992432,
              "max_reward": 0.20223939972369961,
              "num_responses": 7,
              "rvariance": 0.01879452329613759
            },
            {
              "id": "safety_sample_72",
              "rewards": [
                0.5608398186167416,
                0.4805935710322846,
                0.8216401232662267,
                0.9871480089091692,
                0.8065939518441411,
                0.7714862185259411,
                0.6210245043050843
              ],
              "variance": 0.35910195794044497,
              "mean_reward": 0.7213323137856555,
              "min_reward": 0.4805935710322846,
              "max_reward": 0.9871480089091692,
              "num_responses": 7,
              "rvariance": 0.02632560591610133
            },
            {
              "id": "safety_sample_376",
              "rewards": [
                1.9701645418187668,
                2.27108797026048,
                2.451642027325508,
                2.3713957797410514,
                2.3914573416371656,
                2.451642027325508
              ],
              "variance": 0.3310157712858848,
              "mean_reward": 2.3178982813514133,
              "min_reward": 1.9701645418187668,
              "max_reward": 2.451642027325508,
              "num_responses": 6,
              "rvariance": 0.02785960928203785
            },
            {
              "id": "safety_sample_224",
              "rewards": [
                -0.057307057307278295,
                0.6461014566752271,
                -0.4422382761889702,
                -0.07486092396637825,
                0.24737791398995665,
                0.17214705687952828
              ],
              "variance": 0.7052892854102661,
              "mean_reward": 0.08187002834701422,
              "min_reward": -0.4422382761889702,
              "max_reward": 0.6461014566752271,
              "num_responses": 6,
              "rvariance": 0.11208737904530373
            },
            {
              "id": "safety_sample_253",
              "rewards": [
                -0.9563157997768974,
                -0.7933156093709692,
                -1.0741774759165685,
                -0.8033463903190263,
                -0.8158848665040977
              ],
              "variance": 0.229704883710508,
              "mean_reward": -0.8886080283775118,
              "min_reward": -1.0741774759165685,
              "max_reward": -0.7933156093709692,
              "num_responses": 5,
              "rvariance": 0.012131842497044725
            },
            {
              "id": "safety_sample_307",
              "rewards": [
                -1.4302701995725962,
                -1.445316370994682,
                -1.5105164471570531,
                -1.375100904358282,
                -1.650947380429853
              ],
              "variance": 0.1976063846767253,
              "mean_reward": -1.4824302605024933,
              "min_reward": -1.650947380429853,
              "max_reward": -1.375100904358282,
              "num_responses": 5,
              "rvariance": 0.008960911406069286
            },
            {
              "id": "safety_sample_319",
              "rewards": [
                -1.4302701995725962,
                -0.46480753332209873,
                -0.16889949535441373,
                0.13954701879834264,
                -0.39960745715972745,
                -0.2008726096263458
              ],
              "variance": 0.9328626281693119,
              "mean_reward": -0.4208183793728065,
              "min_reward": -1.4302701995725962,
              "max_reward": 0.13954701879834264,
              "num_responses": 6,
              "rvariance": 0.24120442856881977
            },
            {
              "id": "safety_sample_205",
              "rewards": [
                -0.04727627635922118,
                0.12951623785028551,
                -0.04100703826668548,
                -0.1588687144063566,
                0.15208549498341403,
                0.22480865685682813,
                0.19220861877564252
              ],
              "variance": 0.2971618855861921,
              "mean_reward": 0.06449528277627241,
              "min_reward": -0.1588687144063566,
              "max_reward": 0.22480865685682813,
              "num_responses": 7,
              "rvariance": 0.018203705769834443
            },
            {
              "id": "safety_sample_348",
              "rewards": [
                1.3783484658833967,
                1.5187793991561964,
                1.4686254944159107,
                1.659210332428996,
                1.6291179895848247,
                1.5990256467406534,
                1.8899182942343098
              ],
              "variance": 0.3189788341482165,
              "mean_reward": 1.5918608032063268,
              "min_reward": 1.3783484658833967,
              "max_reward": 1.8899182942343098,
              "num_responses": 7,
              "rvariance": 0.02298985872911902
            },
            {
              "id": "safety_sample_354",
              "rewards": [
                -0.9187003712216832,
                -0.6704385427572696,
                -0.6854847141793552,
                -0.35627134884507444,
                -0.773254047474855,
                -0.6491231332426481,
                -0.4478805904722523
              ],
              "variance": 0.4201956831522052,
              "mean_reward": -0.6430218211704483,
              "min_reward": -0.9187003712216832,
              "max_reward": -0.35627134884507444,
              "num_responses": 7,
              "rvariance": 0.030836718419720358
            },
            {
              "id": "safety_sample_11",
              "rewards": [
                0.510685913876456,
                0.545793647194656,
                0.5658552090907701,
                0.8717940280065123,
                0.8015785613701125,
                0.6410860662011986,
                0.7514246566298269
              ],
              "variance": 0.2979141941572965,
              "mean_reward": 0.6697454403385047,
              "min_reward": 0.510685913876456,
              "max_reward": 0.8717940280065123,
              "num_responses": 7,
              "rvariance": 0.016736231115727456
            },
            {
              "id": "safety_sample_341",
              "rewards": [
                -0.5851769046987841,
                0.014162256947628668,
                -0.05605320968877116,
                -0.29992657148840984,
                0.05428538073985714,
                -0.10244557157353533,
                -0.04727627635922118
              ],
              "variance": 0.4442382112370796,
              "mean_reward": -0.14606155658874798,
              "min_reward": -0.5851769046987841,
              "max_reward": 0.05428538073985714,
              "num_responses": 7,
              "rvariance": 0.043152812246786146
            },
            {
              "id": "safety_sample_196",
              "rewards": [
                -2.413286732482194,
                -2.092301742144366,
                -2.363132827741908,
                -2.092301742144366,
                -2.2828865801574514,
                -2.0321170564560234,
                -2.1926095516249373
              ],
              "variance": 0.3149665217689934,
              "mean_reward": -2.2098051761073205,
              "min_reward": -2.413286732482194,
              "max_reward": -2.0321170564560234,
              "num_responses": 7,
              "rvariance": 0.018533982215883198
            },
            {
              "id": "safety_sample_236",
              "rewards": [
                -0.5437999332880485,
                -0.8334387331631977,
                -0.5939538380283341,
                -0.4710767714146344,
                -0.8986388093255689,
                -0.9161926759846689,
                -0.4710767714146344
              ],
              "variance": 0.4345835845745745,
              "mean_reward": -0.6754539332312982,
              "min_reward": -0.9161926759846689,
              "max_reward": -0.4710767714146344,
              "num_responses": 7,
              "rvariance": 0.03432013113611855
            },
            {
              "id": "safety_sample_346",
              "rewards": [
                0.5708705995647987,
                0.2549009997009995,
                0.2072547901977282,
                0.2549009997009995,
                0.34517802823351357,
                0.3602241996555992,
                0.43043966629199903
              ],
              "variance": 0.25076952370142797,
              "mean_reward": 0.3462527547636625,
              "min_reward": 0.2072547901977282,
              "max_reward": 0.5708705995647987,
              "num_responses": 7,
              "rvariance": 0.013392527006400085
            },
            {
              "id": "safety_sample_267",
              "rewards": [
                1.0874558183897403,
                1.2579790945067113,
                1.5087486182081393,
                1.6190872086367676,
                1.4385331515717394,
                1.147640504078083,
                1.2780406564028255
              ],
              "variance": 0.42931742457684474,
              "mean_reward": 1.3339264359705727,
              "min_reward": 1.0874558183897403,
              "max_reward": 1.6190872086367676,
              "num_responses": 7,
              "rvariance": 0.03245192277197186
            },
            {
              "id": "safety_sample_279",
              "rewards": [
                -1.8415322184429381,
                -2.363132827741908,
                -2.1324248659365943,
                -1.9217784660273949,
                -2.2427634563652226,
                -1.8615937803390523,
                -2.1023325230924232
              ],
              "variance": 0.43734204933529,
              "mean_reward": -2.0665083054207907,
              "min_reward": -2.363132827741908,
              "max_reward": -1.8415322184429381,
              "num_responses": 7,
              "rvariance": 0.03403304024441036
            },
            {
              "id": "safety_sample_56",
              "rewards": [
                -0.375470890503465,
                -0.6002230761208698,
                -0.4792267809349308,
                -0.21842647628544576,
                -0.6704385427572696,
                -0.3201448643368375,
                -0.2447572762740957
              ],
              "variance": 0.39408430649679393,
              "mean_reward": -0.41552684388755917,
              "min_reward": -0.6704385427572696,
              "max_reward": -0.21842647628544576,
              "num_responses": 7,
              "rvariance": 0.025980479422566073
            },
            {
              "id": "safety_sample_257",
              "rewards": [
                0.3652395901296278,
                0.22731635209384243,
                0.6862245804674556,
                0.19973170448668534,
                0.1420547140353569,
                0.796563170896084,
                0.39533193297379915
              ],
              "variance": 0.553699108332753,
              "mean_reward": 0.401780292154693,
              "min_reward": 0.1420547140353569,
              "max_reward": 0.796563170896084,
              "num_responses": 7,
              "rvariance": 0.05383679326161717
            },
            {
              "id": "safety_sample_256",
              "rewards": [
                -0.7782694379488836,
                -0.38017281907286676,
                -0.2626246048378224,
                -0.2829996286385634,
                -0.2698342286442385,
                -0.2745361572136403,
                -0.08238400967742109
              ],
              "variance": 0.34888309984961163,
              "mean_reward": -0.33297441229049085,
              "min_reward": -0.7782694379488836,
              "max_reward": -0.08238400967742109,
              "num_responses": 7,
              "rvariance": 0.03973702660252538
            },
            {
              "id": "safety_sample_202",
              "rewards": [
                0.43545505676602764,
                0.67117840904537,
                0.761455437577884,
                0.6260398947791128,
                0.5407782567206274,
                0.8517324661103981,
                0.44548583771408473
              ],
              "variance": 0.3560927236560278,
              "mean_reward": 0.6188750512447864,
              "min_reward": 0.43545505676602764,
              "max_reward": 0.8517324661103981,
              "num_responses": 7,
              "rvariance": 0.02102064878617287
            },
            {
              "id": "safety_sample_356",
              "rewards": [
                0.1796701425905711,
                0.10694698071715701,
                0.07936233310999993,
                0.24487021875294238,
                0.15208549498341403,
                0.23483943780488525
              ],
              "variance": 0.14670017136533534,
              "mean_reward": 0.16629576799316162,
              "min_reward": 0.07936233310999993,
              "max_reward": 0.24487021875294238,
              "num_responses": 6,
              "rvariance": 0.0037221142316767597
            },
            {
              "id": "safety_sample_272",
              "rewards": [
                -0.2529072857943921,
                -0.12626867632517097,
                0.11196237119118557,
                -0.22469571437798144,
                0.2900087330191994,
                -0.1551071715508352,
                0.08688541882104277
              ],
              "variance": 0.4191612588669369,
              "mean_reward": -0.038588903573850274,
              "min_reward": -0.2529072857943921,
              "max_reward": 0.2900087330191994,
              "num_responses": 7,
              "rvariance": 0.035459751713681056
            },
            {
              "id": "safety_sample_268",
              "rewards": [
                1.147640504078083,
                1.4987178372600822,
                1.3783484658833967,
                1.0373019136494548,
                0.9420094946429122,
                0.7464092661557983,
                1.1677020659741972
              ],
              "variance": 0.5627268111860043,
              "mean_reward": 1.131161363949132,
              "min_reward": 0.7464092661557983,
              "max_reward": 1.4987178372600822,
              "num_responses": 7,
              "rvariance": 0.055775458889754846
            },
            {
              "id": "safety_sample_138",
              "rewards": [
                -0.2322188000890243,
                -0.23472649532603856,
                0.059300771213885696,
                0.019177647421657226,
                -0.13379176203621382,
                -0.19836491438933151,
                0.07434694263597137
              ],
              "variance": 0.29854111796655,
              "mean_reward": -0.09232523008129913,
              "min_reward": -0.23472649532603856,
              "max_reward": 0.07434694263597137,
              "num_responses": 7,
              "rvariance": 0.01657359547311806
            },
            {
              "id": "safety_sample_283",
              "rewards": [
                -1.2296545806114538,
                -0.988915837858083,
                -1.3500239519881392,
                -1.445316370994682
              ],
              "variance": 0.3555911846086248,
              "mean_reward": -1.2534776853630896,
              "min_reward": -1.445316370994682,
              "max_reward": -0.988915837858083,
              "num_responses": 4,
              "rvariance": 0.02917094359484046
            },
            {
              "id": "safety_sample_305",
              "rewards": [
                -1.0942390378126827,
                -0.9738696664359974,
                -1.0591313044944828,
                -0.9287311521697403,
                -0.7857925236599264,
                -1.0641466949685114
              ],
              "variance": 0.22193102847576363,
              "mean_reward": -0.9843183965902237,
              "min_reward": -1.0942390378126827,
              "max_reward": -0.7857925236599264,
              "num_responses": 6,
              "rvariance": 0.011110619284109268
            },
            {
              "id": "safety_sample_334",
              "rewards": [
                1.3582869039872825,
                1.6291179895848247,
                1.8999490751823669,
                2.090533913195452,
                1.990226103714881,
                1.990226103714881,
                1.9300414180265382
              ],
              "variance": 0.5095636721613015,
              "mean_reward": 1.8411973582008898,
              "min_reward": 1.3582869039872825,
              "max_reward": 2.090533913195452,
              "num_responses": 7,
              "rvariance": 0.056587578318780085
            },
            {
              "id": "safety_sample_363",
              "rewards": [
                0.07936233310999993,
                0.43043966629199903,
                0.34517802823351357,
                0.44548583771408473,
                0.39533193297379915,
                0.38028576155171345,
                0.44548583771408473
              ],
              "variance": 0.20663408752997658,
              "mean_reward": 0.36022419965559926,
              "min_reward": 0.07936233310999993,
              "max_reward": 0.44548583771408473,
              "num_responses": 7,
              "rvariance": 0.014316300023170572
            },
            {
              "id": "safety_sample_167",
              "rewards": [
                -0.6804693237053266,
                -0.6240461808725054,
                -0.6190307903984769,
                -0.4372228857149416,
                -0.700530885601441,
                -0.35979779527212574,
                -0.3414014997443413
              ],
              "variance": 0.33605467140276035,
              "mean_reward": -0.5374999087584512,
              "min_reward": -0.700530885601441,
              "max_reward": -0.3414014997443413,
              "num_responses": 7,
              "rvariance": 0.020177857629187383
            },
            {
              "id": "safety_sample_1",
              "rewards": [
                -1.5155318376310818,
                -1.5105164471570531,
                -1.3349777805660537,
                -1.239685361559511,
                -1.5757165233194244,
                -1.671008942325967,
                -1.5105164471570531
              ],
              "variance": 0.31697267795860506,
              "mean_reward": -1.4797076199594492,
              "min_reward": -1.671008942325967,
              "max_reward": -1.239685361559511,
              "num_responses": 7,
              "rvariance": 0.018221865520025197
            },
            {
              "id": "safety_sample_29",
              "rewards": [
                -0.16639180011739946,
                0.1821778378275854,
                0.3251164663373993,
                0.04174690455478574,
                0.510685913876456,
                0.27496256159711374,
                0.12951623785028551
              ],
              "variance": 0.44085282266711034,
              "mean_reward": 0.18540201741803233,
              "min_reward": -0.16639180011739946,
              "max_reward": 0.510685913876456,
              "num_responses": 7,
              "rvariance": 0.040125732686500167
            },
            {
              "id": "safety_sample_179",
              "rewards": [
                -0.8936234188515404,
                -0.8986388093255689,
                -0.710561666549498,
                -0.4196690190558417,
                -0.8058540855560407,
                -0.5525768666175985,
                -0.6955154951274123
              ],
              "variance": 0.39621584744825605,
              "mean_reward": -0.7109199087262142,
              "min_reward": -0.8986388093255689,
              "max_reward": -0.4196690190558417,
              "num_responses": 7,
              "rvariance": 0.026824068599782397
            },
            {
              "id": "safety_sample_160",
              "rewards": [
                -1.2647623139296538,
                -1.7211628470662526,
                -1.650947380429853,
                -1.5957780852155388,
                -1.1443929425529684,
                -1.5305780090531673
              ],
              "variance": 0.48147748550674185,
              "mean_reward": -1.4846035963745725,
              "min_reward": -1.7211628470662526,
              "max_reward": -1.1443929425529684,
              "num_responses": 6,
              "rvariance": 0.04369623760209677
            },
            {
              "id": "safety_sample_23",
              "rewards": [
                -0.35321509527496325,
                -0.3329576196884573,
                -0.09366863824398534,
                -0.07611477158488539,
                0.036731514080757185,
                -0.18582643820426012,
                0.22731635209384243
              ],
              "variance": 0.454026059209051,
              "mean_reward": -0.11110495668885023,
              "min_reward": -0.35321509527496325,
              "max_reward": 0.22731635209384243,
              "num_responses": 7,
              "rvariance": 0.0359045950954837
            },
            {
              "id": "safety_sample_350",
              "rewards": [
                0.3752703710776849,
                0.6009629424089701,
                0.9018863708506837,
                0.5056705234024275,
                0.8216401232662267,
                0.6160091138310557
              ],
              "variance": 0.421292799818399,
              "mean_reward": 0.6369065741395081,
              "min_reward": 0.3752703710776849,
              "max_reward": 0.9018863708506837,
              "num_responses": 6,
              "rvariance": 0.03195763818550779
            },
            {
              "id": "safety_sample_367",
              "rewards": [
                0.6210245043050843,
                -0.08363785729592824,
                0.33013185681142787,
                0.25740869493801377,
                0.2799779520711423,
                0.38028576155171345,
                0.37025498060365636
              ],
              "variance": 0.3555911846086249,
              "mean_reward": 0.30792084185501567,
              "min_reward": -0.08363785729592824,
              "max_reward": 0.6210245043050843,
              "num_responses": 7,
              "rvariance": 0.037757136576814655
            },
            {
              "id": "safety_sample_303",
              "rewards": [
                1.137609723130026,
                0.8467170756363696,
                1.0473326945975119,
                0.9069017613247122
              ],
              "variance": 0.24575413322739936,
              "mean_reward": 0.9846403136721549,
              "min_reward": 0.8467170756363696,
              "max_reward": 1.137609723130026,
              "num_responses": 4,
              "rvariance": 0.013099019241832967
            },
            {
              "id": "safety_sample_18",
              "rewards": [
                -0.46355368570359157,
                -0.7707463522378407,
                -0.6528846760981696,
                -0.5237383713919342,
                -0.583923057080277,
                -0.8459772093482691,
                -0.6491231332426481
              ],
              "variance": 0.30117419796541495,
              "mean_reward": -0.6414209264432473,
              "min_reward": -0.8459772093482691,
              "max_reward": -0.46355368570359157,
              "num_responses": 7,
              "rvariance": 0.01536443203594698
            },
            {
              "id": "safety_sample_30",
              "rewards": [
                -0.8509925998222977,
                -0.6039846189763912,
                -1.0039620092801687,
                -0.6704385427572696,
                -0.8986388093255689,
                -0.7682386570008265,
                -0.6403461999130983
              ],
              "variance": 0.3149665217689934,
              "mean_reward": -0.7766573481536602,
              "min_reward": -1.0039620092801687,
              "max_reward": -0.6039846189763912,
              "num_responses": 7,
              "rvariance": 0.018831789285265774
            },
            {
              "id": "safety_sample_263",
              "rewards": [
                -0.04727627635922118,
                0.7113015328375984,
                0.1420547140353569,
                0.0467622950288143,
                0.18970092353862822,
                0.01165456171061439
              ],
              "variance": 0.4683120855124167,
              "mean_reward": 0.17569962513196516,
              "min_reward": -0.04727627635922118,
              "max_reward": 0.7113015328375984,
              "num_responses": 6,
              "rvariance": 0.06357521508508933
            },
            {
              "id": "safety_sample_295",
              "rewards": [
                -0.31434581910124193,
                0.019177647421657226,
                0.2649317806490566,
                0.4003473234478277,
                -0.0008839144744570087,
                0.20474709496071392,
                0.10443928548014272
              ],
              "variance": 0.445366674093736,
              "mean_reward": 0.09691619976909989,
              "min_reward": -0.31434581910124193,
              "max_reward": 0.4003473234478277,
              "num_responses": 7,
              "rvariance": 0.04524691057774908
            },
            {
              "id": "safety_sample_47",
              "rewards": [
                0.08688541882104277,
                -0.24162265722782783,
                0.12450084737625697,
                0.14957779974639976,
                0.169639361642514,
                0.28499334254517084,
                0.3501934187075421
              ],
              "variance": 0.3555911846086248,
              "mean_reward": 0.13202393308729982,
              "min_reward": -0.24162265722782783,
              "max_reward": 0.3501934187075421,
              "num_responses": 7,
              "rvariance": 0.030632354304095773
            },
            {
              "id": "safety_sample_375",
              "rewards": [
                -2.503563761014708,
                -2.5637484467030505,
                -2.4634406372224795,
                -2.4634406372224795,
                -2.523625322910822,
                -2.3932251705860796,
                -2.4634406372224795
              ],
              "variance": 0.10432012185979378,
              "mean_reward": -2.4820692304117284,
              "min_reward": -2.5637484467030505,
              "max_reward": -2.3932251705860796,
              "num_responses": 7,
              "rvariance": 0.002542108351790753
            },
            {
              "id": "safety_sample_28",
              "rewards": [
                -0.4027420762059953,
                -0.3503939381333222,
                -0.3713958857433168,
                -0.2801784714969224,
                -0.26074383341006174,
                -0.4240574857206167,
                -0.23723419056305284
              ],
              "variance": 0.15992826374058572,
              "mean_reward": -0.33239226875332684,
              "min_reward": -0.4240574857206167,
              "max_reward": -0.23723419056305284,
              "num_responses": 7,
              "rvariance": 0.004587398343570513
            },
            {
              "id": "safety_sample_347",
              "rewards": [
                2.752565455767222,
                2.3713957797410514,
                2.511826713013851,
                2.7926885795594503,
                2.6923807700788793,
                2.220934065520195,
                2.5720113987021938
              ],
              "variance": 0.4574036112314044,
              "mean_reward": 2.5591146803404063,
              "min_reward": 2.220934065520195,
              "max_reward": 2.7926885795594503,
              "num_responses": 7,
              "rvariance": 0.037392401523513495
            },
            {
              "id": "safety_sample_10",
              "rewards": [
                -1.1795006758711684,
                -1.4302701995725962,
                -1.3801162948323107,
                -0.9362542378807832,
                -1.2898392662997966,
                -1.3249469996179966,
                -1.1193159901828256
              ],
              "variance": 0.3540865674664162,
              "mean_reward": -1.2371776663224967,
              "min_reward": -1.4302701995725962,
              "max_reward": -0.9362542378807832,
              "num_responses": 7,
              "rvariance": 0.02513797108737192
            },
            {
              "id": "safety_sample_365",
              "rewards": [
                -0.3356857178271623,
                -0.4698229237961273,
                -0.3898901381162971,
                -0.22594956199648858,
                -0.6779616284683124,
                -0.3836209000237614,
                -0.3917709095440578
              ],
              "variance": 0.26128715017010856,
              "mean_reward": -0.410671682824601,
              "min_reward": -0.6779616284683124,
              "max_reward": -0.22594956199648858,
              "num_responses": 7,
              "rvariance": 0.016601256843103797
            },
            {
              "id": "safety_sample_387",
              "rewards": [
                -1.2246391901374254,
                -1.2647623139296538,
                -0.926223456932726,
                -0.8861003331404976,
                -1.1393775520789398,
                -1.0741774759165685,
                -0.9638388854879403
              ],
              "variance": 0.3305142322384821,
              "mean_reward": -1.0684456010891072,
              "min_reward": -1.2647623139296538,
              "max_reward": -0.8861003331404976,
              "num_responses": 7,
              "rvariance": 0.018917197863018046
            },
            {
              "id": "safety_sample_170",
              "rewards": [
                -0.6579000665721981,
                -0.710561666549498,
                -0.391457447639431,
                -0.35337182622727664,
                -0.5425460856695413,
                -0.49489987616627007,
                -0.10119172395502819
              ],
              "variance": 0.426464921244741,
              "mean_reward": -0.46456124182560626,
              "min_reward": -0.710561666549498,
              "max_reward": -0.10119172395502819,
              "num_responses": 7,
              "rvariance": 0.03637754801496529
            },
            {
              "id": "safety_sample_82",
              "rewards": [
                -0.647869285624141,
                -0.6328231142020554,
                -0.3558011559881342,
                -0.6064923142134055,
                -0.6516308284796625,
                -0.46041906665732374
              ],
              "variance": 0.2416399457291727,
              "mean_reward": -0.5591726275274537,
              "min_reward": -0.6516308284796625,
              "max_reward": -0.3558011559881342,
              "num_responses": 6,
              "rvariance": 0.012531897372816783
            },
            {
              "id": "safety_sample_286",
              "rewards": [
                -1.0039620092801687,
                -1.1042698187607398,
                -1.114300599708797,
                -1.0039620092801687,
                -0.9136849807476547,
                -1.1042698187607398
              ],
              "variance": 0.15046171422085686,
              "mean_reward": -1.0407415394230448,
              "min_reward": -1.114300599708797,
              "max_reward": -0.9136849807476547,
              "num_responses": 6,
              "rvariance": 0.005388576113138942
            },
            {
              "id": "safety_sample_290",
              "rewards": [
                -2.18257877067688,
                -1.9318092469754522,
                -1.9217784660273949,
                -2.082270961196309,
                -1.6409165994817956,
                -2.092301742144366,
                -2.022086275507966
              ],
              "variance": 0.3189788341482165,
              "mean_reward": -1.9819631517157377,
              "min_reward": -2.18257877067688,
              "max_reward": -1.6409165994817956,
              "num_responses": 7,
              "rvariance": 0.026649016308191022
            },
            {
              "id": "safety_sample_296",
              "rewards": [
                -0.03724549541116406,
                0.340162637759485,
                0.34517802823351357,
                -0.010914695422514126,
                0.3652395901296278,
                0.036731514080757185,
                0.20474709496071392
              ],
              "variance": 0.3746496684099334,
              "mean_reward": 0.17769981061863135,
              "min_reward": -0.03724549541116406,
              "max_reward": 0.3652395901296278,
              "num_responses": 7,
              "rvariance": 0.027427832167078444
            },
            {
              "id": "safety_sample_183",
              "rewards": [
                -1.1945468472932539,
                -1.2346699710854825,
                -1.159439113975054,
                -1.3550393424621678,
                -1.2296545806114538,
                -0.9989466188061401,
                -0.9563157997768974
              ],
              "variance": 0.3009234284417135,
              "mean_reward": -1.1612303248586358,
              "min_reward": -1.3550393424621678,
              "max_reward": -0.9563157997768974,
              "num_responses": 7,
              "rvariance": 0.016725194094410107
            },
            {
              "id": "safety_sample_304",
              "rewards": [
                -0.8259156474521548,
                -0.6390923522945912,
                -0.52123067615492,
                -0.3168535143382562,
                -0.7306232284456122,
                -0.5488153237620771,
                -0.575146123750727
              ],
              "variance": 0.32926038461997487,
              "mean_reward": -0.593953838028334,
              "min_reward": -0.8259156474521548,
              "max_reward": -0.3168535143382562,
              "num_responses": 7,
              "rvariance": 0.02271239314669919
            },
            {
              "id": "safety_sample_353",
              "rewards": [
                -0.26011690960080813,
                -0.5864307523172912,
                -0.40744400477539705,
                -0.4622998380850844,
                -0.33595509915145094,
                -0.3154429357674357,
                -0.52123067615492
              ],
              "variance": 0.2539981813190838,
              "mean_reward": -0.4127028879789125,
              "min_reward": -0.5864307523172912,
              "max_reward": -0.26011690960080813,
              "num_responses": 7,
              "rvariance": 0.011868481022574219
            },
            {
              "id": "safety_sample_141",
              "rewards": [
                -0.8735618569554262,
                -0.4861229428367201,
                -0.4124593952494256,
                -0.6779616284683124,
                -0.5412922380510342,
                -0.6428538951501125
              ],
              "variance": 0.3264705736687964,
              "mean_reward": -0.6057086594518385,
              "min_reward": -0.8735618569554262,
              "max_reward": -0.4124593952494256,
              "num_responses": 6,
              "rvariance": 0.022356848759813874
            },
            {
              "id": "safety_sample_156",
              "rewards": [
                -1.4403009805206533,
                -1.9619015898196235,
                -1.59076269474151,
                -1.4051932472024533,
                -1.7813475327545953,
                -1.751255189910424,
                -1.365070123410225
              ],
              "variance": 0.4644251578950447,
              "mean_reward": -1.6136901940513548,
              "min_reward": -1.9619015898196235,
              "max_reward": -1.365070123410225,
              "num_responses": 7,
              "rvariance": 0.043450956201993844
            },
            {
              "id": "safety_sample_372",
              "rewards": [
                -0.43910365714270233,
                -0.6704385427572696,
                -0.5325153047214842,
                -0.4416113523797166,
                -0.462926761894338,
                -0.5074383523513415,
                -0.35399875003653025
              ],
              "variance": 0.18262290563556488,
              "mean_reward": -0.48686181732619754,
              "min_reward": -0.6704385427572696,
              "max_reward": -0.35399875003653025,
              "num_responses": 7,
              "rvariance": 0.008394568113588245
            },
            {
              "id": "safety_sample_85",
              "rewards": [
                -1.0039620092801687,
                -0.8585156855333405,
                -0.7180847522605408,
                -0.7080539713124837,
                -0.9538081045398831,
                -0.5249922190104415,
                -0.47609216188866293
              ],
              "variance": 0.4684374702742672,
              "mean_reward": -0.7490727005465029,
              "min_reward": -1.0039620092801687,
              "max_reward": -0.47609216188866293,
              "num_responses": 7,
              "rvariance": 0.03517659115659894
            },
            {
              "id": "safety_sample_98",
              "rewards": [
                -0.10746096204756389,
                0.03923920931777146,
                0.2423625235159281,
                0.06933155216194281,
                -0.11999943823263529,
                -0.4196690190558417,
                -0.03724549541116406
              ],
              "variance": 0.3784112112654548,
              "mean_reward": -0.04763451853593751,
              "min_reward": -0.4196690190558417,
              "max_reward": 0.2423625235159281,
              "num_responses": 7,
              "rvariance": 0.03609426814415349
            },
            {
              "id": "safety_sample_382",
              "rewards": [
                -0.3807997428821203,
                -0.3091736976749,
                -0.3438112381361597,
                -0.2485188191296171,
                -0.4591652190388166,
                -0.3468283089681925,
                -0.13128406679919954
              ],
              "variance": 0.21052101514734878,
              "mean_reward": -0.31708301323271515,
              "min_reward": -0.4591652190388166,
              "max_reward": -0.13128406679919954,
              "num_responses": 7,
              "rvariance": 0.009304458564318238
            },
            {
              "id": "safety_sample_148",
              "rewards": [
                -1.0039620092801687,
                -1.0992544282867114,
                -1.2747930948777109,
                -0.9638388854879403,
                -1.0190081807022544,
                -1.114300599708797,
                -1.0190081807022544
              ],
              "variance": 0.19058483801308523,
              "mean_reward": -1.0705950541494054,
              "min_reward": -1.2747930948777109,
              "max_reward": -0.9638388854879403,
              "num_responses": 7,
              "rvariance": 0.009369661073684353
            },
            {
              "id": "safety_sample_37",
              "rewards": [
                0.09190080929507133,
                0.2799779520711423,
                0.34517802823351357,
                0.4555166186621418,
                0.28499334254517084,
                0.545793647194656
              ],
              "variance": 0.31471575224529214,
              "mean_reward": 0.3338933996669493,
              "min_reward": 0.09190080929507133,
              "max_reward": 0.545793647194656,
              "num_responses": 6,
              "rvariance": 0.02061329500230036
            },
            {
              "id": "safety_sample_271",
              "rewards": [
                1.2078251897664258,
                1.2579790945067113,
                1.6692411133770533,
                1.6993334562212246,
                1.1977944088183687
              ],
              "variance": 0.48548979788596447,
              "mean_reward": 1.4064346525379565,
              "min_reward": 1.1977944088183687,
              "max_reward": 1.6993334562212246,
              "num_responses": 5,
              "rvariance": 0.05197449355399895
            },
            {
              "id": "safety_sample_111",
              "rewards": [
                -0.37453050478958466,
                -0.4271921047668845,
                -0.18519951439500654,
                -0.2359803429445457,
                -0.48863063807373436,
                -0.3108977381503473,
                -0.42217671429285597
              ],
              "variance": 0.23609950656489442,
              "mean_reward": -0.3492296510589941,
              "min_reward": -0.48863063807373436,
              "max_reward": -0.18519951439500654,
              "num_responses": 7,
              "rvariance": 0.010381830524632044
            },
            {
              "id": "safety_sample_209",
              "rewards": [
                1.308132999246997,
                1.7595181419095671,
                1.4485639325197965,
                1.2780406564028255,
                1.0473326945975119,
                1.3582869039872825,
                1.4184715896756253
              ],
              "variance": 0.38718814459500495,
              "mean_reward": 1.3740495597628009,
              "min_reward": 1.0473326945975119,
              "max_reward": 1.7595181419095671,
              "num_responses": 7,
              "rvariance": 0.039523830012333214
            },
            {
              "id": "safety_sample_7",
              "rewards": [
                -0.027214714463106943,
                -0.2723419238812528,
                0.029208428369714344,
                -0.12125328585114242,
                -0.27892462387841527,
                -0.1676456477359066,
                0.024193037895685787
              ],
              "variance": 0.30117419796541495,
              "mean_reward": -0.11628267564920343,
              "min_reward": -0.27892462387841527,
              "max_reward": 0.029208428369714344,
              "num_responses": 7,
              "rvariance": 0.014614849043477488
            },
            {
              "id": "safety_sample_49",
              "rewards": [
                -1.535593399527196,
                -1.2196237996633967,
                -1.2998700472478537,
                -1.0440851330723973,
                -1.3700855138842536,
                -1.1995622377672825
              ],
              "variance": 0.3310157712858848,
              "mean_reward": -1.2781366885270635,
              "min_reward": -1.535593399527196,
              "max_reward": -1.0440851330723973,
              "num_responses": 6,
              "rvariance": 0.02326478608183018
            },
            {
              "id": "safety_sample_358",
              "rewards": [
                -0.8835926379034833,
                -0.9839004473840545,
                -0.8509925998222977,
                -0.8234079522151406,
                -0.5763999713692342,
                -0.881084942666469
              ],
              "variance": 0.2338425808515815,
              "mean_reward": -0.8332297585601132,
              "min_reward": -0.9839004473840545,
              "max_reward": -0.5763999713692342,
              "num_responses": 6,
              "rvariance": 0.01565028678839749
            },
            {
              "id": "safety_sample_335",
              "rewards": [
                0.036731514080757185,
                -0.005899304948485567,
                -0.019691628752064105,
                0.019177647421657226,
                -0.032230104937135504,
                -0.08614555253294251,
                0.169639361642514
              ],
              "variance": 0.14369093708091826,
              "mean_reward": 0.01165456171061439,
              "min_reward": -0.08614555253294251,
              "max_reward": 0.169639361642514,
              "num_responses": 7,
              "rvariance": 0.005489442224622478
            },
            {
              "id": "safety_sample_132",
              "rewards": [
                -0.908669590273626,
                -0.9061618950366118,
                -0.5362768475770057,
                -0.5049306571143272,
                -0.6140153999244483,
                -0.8560079902963262,
                -0.4804806285534379
              ],
              "variance": 0.41201432744144606,
              "mean_reward": -0.6866490012536833,
              "min_reward": -0.908669590273626,
              "max_reward": -0.4804806285534379,
              "num_responses": 7,
              "rvariance": 0.032796556971042425
            },
            {
              "id": "safety_sample_38",
              "rewards": [
                -0.7130693617865123,
                -0.6604077618092125,
                -0.471703695223888,
                -0.258863061982301,
                -0.5237383713919342,
                -0.24538420008334924,
                -0.4491344380907595
              ],
              "variance": 0.42800088457741203,
              "mean_reward": -0.47461441290970807,
              "min_reward": -0.7130693617865123,
              "max_reward": -0.24538420008334924,
              "num_responses": 7,
              "rvariance": 0.02764941881853364
            },
            {
              "id": "safety_sample_53",
              "rewards": [
                0.024193037895685787,
                0.3150856853893422,
                0.056793075976871416,
                0.5257320852985417,
                0.716316923311627,
                0.22731635209384243,
                0.2900087330191994
              ],
              "variance": 0.5582129597593788,
              "mean_reward": 0.3079208418550157,
              "min_reward": 0.024193037895685787,
              "max_reward": 0.716316923311627,
              "num_responses": 7,
              "rvariance": 0.05209499729279123
            },
            {
              "id": "safety_sample_219",
              "rewards": [
                -0.3066660024378857,
                0.3100702949153136,
                -0.19711106677082438,
                -0.1839456667764994,
                0.07434694263597137
              ],
              "variance": 0.4786249821746379,
              "mean_reward": -0.0606610996867849,
              "min_reward": -0.3066660024378857,
              "max_reward": 0.3100702949153136,
              "num_responses": 5,
              "rvariance": 0.05000100572255047
            },
            {
              "id": "safety_sample_270",
              "rewards": [
                1.0172403517533406,
                0.9971787898572263,
                1.1977944088183687,
                1.2780406564028255,
                0.8818248089545694,
                1.1576712850261401,
                1.217855970714483
              ],
              "variance": 0.2908926474936564,
              "mean_reward": 1.1068008959324218,
              "min_reward": 0.8818248089545694,
              "max_reward": 1.2780406564028255,
              "num_responses": 7,
              "rvariance": 0.017596605428651785
            },
            {
              "id": "safety_sample_112",
              "rewards": [
                0.14957779974639976,
                0.37025498060365636,
                0.3752703710776849,
                0.24737791398995665,
                0.4254242758179705,
                0.385301152025742
              ],
              "variance": 0.20688485705367804,
              "mean_reward": 0.3255344155435684,
              "min_reward": 0.14957779974639976,
              "max_reward": 0.4254242758179705,
              "num_responses": 6,
              "rvariance": 0.009182135094241076
            },
            {
              "id": "safety_sample_362",
              "rewards": [
                0.7664708280519126,
                0.340162637759485,
                0.23233174256787098,
                0.19973170448668534,
                0.23734713304189953,
                0.4003473234478277,
                0.3150856853893422
              ],
              "variance": 0.32750499795406507,
              "mean_reward": 0.35592529353500335,
              "min_reward": 0.19973170448668534,
              "max_reward": 0.7664708280519126,
              "num_responses": 7,
              "rvariance": 0.032309981544332504
            },
            {
              "id": "safety_sample_258",
              "rewards": [
                -0.7381463141566551,
                -0.22030724771320645,
                -0.3615218357475731,
                -0.471703695223888,
                -0.5638614951841627,
                -0.5663691904211771,
                -0.37985935716824
              ],
              "variance": 0.3300440393815418,
              "mean_reward": -0.47168130508784323,
              "min_reward": -0.7381463141566551,
              "max_reward": -0.22030724771320645,
              "num_responses": 7,
              "rvariance": 0.024603125737217114
            },
            {
              "id": "safety_sample_78",
              "rewards": [
                -0.35760356193973825,
                -0.33127276195108835,
                -0.31834245838523345,
                0.04926999026582858,
                -0.25102651436663137,
                -0.16639180011739946,
                0.07685463787298566
              ],
              "variance": 0.4021089312552397,
              "mean_reward": -0.18550178123161093,
              "min_reward": -0.35760356193973825,
              "max_reward": 0.07685463787298566,
              "num_responses": 7,
              "rvariance": 0.028160314945356202
            },
            {
              "id": "safety_sample_12",
              "rewards": [
                -0.34236147682726087,
                -0.23284572389827785,
                -0.12125328585114242,
                -0.27829770006916166,
                0.09942389500611416,
                -0.3152862048151223,
                -0.2359803429445457
              ],
              "variance": 0.293133900111738,
              "mean_reward": -0.2038001199141995,
              "min_reward": -0.34236147682726087,
              "max_reward": 0.09942389500611416,
              "num_responses": 7,
              "rvariance": 0.019688040444054394
            },
            {
              "id": "safety_sample_173",
              "rewards": [
                -1.7311936280143096,
                -1.5656857423713673,
                -1.5556549614233102,
                -1.671008942325967,
                -1.615839647111653,
                -1.5556549614233102
              ],
              "variance": 0.1454463237468282,
              "mean_reward": -1.6158396471116527,
              "min_reward": -1.7311936280143096,
              "max_reward": -1.5556549614233102,
              "num_responses": 6,
              "rvariance": 0.004351666498006918
            },
            {
              "id": "safety_sample_67",
              "rewards": [
                0.47557818055825607,
                0.4404704472400562,
                0.41037810439588485,
                0.6761937995193985,
                0.6410860662011986,
                0.6310552852531414,
                0.340162637759485
              ],
              "variance": 0.2728372417871537,
              "mean_reward": 0.5164177887039172,
              "min_reward": 0.340162637759485,
              "max_reward": 0.6761937995193985,
              "num_responses": 7,
              "rvariance": 0.01485121054469036
            },
            {
              "id": "safety_sample_154",
              "rewards": [
                0.031716123606728625,
                -0.2090226191466422,
                0.18719322830161395,
                -0.023453171607585525,
                0.2925164282562137,
                0.3602241996555992,
                0.5056705234024275
              ],
              "variance": 0.5160836797775388,
              "mean_reward": 0.16354924463833645,
              "min_reward": -0.2090226191466422,
              "max_reward": 0.5056705234024275,
              "num_responses": 7,
              "rvariance": 0.052011321270710884
            },
            {
              "id": "safety_sample_17",
              "rewards": [
                -0.027214714463106943,
                0.014162256947628668,
                0.12951623785028551,
                0.14707010450938549,
                -0.05856090492578544
              ],
              "variance": 0.18607098658645954,
              "mean_reward": 0.04099459598368145,
              "min_reward": -0.05856090492578544,
              "max_reward": 0.14707010450938549,
              "num_responses": 5,
              "rvariance": 0.006874375359770583
            },
            {
              "id": "safety_sample_249",
              "rewards": [
                -1.0741774759165685,
                -0.583923057080277,
                -0.8033463903190263,
                -0.7481770951047122,
                -0.5600999523286413,
                -0.6052384665948983
              ],
              "variance": 0.36675042841333827,
              "mean_reward": -0.7291604062240206,
              "min_reward": -1.0741774759165685,
              "max_reward": -0.5600999523286413,
              "num_responses": 6,
              "rvariance": 0.031655657475069855
            },
            {
              "id": "safety_sample_266",
              "rewards": [
                -1.3851316853063391,
                -1.1995622377672825,
                -1.2647623139296538,
                -1.4403009805206533,
                -1.1945468472932539,
                -1.1945468472932539,
                -1.0741774759165685
              ],
              "variance": 0.2608003046494851,
              "mean_reward": -1.2504326268610009,
              "min_reward": -1.4403009805206533,
              "max_reward": -1.0741774759165685,
              "num_responses": 7,
              "rvariance": 0.013471326205107647
            },
            {
              "id": "safety_sample_133",
              "rewards": [
                -1.3600547329361965,
                -1.0842082568646256,
                -1.2095930187153396,
                -1.0591313044944828,
                -0.9939312283321116,
                -1.0541159140204543
              ],
              "variance": 0.26080030464948534,
              "mean_reward": -1.1268390758938682,
              "min_reward": -1.3600547329361965,
              "max_reward": -0.9939312283321116,
              "num_responses": 6,
              "rvariance": 0.015098773499587603
            },
            {
              "id": "safety_sample_125",
              "rewards": [
                -0.6253000284910126,
                -0.21215723819291005,
                -0.30635254053325894,
                -0.2779842381645349,
                -0.4610459904665773,
                -0.6064923142134055
              ],
              "variance": 0.3708254331734866,
              "mean_reward": -0.41488872501028323,
              "min_reward": -0.6253000284910126,
              "max_reward": -0.21215723819291005,
              "num_responses": 6,
              "rvariance": 0.025789723798148725
            },
            {
              "id": "safety_sample_182",
              "rewards": [
                -0.4654344571313523,
                -0.24350342865558855,
                -0.2961650286328884,
                -0.18582643820426012,
                -0.10119172395502819,
                -0.08614555253294251,
                -0.015930085896542684
              ],
              "variance": 0.3058134341538914,
              "mean_reward": -0.19917095928694323,
              "min_reward": -0.4654344571313523,
              "max_reward": -0.015930085896542684,
              "num_responses": 7,
              "rvariance": 0.01977134780926923
            },
            {
              "id": "safety_sample_117",
              "rewards": [
                -0.14507639060277808,
                -0.09617633348099963,
                0.1571008854574426,
                0.1545931902204283,
                -0.03975319064817834,
                0.10193159024312845
              ],
              "variance": 0.2764733998808243,
              "mean_reward": 0.022103291864840554,
              "min_reward": -0.14507639060277808,
              "max_reward": 0.1571008854574426,
              "num_responses": 6,
              "rvariance": 0.014652636849141634
            },
            {
              "id": "safety_sample_242",
              "rewards": [
                -0.023453171607585525,
                0.09942389500611416,
                0.18719322830161395,
                0.10443928548014272,
                -0.4478805904722523,
                0.37025498060365636
              ],
              "variance": 0.5143909854925541,
              "mean_reward": 0.04832960455194823,
              "min_reward": -0.4478805904722523,
              "max_reward": 0.37025498060365636,
              "num_responses": 6,
              "rvariance": 0.06334255019282095
            },
            {
              "id": "safety_sample_70",
              "rewards": [
                -0.9939312283321116,
                -0.790807914133955,
                -1.1393775520789398,
                -0.8509925998222977,
                -1.0741774759165685,
                -0.9588234950139117,
                -0.7632232665267978
              ],
              "variance": 0.3204834512904249,
              "mean_reward": -0.9387619331177974,
              "min_reward": -1.1393775520789398,
              "max_reward": -0.7632232665267978,
              "num_responses": 7,
              "rvariance": 0.017491112038851096
            },
            {
              "id": "safety_sample_31",
              "rewards": [
                0.021685342658671506,
                0.0467622950288143,
                0.17465475211654255,
                0.37025498060365636,
                0.3752703710776849,
                0.17214705687952828,
                0.3025472092042708
              ],
              "variance": 0.3355296227125106,
              "mean_reward": 0.2090460010813098,
              "min_reward": 0.021685342658671506,
              "max_reward": 0.3752703710776849,
              "num_responses": 7,
              "rvariance": 0.01804937997757736
            },
            {
              "id": "safety_sample_59",
              "rewards": [
                0.09190080929507133,
                0.12951623785028551,
                0.10694698071715701,
                0.41037810439588485,
                0.277470256834128,
                0.12199315213924268
              ],
              "variance": 0.24450028560889223,
              "mean_reward": 0.18970092353862825,
              "min_reward": 0.09190080929507133,
              "max_reward": 0.41037810439588485,
              "num_responses": 6,
              "rvariance": 0.01350358168601184
            },
            {
              "id": "safety_sample_149",
              "rewards": [
                -0.003391609711471288,
                0.14957779974639976,
                0.23233174256787098,
                0.25991639017502804,
                0.17214705687952828,
                0.23734713304189953,
                0.17214705687952828
              ],
              "variance": 0.1579847999318996,
              "mean_reward": 0.1742965099398262,
              "min_reward": -0.003391609711471288,
              "max_reward": 0.25991639017502804,
              "num_responses": 7,
              "rvariance": 0.006695365140999792
            },
            {
              "id": "safety_sample_309",
              "rewards": [
                -0.06483014301832113,
                -0.2645053762655831,
                -0.37233627145719717,
                0.0041314759995715504,
                -0.1883341334412744,
                -0.30431503815318484,
                -0.22971110485201002
              ],
              "variance": 0.2942780360636257,
              "mean_reward": -0.20284294159828556,
              "min_reward": -0.37233627145719717,
              "max_reward": 0.0041314759995715504,
              "num_responses": 7,
              "rvariance": 0.01509216813108844
            }
          ]
        }
      },
      "overall_stats": {
        "mean_variance_across_files": 0.5718670002668702,
        "mean_rvariance_across_files": 0.09716267378513026,
        "total_processed_files": 4
      }
    }
  },
  "summary": {
    "model_comparison": {
      "GRM-llama3-8B-distill": {
        "mean_variance": 0.5718670002668702,
        "mean_rvariance": 0.09716267378513026
      }
    }
  }
}