{
  "models": {
    "GRM-gemma2-2B-rewardmodel-ft": {
      "model_name": "GRM-gemma2-2B-rewardmodel-ft",
      "model_path": "Ray2333/GRM-gemma2-2B-rewardmodel-ft",
      "files": {
        "semantic_benchmark_chat_filtered.json": {
          "file_name": "semantic_benchmark_chat_filtered.json",
          "processed_samples": 200,
          "global_mean": 1.1715457217555982,
          "global_std": 5.179184615488683,
          "mean_variance": 0.5396229330877378,
          "mean_rvariance": 0.08727506334071837,
          "sample_results": [
            {
              "id": "chat_sample_306",
              "variance": 0.6613010066791823,
              "mean_reward": 0.9206442278272872,
              "min_reward": 0.31985329761953174,
              "max_reward": 1.2400029647598172,
              "num_responses": 7,
              "rvariance": 0.09544818860450174
            },
            {
              "id": "chat_sample_202",
              "variance": 0.7008221891038963,
              "mean_reward": -0.2902037767772244,
              "min_reward": -0.6214145586026621,
              "max_reward": 0.18711039481896594,
              "num_responses": 7,
              "rvariance": 0.09260208426152158
            },
            {
              "id": "chat_sample_298",
              "variance": 0.5701911052115212,
              "mean_reward": 0.10091370468872841,
              "min_reward": -0.7632081138669028,
              "max_reward": 0.3500221391651149,
              "num_responses": 7,
              "rvariance": 0.12978570148112117
            },
            {
              "id": "chat_sample_268",
              "variance": 0.2532674247751704,
              "mean_reward": -0.24155651978497159,
              "min_reward": -0.5444840126614251,
              "max_reward": -0.11834912583006331,
              "num_responses": 7,
              "rvariance": 0.017869903925251417
            },
            {
              "id": "chat_sample_303",
              "variance": 0.29203438616124444,
              "mean_reward": -1.257977115214466,
              "min_reward": -1.565699298979414,
              "max_reward": -1.0709302976318509,
              "num_responses": 7,
              "rvariance": 0.02160457421052111
            },
            {
              "id": "chat_sample_65",
              "variance": 0.9890854700719429,
              "mean_reward": 0.2799873284342968,
              "min_reward": -0.3747842789675199,
              "max_reward": 0.7210988901757873,
              "num_responses": 7,
              "rvariance": 0.1766596561968308
            },
            {
              "id": "chat_sample_212",
              "variance": 0.9835042343860103,
              "mean_reward": 1.4714410777595053,
              "min_reward": 0.4827650419656806,
              "max_reward": 2.163169516054661,
              "num_responses": 7,
              "rvariance": 0.23184275890750156
            },
            {
              "id": "chat_sample_262",
              "variance": 0.9955717710042434,
              "mean_reward": 0.06632728277397057,
              "min_reward": -0.6666678209210368,
              "max_reward": 0.6004235239934548,
              "num_responses": 7,
              "rvariance": 0.18275349575997238
            },
            {
              "id": "chat_sample_178",
              "variance": 0.9907447563569503,
              "mean_reward": -0.38491239005782285,
              "min_reward": -0.8929341325129103,
              "max_reward": 0.2715831511465987,
              "num_responses": 7,
              "rvariance": 0.18935725654664579
            },
            {
              "id": "chat_sample_290",
              "variance": 0.5020095233185033,
              "mean_reward": 0.7310115095407647,
              "min_reward": 0.3862247490198146,
              "max_reward": 0.9624496225404524,
              "num_responses": 7,
              "rvariance": 0.040901802482161534
            },
            {
              "id": "chat_sample_292",
              "variance": 0.41995027431451726,
              "mean_reward": 0.6732597271535055,
              "min_reward": 0.3952754014834895,
              "max_reward": 0.920213244376636,
              "num_responses": 7,
              "rvariance": 0.035523320031168946
            },
            {
              "id": "chat_sample_116",
              "variance": 0.8196874247934938,
              "mean_reward": -0.43485259740202914,
              "min_reward": -1.2640108835235828,
              "max_reward": -0.008987075227324446,
              "num_responses": 7,
              "rvariance": 0.15719302109852645
            },
            {
              "id": "chat_sample_106",
              "variance": 0.5038196538112383,
              "mean_reward": 0.6205360850238436,
              "min_reward": 0.28666757191939024,
              "max_reward": 0.8779768662128197,
              "num_responses": 6,
              "rvariance": 0.046960159259337136
            },
            {
              "id": "chat_sample_251",
              "variance": 0.6803073768528998,
              "mean_reward": -0.26602156472584293,
              "min_reward": -0.841647101885419,
              "max_reward": 0.2685662669920404,
              "num_responses": 7,
              "rvariance": 0.09996650159876072
            },
            {
              "id": "chat_sample_280",
              "variance": 0.23130073702479276,
              "mean_reward": -0.3866969309081755,
              "min_reward": -0.5957710432889165,
              "max_reward": -0.22398721005451924,
              "num_responses": 7,
              "rvariance": 0.011523340964555746
            },
            {
              "id": "chat_sample_58",
              "variance": 0.2964088681853544,
              "mean_reward": -0.02277854564816244,
              "min_reward": -0.1771783668439504,
              "max_reward": 0.25951561452836547,
              "num_responses": 7,
              "rvariance": 0.019085012627205442
            },
            {
              "id": "chat_sample_90",
              "variance": 0.5752820972223384,
              "mean_reward": -0.40551878629208277,
              "min_reward": -0.7119210832394115,
              "max_reward": -0.010495517304603604,
              "num_responses": 6,
              "rvariance": 0.059501822403668365
            },
            {
              "id": "chat_sample_180",
              "variance": 0.4827014647293302,
              "mean_reward": -1.535530457433831,
              "min_reward": -1.7648136531802627,
              "max_reward": -1.2217745053597664,
              "num_responses": 5,
              "rvariance": 0.0462652022982936
            },
            {
              "id": "chat_sample_291",
              "variance": 0.17196239680982384,
              "mean_reward": -1.3897143899635125,
              "min_reward": -1.4932940792700147,
              "max_reward": -1.2579771152144663,
              "num_responses": 6,
              "rvariance": 0.005915022213538262
            },
            {
              "id": "chat_sample_129",
              "variance": 0.32371166978410704,
              "mean_reward": -0.7494166434460648,
              "min_reward": -0.9291367423676101,
              "max_reward": -0.5203489394249586,
              "num_responses": 7,
              "rvariance": 0.0189185835528827
            },
            {
              "id": "chat_sample_31",
              "variance": 0.47327370174633543,
              "mean_reward": -0.28902306169887787,
              "min_reward": -0.5475008968159835,
              "max_reward": 0.013639555931862904,
              "num_responses": 6,
              "rvariance": 0.04092606284786766
            },
            {
              "id": "chat_sample_294",
              "variance": 0.21208695606544947,
              "mean_reward": -0.659664339847955,
              "min_reward": -0.8114782603398358,
              "max_reward": -0.3129381537990745,
              "num_responses": 7,
              "rvariance": 0.02159526365544253
            },
            {
              "id": "chat_sample_128",
              "variance": 0.24859125433560503,
              "mean_reward": -1.2631489166222802,
              "min_reward": -1.4148550912514986,
              "max_reward": -1.1192004441047838,
              "num_responses": 7,
              "rvariance": 0.01125922407270917
            },
            {
              "id": "chat_sample_173",
              "variance": 0.5828620186606662,
              "mean_reward": 0.2458318899701902,
              "min_reward": -0.09723093674815511,
              "max_reward": 0.6969638169393209,
              "num_responses": 7,
              "rvariance": 0.061598655618373556
            },
            {
              "id": "chat_sample_174",
              "variance": 0.43503469508730885,
              "mean_reward": -1.0709302976318509,
              "min_reward": -1.3484836398512157,
              "max_reward": -0.7903600712579276,
              "num_responses": 7,
              "rvariance": 0.034146565233311624
            },
            {
              "id": "chat_sample_297",
              "variance": 0.6994645912343449,
              "mean_reward": 0.3377929837528874,
              "min_reward": -0.28012953861825285,
              "max_reward": 0.6245585972299214,
              "num_responses": 7,
              "rvariance": 0.0997976283404758
            },
            {
              "id": "chat_sample_264",
              "variance": 0.45132586952192333,
              "mean_reward": -1.5294966891247141,
              "min_reward": -1.7708474214893792,
              "max_reward": -1.2036732004324167,
              "num_responses": 5,
              "rvariance": 0.04188187655331832
            },
            {
              "id": "chat_sample_275",
              "variance": 0.21872410120547764,
              "mean_reward": -0.5563360575543327,
              "min_reward": -0.7239886198576447,
              "max_reward": -0.44643527763827995,
              "num_responses": 7,
              "rvariance": 0.009087566123552519
            },
            {
              "id": "chat_sample_172",
              "variance": 0.24617774701195816,
              "mean_reward": -1.0748091486877114,
              "min_reward": -1.2881459567600493,
              "max_reward": -0.8808665958946771,
              "num_responses": 7,
              "rvariance": 0.013945493350449686
            },
            {
              "id": "chat_sample_145",
              "variance": 1.2121840533015305,
              "mean_reward": 0.09013911842244866,
              "min_reward": -1.3062472616873992,
              "max_reward": 0.8779768662128197,
              "num_responses": 7,
              "rvariance": 0.4015944708211883
            },
            {
              "id": "chat_sample_270",
              "variance": 0.23954060187193016,
              "mean_reward": 0.6180938454701536,
              "min_reward": 0.45561308457465577,
              "max_reward": 0.82367295143077,
              "num_responses": 7,
              "rvariance": 0.01166155150014562
            },
            {
              "id": "chat_sample_278",
              "variance": 0.3080238721804038,
              "mean_reward": -0.6058991543792194,
              "min_reward": -0.7632081138669028,
              "max_reward": -0.35743719507880967,
              "num_responses": 7,
              "rvariance": 0.01881085044673628
            },
            {
              "id": "chat_sample_165",
              "variance": 0.7650818215959881,
              "mean_reward": -0.11312345149091764,
              "min_reward": -1.1192004441047838,
              "max_reward": 0.28666757191939024,
              "num_responses": 7,
              "rvariance": 0.19242957138960612
            },
            {
              "id": "chat_sample_127",
              "variance": 0.588292410138871,
              "mean_reward": 0.7230383157037178,
              "min_reward": 0.13733180626875374,
              "max_reward": 1.1917328182868843,
              "num_responses": 7,
              "rvariance": 0.0868075291247221
            },
            {
              "id": "chat_sample_256",
              "variance": 0.40309343410092263,
              "mean_reward": 0.027188598161709616,
              "min_reward": -0.27937531757961326,
              "max_reward": 0.19012727897352424,
              "num_responses": 7,
              "rvariance": 0.029880057060957692
            },
            {
              "id": "chat_sample_114",
              "variance": 0.2721229507411599,
              "mean_reward": -0.537696023313669,
              "min_reward": -0.7028704307757365,
              "max_reward": -0.41852909920861553,
              "num_responses": 7,
              "rvariance": 0.012562307071902154
            },
            {
              "id": "chat_sample_119",
              "variance": 0.6477250279836699,
              "mean_reward": -0.24829063620139638,
              "min_reward": -0.630465211066337,
              "max_reward": 0.08151944940942496,
              "num_responses": 7,
              "rvariance": 0.071246062400418
            },
            {
              "id": "chat_sample_179",
              "variance": 0.36564635953246727,
              "mean_reward": -1.7036140031877942,
              "min_reward": -1.9156578609081785,
              "max_reward": -1.5174291525064811,
              "num_responses": 7,
              "rvariance": 0.026196233493175364
            },
            {
              "id": "chat_sample_191",
              "variance": 1.6104127617032278,
              "mean_reward": 1.2742661490865868,
              "min_reward": -0.4268255306336509,
              "max_reward": 2.114899369581728,
              "num_responses": 7,
              "rvariance": 0.6421995533197211
            },
            {
              "id": "chat_sample_156",
              "variance": 0.880930173131028,
              "mean_reward": 2.1088656012726115,
              "min_reward": 1.1736315133595343,
              "max_reward": 2.6579385174022248,
              "num_responses": 6,
              "rvariance": 0.21051370902017097
            },
            {
              "id": "chat_sample_166",
              "variance": 0.4899419867002699,
              "mean_reward": -1.7639516862789606,
              "min_reward": -2.096670910181677,
              "max_reward": -1.487260310960898,
              "num_responses": 7,
              "rvariance": 0.040342704810608566
            },
            {
              "id": "chat_sample_245",
              "variance": 0.6154443675298957,
              "mean_reward": -1.4609703204711757,
              "min_reward": -1.8070500313440792,
              "max_reward": -0.9653393522223098,
              "num_responses": 7,
              "rvariance": 0.0697720459685849
            },
            {
              "id": "chat_sample_161",
              "variance": 1.0498756857862932,
              "mean_reward": 2.3200474920916934,
              "min_reward": 1.4149822457241994,
              "max_reward": 3.152707518749788,
              "num_responses": 7,
              "rvariance": 0.2443178811057873
            },
            {
              "id": "chat_sample_296",
              "variance": 0.7536176618086665,
              "mean_reward": -1.5913428142931598,
              "min_reward": -2.096670910181677,
              "max_reward": -1.1131666757956673,
              "num_responses": 4,
              "rvariance": 0.12699220990075466
            },
            {
              "id": "chat_sample_130",
              "variance": 0.5732079893660798,
              "mean_reward": 0.9977902654938499,
              "min_reward": 0.4857819261202389,
              "max_reward": 1.3305094893965668,
              "num_responses": 7,
              "rvariance": 0.0665864894678762
            },
            {
              "id": "chat_sample_18",
              "variance": 0.38857467910711097,
              "mean_reward": 1.48049173022318,
              "min_reward": 1.1494964401230678,
              "max_reward": 1.813210954125897,
              "num_responses": 7,
              "rvariance": 0.03565148527813626
            },
            {
              "id": "chat_sample_44",
              "variance": 0.7964574168033947,
              "mean_reward": 0.3866557324704658,
              "min_reward": -0.7058873149302949,
              "max_reward": 0.8055716465034202,
              "num_responses": 7,
              "rvariance": 0.22016077526653496
            },
            {
              "id": "chat_sample_215",
              "variance": 0.12067536618233232,
              "mean_reward": -1.2660221396266216,
              "min_reward": -1.3726187130876821,
              "max_reward": -1.1795381271959502,
              "num_responses": 6,
              "rvariance": 0.0034666945029935285
            },
            {
              "id": "chat_sample_300",
              "variance": 0.15687797603703224,
              "mean_reward": -0.9366789527540057,
              "min_reward": -1.0226601511589177,
              "max_reward": -0.8205289128035108,
              "num_responses": 6,
              "rvariance": 0.004935337178598068
            },
            {
              "id": "chat_sample_169",
              "variance": 0.3559923302378811,
              "mean_reward": -1.0095869864891653,
              "min_reward": -1.2821121884509328,
              "max_reward": -0.8114782603398358,
              "num_responses": 6,
              "rvariance": 0.02513758029781514
            },
            {
              "id": "chat_sample_82",
              "variance": 0.7434168222610664,
              "mean_reward": -0.035398279812542545,
              "min_reward": -0.6455496318391286,
              "max_reward": 0.37114032824702303,
              "num_responses": 7,
              "rvariance": 0.11254548878186008
            },
            {
              "id": "chat_sample_77",
              "variance": 0.377110519319789,
              "mean_reward": -1.129256724619978,
              "min_reward": -1.360551176469449,
              "max_reward": -0.9291367423676101,
              "num_responses": 6,
              "rvariance": 0.02501622576445479
            },
            {
              "id": "chat_sample_277",
              "variance": 0.17256577364073555,
              "mean_reward": -1.0998923855156106,
              "min_reward": -1.2640108835235828,
              "max_reward": -1.0166263828498012,
              "num_responses": 5,
              "rvariance": 0.007651160619302319
            },
            {
              "id": "chat_sample_73",
              "variance": 0.6369396671311238,
              "mean_reward": -1.2699189483262596,
              "min_reward": -1.535530457433831,
              "max_reward": -0.34009011119009935,
              "num_responses": 6,
              "rvariance": 0.17485072453576048
            },
            {
              "id": "chat_sample_6",
              "variance": 0.7156049214612321,
              "mean_reward": 0.988739613030175,
              "min_reward": 0.3379546025468816,
              "max_reward": 1.583927758379465,
              "num_responses": 7,
              "rvariance": 0.12060572635703785
            },
            {
              "id": "chat_sample_80",
              "variance": 0.3095323142576829,
              "mean_reward": -1.6275454241478595,
              "min_reward": -1.7648136531802627,
              "max_reward": -1.4027875546332653,
              "num_responses": 4,
              "rvariance": 0.022669785297543817
            },
            {
              "id": "chat_sample_224",
              "variance": 0.2330165898876978,
              "mean_reward": -0.3863938956694364,
              "min_reward": -0.5610768755114959,
              "max_reward": -0.2684391125193394,
              "num_responses": 7,
              "rvariance": 0.009750158102719399
            },
            {
              "id": "chat_sample_267",
              "variance": 0.35478557657605775,
              "mean_reward": 0.4271681768316774,
              "min_reward": 0.24744807791013218,
              "max_reward": 0.7995378781943036,
              "num_responses": 7,
              "rvariance": 0.031896800782198816
            },
            {
              "id": "chat_sample_308",
              "variance": 0.5641667646653878,
              "mean_reward": -0.23356312359867532,
              "min_reward": -0.687786010002945,
              "max_reward": 0.49784946273847214,
              "num_responses": 7,
              "rvariance": 0.11070704297036534
            },
            {
              "id": "chat_sample_252",
              "variance": 0.5961363089407229,
              "mean_reward": 1.0995023598475302,
              "min_reward": 0.7693690366487204,
              "max_reward": 1.5718602217612319,
              "num_responses": 7,
              "rvariance": 0.06690151592998711
            },
            {
              "id": "chat_sample_159",
              "variance": 0.6106173528826025,
              "mean_reward": -0.9006918346246316,
              "min_reward": -1.3484836398512157,
              "max_reward": -0.5821950645934041,
              "num_responses": 7,
              "rvariance": 0.0723286640254803
            },
            {
              "id": "chat_sample_188",
              "variance": 1.0329811345207667,
              "mean_reward": 2.5717418272719876,
              "min_reward": 1.6080628316159318,
              "max_reward": 2.9596269328580562,
              "num_responses": 7,
              "rvariance": 0.22602851461682014
            },
            {
              "id": "chat_sample_88",
              "variance": 0.2570385299683684,
              "mean_reward": -0.6371454545514305,
              "min_reward": -0.8054444920307192,
              "max_reward": -0.42531708855637174,
              "num_responses": 7,
              "rvariance": 0.013439054878194162
            },
            {
              "id": "chat_sample_27",
              "variance": 0.41331312917448904,
              "mean_reward": -0.8563005392075594,
              "min_reward": -1.0950653708683173,
              "max_reward": -0.4735872350293048,
              "num_responses": 7,
              "rvariance": 0.0375100671058967
            },
            {
              "id": "chat_sample_167",
              "variance": 1.3482455286721102,
              "mean_reward": 0.4553975928493302,
              "min_reward": -0.9653393522223098,
              "max_reward": 1.0227873056316188,
              "num_responses": 7,
              "rvariance": 0.4310346781631467
            },
            {
              "id": "chat_sample_76",
              "variance": 0.27151957391024817,
              "mean_reward": 0.242419937652535,
              "min_reward": 0.003080461390908807,
              "max_reward": 0.3892416331743729,
              "num_responses": 6,
              "rvariance": 0.01581451827240749
            },
            {
              "id": "chat_sample_209",
              "variance": 0.6306796325104155,
              "mean_reward": -0.29074250609053837,
              "min_reward": -0.8537146385036523,
              "max_reward": 0.11772205926412471,
              "num_responses": 7,
              "rvariance": 0.08749437411308923
            },
            {
              "id": "chat_sample_61",
              "variance": 0.23650486219140587,
              "mean_reward": -0.458832785960918,
              "min_reward": -0.6576171684573618,
              "max_reward": -0.2224787679772401,
              "num_responses": 7,
              "rvariance": 0.014569088945436678
            },
            {
              "id": "chat_sample_118",
              "variance": 1.260887876871681,
              "mean_reward": 0.19059866712267395,
              "min_reward": -1.1192004441047838,
              "max_reward": 0.6667949753937377,
              "num_responses": 7,
              "rvariance": 0.3743112920590931
            },
            {
              "id": "chat_sample_150",
              "variance": 0.4925063382316447,
              "mean_reward": 0.4518958523127892,
              "min_reward": -0.13456487816081425,
              "max_reward": 0.7392001951031373,
              "num_responses": 7,
              "rvariance": 0.06810786551248126
            },
            {
              "id": "chat_sample_120",
              "variance": 0.5840687723224893,
              "mean_reward": -0.834751366675,
              "min_reward": -1.420888859560615,
              "max_reward": -0.5037560765748879,
              "num_responses": 7,
              "rvariance": 0.08103201302823303
            },
            {
              "id": "chat_sample_244",
              "variance": 0.5907436285144498,
              "mean_reward": -0.431853670891248,
              "min_reward": -0.9019847849765853,
              "max_reward": -0.11005269440502795,
              "num_responses": 6,
              "rvariance": 0.07054716677015797
            },
            {
              "id": "chat_sample_8",
              "variance": 0.30229179228674297,
              "mean_reward": 0.29205486505253003,
              "min_reward": 0.034757745013771095,
              "max_reward": 0.45561308457465577,
              "num_responses": 7,
              "rvariance": 0.017958644427771158
            },
            {
              "id": "chat_sample_40",
              "variance": 0.588895786969783,
              "mean_reward": 1.0038240338029663,
              "min_reward": 0.6366261338481546,
              "max_reward": 1.3667120992512665,
              "num_responses": 7,
              "rvariance": 0.06399643699872849
            },
            {
              "id": "chat_sample_286",
              "variance": 0.9931582636805969,
              "mean_reward": 1.457649607338667,
              "min_reward": 0.2776169194557153,
              "max_reward": 1.909751247071763,
              "num_responses": 7,
              "rvariance": 0.2772823541192441
            },
            {
              "id": "chat_sample_307",
              "variance": 1.0645075739359013,
              "mean_reward": 0.019457832515653927,
              "min_reward": -0.7903600712579276,
              "max_reward": 1.0710574521045517,
              "num_responses": 7,
              "rvariance": 0.280074893747595
            },
            {
              "id": "chat_sample_206",
              "variance": 0.5104567989512666,
              "mean_reward": 0.9839987950730118,
              "min_reward": 0.6848962803210876,
              "max_reward": 1.390847172487733,
              "num_responses": 7,
              "rvariance": 0.05324541599225484
            },
            {
              "id": "chat_sample_261",
              "variance": 0.19428733955355515,
              "mean_reward": -1.5303586560260167,
              "min_reward": -1.6381045186888135,
              "max_reward": -1.4329563961788485,
              "num_responses": 7,
              "rvariance": 0.007025684494624365
            },
            {
              "id": "chat_sample_79",
              "variance": 0.09050652463674935,
              "mean_reward": 0.8400503225555153,
              "min_reward": 0.7633352683396037,
              "max_reward": 0.8900444028310529,
              "num_responses": 7,
              "rvariance": 0.0016405151611813276
            },
            {
              "id": "chat_sample_69",
              "variance": 0.08371853528899309,
              "mean_reward": -0.5625853175887751,
              "min_reward": -0.6214145586026621,
              "max_reward": -0.5278911498113544,
              "num_responses": 6,
              "rvariance": 0.0013515861153007172
            },
            {
              "id": "chat_sample_203",
              "variance": 0.5758477630013181,
              "mean_reward": -0.12677126076153858,
              "min_reward": -0.6666678209210368,
              "max_reward": 0.2957182243830652,
              "num_responses": 6,
              "rvariance": 0.08243242118936488
            },
            {
              "id": "chat_sample_168",
              "variance": 0.5710961704578887,
              "mean_reward": 0.2053194456089786,
              "min_reward": -0.3521576478083326,
              "max_reward": 0.5099169993567054,
              "num_responses": 7,
              "rvariance": 0.0733244290520539
            },
            {
              "id": "chat_sample_265",
              "variance": 0.3235608255763791,
              "mean_reward": -0.7277597250508426,
              "min_reward": -0.9653393522223098,
              "max_reward": -0.5459924547387043,
              "num_responses": 6,
              "rvariance": 0.019762396141271968
            },
            {
              "id": "chat_sample_301",
              "variance": 0.15748135286794396,
              "mean_reward": -0.9640464018703562,
              "min_reward": -1.0226601511589177,
              "max_reward": -0.832596449421744,
              "num_responses": 7,
              "rvariance": 0.005127724359100057
            },
            {
              "id": "chat_sample_196",
              "variance": 0.27634658855754135,
              "mean_reward": -1.4329563961788483,
              "min_reward": -1.6441382869979302,
              "max_reward": -1.2157407370506499,
              "num_responses": 7,
              "rvariance": 0.01576915479207992
            },
            {
              "id": "chat_sample_225",
              "variance": 0.2510047616592517,
              "mean_reward": -1.383824282804613,
              "min_reward": -1.5113953841973646,
              "max_reward": -1.2278082736688831,
              "num_responses": 7,
              "rvariance": 0.01075993684974094
            },
            {
              "id": "chat_sample_126",
              "variance": 1.4734462210862804,
              "mean_reward": 1.990345152343535,
              "min_reward": 0.21727923636454907,
              "max_reward": 2.7424112737298576,
              "num_responses": 7,
              "rvariance": 0.6211723728341242
            },
            {
              "id": "chat_sample_162",
              "variance": 0.38797130227619914,
              "mean_reward": 0.5202606021723339,
              "min_reward": 0.31381952931041507,
              "max_reward": 0.7633352683396037,
              "num_responses": 7,
              "rvariance": 0.025759728666547656
            },
            {
              "id": "chat_sample_49",
              "variance": 0.7276724580794652,
              "mean_reward": 0.9930494475366868,
              "min_reward": 0.4163935905653977,
              "max_reward": 1.3305094893965668,
              "num_responses": 7,
              "rvariance": 0.09902641370244072
            },
            {
              "id": "chat_sample_177",
              "variance": 0.2445750273048493,
              "mean_reward": -0.3592284700455786,
              "min_reward": -0.5248742656567961,
              "max_reward": -0.20272760452786615,
              "num_responses": 5,
              "rvariance": 0.012083164227430596
            },
            {
              "id": "chat_sample_273",
              "variance": 0.7735290972287516,
              "mean_reward": -1.0041278627809167,
              "min_reward": -1.457091469415315,
              "max_reward": -0.4645365825656298,
              "num_responses": 7,
              "rvariance": 0.1044743654322243
            },
            {
              "id": "chat_sample_285",
              "variance": 0.9062720000293174,
              "mean_reward": 0.7788506725630464,
              "min_reward": -0.3589456371560888,
              "max_reward": 1.227935428141584,
              "num_responses": 7,
              "rvariance": 0.24719769848112189
            },
            {
              "id": "chat_sample_293",
              "variance": 0.2763465885575416,
              "mean_reward": -1.3889960842124274,
              "min_reward": -1.5294966891247144,
              "max_reward": -1.1554030539594835,
              "num_responses": 7,
              "rvariance": 0.014517964786903597
            },
            {
              "id": "chat_sample_233",
              "variance": 0.3381927137259869,
              "mean_reward": -0.6414552890579424,
              "min_reward": -0.8989679008220269,
              "max_reward": -0.4992307503430504,
              "num_responses": 7,
              "rvariance": 0.020231348600623755
            },
            {
              "id": "chat_sample_235",
              "variance": 0.586482279646136,
              "mean_reward": -1.1584199381140419,
              "min_reward": -1.5777668355976473,
              "max_reward": -0.8084613761852776,
              "num_responses": 7,
              "rvariance": 0.061097673456450854
            },
            {
              "id": "chat_sample_158",
              "variance": 0.6338473608727015,
              "mean_reward": -0.7993029778589398,
              "min_reward": -1.1976394321233,
              "max_reward": -0.3732758368902408,
              "num_responses": 7,
              "rvariance": 0.07825359015172202
            },
            {
              "id": "chat_sample_216",
              "variance": 0.5125686178594575,
              "mean_reward": -0.16917823654123773,
              "min_reward": -0.5309080339659127,
              "max_reward": 0.21426235220999074,
              "num_responses": 7,
              "rvariance": 0.050438694310477615
            },
            {
              "id": "chat_sample_242",
              "variance": 0.42477728896181044,
              "mean_reward": 0.8253968852333747,
              "min_reward": 0.5219845359749387,
              "max_reward": 1.1313951351957179,
              "num_responses": 7,
              "rvariance": 0.033792531956906305
            },
            {
              "id": "chat_sample_92",
              "variance": 0.7095711531521154,
              "mean_reward": 2.102831832963495,
              "min_reward": 1.5959952949976983,
              "max_reward": 2.428655321655793,
              "num_responses": 7,
              "rvariance": 0.08808258758531196
            },
            {
              "id": "chat_sample_250",
              "variance": 1.003113981390639,
              "mean_reward": -1.6607311498480009,
              "min_reward": -2.2052787397457765,
              "max_reward": -0.7963938395670442,
              "num_responses": 6,
              "rvariance": 0.21476035922194903
            },
            {
              "id": "chat_sample_283",
              "variance": 0.47938289215931607,
              "mean_reward": -0.5896295291171371,
              "min_reward": -0.9200860899039351,
              "max_reward": -0.31897192210819114,
              "num_responses": 7,
              "rvariance": 0.03917493830767018
            },
            {
              "id": "chat_sample_140",
              "variance": 0.862376335580494,
              "mean_reward": -0.3451137620367523,
              "min_reward": -1.0769640659409674,
              "max_reward": 0.1840935106644076,
              "num_responses": 7,
              "rvariance": 0.14864513304308227
            },
            {
              "id": "chat_sample_232",
              "variance": 0.6202713821771892,
              "mean_reward": -0.9349550189514011,
              "min_reward": -1.4329563961788485,
              "max_reward": -0.5022476344976088,
              "num_responses": 7,
              "rvariance": 0.0751000981810969
            },
            {
              "id": "chat_sample_0",
              "variance": 0.33789102531053106,
              "mean_reward": 1.0477843457693876,
              "min_reward": 0.8719430979037031,
              "max_reward": 1.2641380379962837,
              "num_responses": 7,
              "rvariance": 0.020724877674815196
            },
            {
              "id": "chat_sample_34",
              "variance": 0.48028795740568364,
              "mean_reward": 0.19820821867323404,
              "min_reward": -0.036893253656988846,
              "max_reward": 0.6909300486302042,
              "num_responses": 7,
              "rvariance": 0.05424786790127889
            },
            {
              "id": "chat_sample_68",
              "variance": 0.4563791504808089,
              "mean_reward": 0.14414673208217565,
              "min_reward": -0.18000669573884884,
              "max_reward": 0.3681234440924647,
              "num_responses": 7,
              "rvariance": 0.03553545596822045
            },
            {
              "id": "chat_sample_149",
              "variance": 0.46309171772470115,
              "mean_reward": -0.6849846175737122,
              "min_reward": -1.1614368222686002,
              "max_reward": -0.44040150932916333,
              "num_responses": 7,
              "rvariance": 0.04893562737956126
            },
            {
              "id": "chat_sample_309",
              "variance": 0.7898202716633664,
              "mean_reward": 0.7025666017977864,
              "min_reward": 0.17202597404617437,
              "max_reward": 1.065023683795435,
              "num_responses": 7,
              "rvariance": 0.10586040756681836
            },
            {
              "id": "chat_sample_243",
              "variance": 0.3642887616629164,
              "mean_reward": -0.2740418973778048,
              "min_reward": -0.5203489394249586,
              "max_reward": -0.06781631624121155,
              "num_responses": 7,
              "rvariance": 0.021998773767166555
            },
            {
              "id": "chat_sample_281",
              "variance": 0.905065246367494,
              "mean_reward": -0.9971243817078348,
              "min_reward": -1.3484836398512157,
              "max_reward": -0.3778011631220783,
              "num_responses": 7,
              "rvariance": 0.15203270399206584
            },
            {
              "id": "chat_sample_99",
              "variance": 0.3137559520740645,
              "mean_reward": 3.5733473665853475,
              "min_reward": 3.394058251114453,
              "max_reward": 3.8526246426073163,
              "num_responses": 7,
              "rvariance": 0.022111291302878738
            },
            {
              "id": "chat_sample_43",
              "variance": 0.152050961389739,
              "mean_reward": 0.005558616232153133,
              "min_reward": -0.09572249467087596,
              "max_reward": 0.10112919641405399,
              "num_responses": 7,
              "rvariance": 0.0043571772483929055
            },
            {
              "id": "chat_sample_148",
              "variance": 0.49290230427693055,
              "mean_reward": -0.03128373468210699,
              "min_reward": -0.21470086351626944,
              "max_reward": 0.4887988102747972,
              "num_responses": 4,
              "rvariance": 0.09020015890597943
            },
            {
              "id": "chat_sample_249",
              "variance": 0.3433214167887362,
              "mean_reward": -0.7151534591192954,
              "min_reward": -0.9623224680677516,
              "max_reward": -0.4931969820339338,
              "num_responses": 7,
              "rvariance": 0.02297269178521328
            },
            {
              "id": "chat_sample_100",
              "variance": 0.9933091078883247,
              "mean_reward": 0.18183084754848886,
              "min_reward": -0.8989679008220269,
              "max_reward": 0.6245585972299214,
              "num_responses": 6,
              "rvariance": 0.2667446593678901
            },
            {
              "id": "chat_sample_141",
              "variance": 0.6018683888343835,
              "mean_reward": -0.7953163809404161,
              "min_reward": -1.1976394321233,
              "max_reward": -0.5369418022750293,
              "num_responses": 7,
              "rvariance": 0.058404067182688306
            },
            {
              "id": "chat_sample_97",
              "variance": 0.34633830094329443,
              "mean_reward": 1.1382908704061372,
              "min_reward": 0.9443483176131026,
              "max_reward": 1.3305094893965668,
              "num_responses": 7,
              "rvariance": 0.024885604532883798
            },
            {
              "id": "chat_sample_137",
              "variance": 0.4763660080047578,
              "mean_reward": -0.6457651235644543,
              "min_reward": -0.9804237729951014,
              "max_reward": -0.2986079540649225,
              "num_responses": 7,
              "rvariance": 0.044841212105793136
            },
            {
              "id": "chat_sample_207",
              "variance": 0.48858438883071886,
              "mean_reward": -0.1326793255642153,
              "min_reward": -0.3830807103925553,
              "max_reward": 0.12677271172779966,
              "num_responses": 7,
              "rvariance": 0.04077658596460817
            },
            {
              "id": "chat_sample_190",
              "variance": 0.4663725792427833,
              "mean_reward": -0.15538676612039976,
              "min_reward": -0.6727015892301534,
              "max_reward": 0.17504285820073268,
              "num_responses": 7,
              "rvariance": 0.06036082922007362
            },
            {
              "id": "chat_sample_254",
              "variance": 0.1755826577952938,
              "mean_reward": -0.8252697307606739,
              "min_reward": -0.9019847849765853,
              "max_reward": -0.648566515993687,
              "num_responses": 7,
              "rvariance": 0.006974046902367992
            },
            {
              "id": "chat_sample_171",
              "variance": 0.5086466684585316,
              "mean_reward": -1.1131666757956673,
              "min_reward": -1.4027875546332653,
              "max_reward": -0.8778497117401187,
              "num_responses": 7,
              "rvariance": 0.04785616023064761
            },
            {
              "id": "chat_sample_131",
              "variance": 0.25070307324379587,
              "mean_reward": 0.27266060977322665,
              "min_reward": 0.12073894341868303,
              "max_reward": 0.44656243211098084,
              "num_responses": 7,
              "rvariance": 0.01122662552076314
            },
            {
              "id": "chat_sample_272",
              "variance": 0.29150643143419713,
              "mean_reward": -0.38308071039255537,
              "min_reward": -0.6002963695207539,
              "max_reward": -0.24656670239879164,
              "num_responses": 7,
              "rvariance": 0.015349140792745422
            },
            {
              "id": "chat_sample_317",
              "variance": 0.7089677763212036,
              "mean_reward": 0.06514207828467981,
              "min_reward": -0.938187394831285,
              "max_reward": 0.3409714867014399,
              "num_responses": 7,
              "rvariance": 0.18204963172703517
            },
            {
              "id": "chat_sample_221",
              "variance": 0.21781903595911023,
              "mean_reward": -1.0261080187641272,
              "min_reward": -1.1433355173412503,
              "max_reward": -0.8386302177308607,
              "num_responses": 7,
              "rvariance": 0.009201521745312568
            },
            {
              "id": "chat_sample_263",
              "variance": 0.9767916671421178,
              "mean_reward": 0.0795261509501632,
              "min_reward": -0.9593055839131932,
              "max_reward": 0.5521533775205218,
              "num_responses": 7,
              "rvariance": 0.22803589699285984
            },
            {
              "id": "chat_sample_112",
              "variance": 0.7433602556831687,
              "mean_reward": 1.61840643443156,
              "min_reward": 1.0288210739407353,
              "max_reward": 2.0545616864905623,
              "num_responses": 7,
              "rvariance": 0.11618532556380956
            },
            {
              "id": "chat_sample_138",
              "variance": 0.4718406817729204,
              "mean_reward": -1.374342646890287,
              "min_reward": -2.024265690472278,
              "max_reward": -1.1071329074865506,
              "num_responses": 7,
              "rvariance": 0.07700168037794855
            },
            {
              "id": "chat_sample_1",
              "variance": 0.41934689748360543,
              "mean_reward": -1.5868174880613226,
              "min_reward": -1.9639280073811114,
              "max_reward": -1.3243485666147492,
              "num_responses": 6,
              "rvariance": 0.03988620125220765
            },
            {
              "id": "chat_sample_42",
              "variance": 0.18946032490626208,
              "mean_reward": -1.112304708894365,
              "min_reward": -1.245909578596233,
              "max_reward": -0.9623224680677516,
              "num_responses": 7,
              "rvariance": 0.007691400791915359
            },
            {
              "id": "chat_sample_101",
              "variance": 0.4501191158601001,
              "mean_reward": -1.3933059187189392,
              "min_reward": -1.7044759700890963,
              "max_reward": -1.1674705905777167,
              "num_responses": 7,
              "rvariance": 0.03521906687967267
            },
            {
              "id": "chat_sample_21",
              "variance": 0.26488242877021995,
              "mean_reward": 0.12138541859465982,
              "min_reward": -0.03613903261834927,
              "max_reward": 0.2957182243830652,
              "num_responses": 7,
              "rvariance": 0.01255490042085459
            },
            {
              "id": "chat_sample_66",
              "variance": 0.7071387903025027,
              "mean_reward": 0.528456021851123,
              "min_reward": -0.2201218272314914,
              "max_reward": 0.8779768662128197,
              "num_responses": 7,
              "rvariance": 0.12082894196301039
            },
            {
              "id": "chat_sample_151",
              "variance": 0.3668531131942909,
              "mean_reward": 0.43169350306351484,
              "min_reward": 0.01062267177730459,
              "max_reward": 0.6245585972299214,
              "num_responses": 7,
              "rvariance": 0.035987965488109064
            },
            {
              "id": "chat_sample_33",
              "variance": 0.41633001332904734,
              "mean_reward": 0.68575824722239,
              "min_reward": 0.42544424302907263,
              "max_reward": 1.0589899154863185,
              "num_responses": 7,
              "rvariance": 0.03719095421562163
            },
            {
              "id": "chat_sample_219",
              "variance": 0.25568093209881715,
              "mean_reward": -0.7552887929611872,
              "min_reward": -0.8567315226582105,
              "max_reward": -0.5173320552704003,
              "num_responses": 4,
              "rvariance": 0.019513097902622754
            },
            {
              "id": "chat_sample_5",
              "variance": 0.5599336990860233,
              "mean_reward": 1.764940807652964,
              "min_reward": 1.4753199288153658,
              "max_reward": 2.187304589291128,
              "num_responses": 7,
              "rvariance": 0.057126779761281714
            },
            {
              "id": "chat_sample_86",
              "variance": 0.4422752170582488,
              "mean_reward": 0.4260907182050495,
              "min_reward": 0.13733180626875374,
              "max_reward": 0.7271326584849039,
              "num_responses": 7,
              "rvariance": 0.038009447202232295
            },
            {
              "id": "chat_sample_108",
              "variance": 0.9739256271952874,
              "mean_reward": -0.023802131343459043,
              "min_reward": -1.1735043588868335,
              "max_reward": 0.43147801133818925,
              "num_responses": 7,
              "rvariance": 0.25806106723918304
            },
            {
              "id": "chat_sample_28",
              "variance": 0.31377480760003074,
              "mean_reward": -0.2690317147639848,
              "min_reward": -0.5490093388932626,
              "max_reward": 0.034757745013771095,
              "num_responses": 7,
              "rvariance": 0.02665810689777154
            },
            {
              "id": "chat_sample_255",
              "variance": 0.3234099813686512,
              "mean_reward": -0.7713967994292753,
              "min_reward": -1.034727687777151,
              "max_reward": -0.6153807902935455,
              "num_responses": 7,
              "rvariance": 0.01999675047465319
            },
            {
              "id": "chat_sample_29",
              "variance": 0.36564635953246755,
              "mean_reward": 0.5655138644907086,
              "min_reward": 0.3862247490198146,
              "max_reward": 0.7935041098851868,
              "num_responses": 7,
              "rvariance": 0.022597576254415528
            },
            {
              "id": "chat_sample_60",
              "variance": 0.4006422157253442,
              "mean_reward": 1.6511611766810503,
              "min_reward": 1.3667120992512665,
              "max_reward": 1.8252784907441302,
              "num_responses": 7,
              "rvariance": 0.029618431333936823
            },
            {
              "id": "chat_sample_125",
              "variance": 0.7791857550185484,
              "mean_reward": -0.7737402719421913,
              "min_reward": -1.1735043588868335,
              "max_reward": -0.21319242143899028,
              "num_responses": 7,
              "rvariance": 0.1141132612408373
            },
            {
              "id": "chat_sample_314",
              "variance": 0.510155110535811,
              "mean_reward": -0.2805790408890493,
              "min_reward": -0.5927541591343581,
              "max_reward": 0.09207854395037905,
              "num_responses": 7,
              "rvariance": 0.051659603669593566
            },
            {
              "id": "chat_sample_310",
              "variance": 0.5635539600714932,
              "mean_reward": 1.2770675415158195,
              "min_reward": 0.7935041098851868,
              "max_reward": 1.668400514707098,
              "num_responses": 7,
              "rvariance": 0.06955100735425006
            },
            {
              "id": "chat_sample_222",
              "variance": 1.5494717017811497,
              "mean_reward": 0.9098696415610076,
              "min_reward": -0.8476808701945356,
              "max_reward": 1.5959952949976983,
              "num_responses": 7,
              "rvariance": 0.616710364772315
            },
            {
              "id": "chat_sample_143",
              "variance": 0.9201496671402857,
              "mean_reward": 1.2501310758501205,
              "min_reward": -0.0768669687048865,
              "max_reward": 1.6804680513253312,
              "num_responses": 7,
              "rvariance": 0.31469313959542483
            },
            {
              "id": "chat_sample_12",
              "variance": 0.4130114407590331,
              "mean_reward": 0.27998732843429686,
              "min_reward": -0.03010526430923264,
              "max_reward": 0.5702546824478717,
              "num_responses": 7,
              "rvariance": 0.036772931189100036
            },
            {
              "id": "chat_sample_248",
              "variance": 0.24979800799742824,
              "mean_reward": -0.8482842470254471,
              "min_reward": -1.034727687777151,
              "max_reward": -0.7028704307757365,
              "num_responses": 5,
              "rvariance": 0.01290022960527019
            },
            {
              "id": "chat_sample_64",
              "variance": 0.5613667190594384,
              "mean_reward": -0.024576344290209873,
              "min_reward": -0.2580685732380452,
              "max_reward": 0.5762884507569883,
              "num_responses": 7,
              "rvariance": 0.07935120223665189
            },
            {
              "id": "chat_sample_4",
              "variance": 0.15024083089700396,
              "mean_reward": 0.3659685268392088,
              "min_reward": 0.2021948155917575,
              "max_reward": 0.4646637370383307,
              "num_responses": 7,
              "rvariance": 0.005819073705784489
            },
            {
              "id": "chat_sample_311",
              "variance": 0.6435013901672884,
              "mean_reward": 0.3543319736716267,
              "min_reward": 0.03777462916832941,
              "max_reward": 0.8840106345219363,
              "num_responses": 7,
              "rvariance": 0.07784617790742218
            },
            {
              "id": "chat_sample_117",
              "variance": 0.43307372038684594,
              "mean_reward": -0.5979798334735038,
              "min_reward": -1.1071329074865506,
              "max_reward": -0.27786687550233413,
              "num_responses": 7,
              "rvariance": 0.05523285381265238
            },
            {
              "id": "chat_sample_39",
              "variance": 0.3720572383609041,
              "mean_reward": -0.3421372825806925,
              "min_reward": -0.5746528542070083,
              "max_reward": -0.08290073701400312,
              "num_responses": 7,
              "rvariance": 0.026466524015142417
            },
            {
              "id": "chat_sample_287",
              "variance": 0.7975003630833885,
              "mean_reward": 0.5689014056363543,
              "min_reward": -0.2282886269155106,
              "max_reward": 1.0710574521045517,
              "num_responses": 6,
              "rvariance": 0.16051614681544296
            },
            {
              "id": "chat_sample_313",
              "variance": 0.8258720373103384,
              "mean_reward": -0.20120569421775417,
              "min_reward": -1.0829978342500841,
              "max_reward": 0.16599220573705772,
              "num_responses": 7,
              "rvariance": 0.16180488614316865
            },
            {
              "id": "chat_sample_3",
              "variance": 0.6395794407663624,
              "mean_reward": 2.2286790005536417,
              "min_reward": 1.8494135639805966,
              "max_reward": 2.5976008343110584,
              "num_responses": 7,
              "rvariance": 0.07031034000584759
            },
            {
              "id": "chat_sample_170",
              "variance": 0.30696796272630833,
              "mean_reward": -0.8353619265634226,
              "min_reward": -1.0226601511589177,
              "max_reward": -0.4871632137248172,
              "num_responses": 6,
              "rvariance": 0.02767673429192173
            },
            {
              "id": "chat_sample_83",
              "variance": 0.11645172836595086,
              "mean_reward": -1.0041278627809167,
              "min_reward": -1.0829978342500841,
              "max_reward": -0.9321536265221684,
              "num_responses": 7,
              "rvariance": 0.002721189663870748
            },
            {
              "id": "chat_sample_279",
              "variance": 0.2672959360938667,
              "mean_reward": 0.16857810644096485,
              "min_reward": 0.061909702404795916,
              "max_reward": 0.5943897556843382,
              "num_responses": 7,
              "rvariance": 0.03116560876091368
            },
            {
              "id": "chat_sample_55",
              "variance": 0.30319685753311054,
              "mean_reward": -0.6375046074269731,
              "min_reward": -0.8506977543490939,
              "max_reward": -0.4705703508747464,
              "num_responses": 6,
              "rvariance": 0.020617123930142697
            },
            {
              "id": "chat_sample_103",
              "variance": 1.0281541198734736,
              "mean_reward": 1.831312259053247,
              "min_reward": 0.8417742563581199,
              "max_reward": 2.525195614601659,
              "num_responses": 7,
              "rvariance": 0.25828752153175266
            },
            {
              "id": "chat_sample_113",
              "variance": 0.7495448682000128,
              "mean_reward": 0.6598453672519872,
              "min_reward": -0.26278245472954254,
              "max_reward": 1.0770912204136682,
              "num_responses": 7,
              "rvariance": 0.1682804294416055
            },
            {
              "id": "chat_sample_104",
              "variance": 0.8753489374450946,
              "mean_reward": -0.4065962449187106,
              "min_reward": -1.5838006039067638,
              "max_reward": -0.01652928561372023,
              "num_responses": 7,
              "rvariance": 0.255215031100082
            },
            {
              "id": "chat_sample_282",
              "variance": 0.6214781358390129,
              "mean_reward": 1.4977310682492273,
              "min_reward": 1.0951925253410182,
              "max_reward": 2.042494149872329,
              "num_responses": 7,
              "rvariance": 0.08003901098433867
            },
            {
              "id": "chat_sample_62",
              "variance": 0.33743849268734744,
              "mean_reward": -0.23234898345290775,
              "min_reward": -0.5158236131931211,
              "max_reward": 0.05285904994112098,
              "num_responses": 7,
              "rvariance": 0.02630306657527785
            },
            {
              "id": "chat_sample_91",
              "variance": 0.22505955793005022,
              "mean_reward": 0.5004353634423794,
              "min_reward": 0.2715831511465987,
              "max_reward": 0.6667949753937377,
              "num_responses": 7,
              "rvariance": 0.012777146388965255
            },
            {
              "id": "chat_sample_284",
              "variance": 0.7077610226593802,
              "mean_reward": 0.5769349259329651,
              "min_reward": 0.028723976704654472,
              "max_reward": 0.9564158542313358,
              "num_responses": 7,
              "rvariance": 0.1002981287218053
            },
            {
              "id": "chat_sample_84",
              "variance": 0.16653200533161905,
              "mean_reward": -1.1786761602946478,
              "min_reward": -1.2579771152144663,
              "max_reward": -1.0407614560862677,
              "num_responses": 7,
              "rvariance": 0.0050597410541869765
            },
            {
              "id": "chat_sample_175",
              "variance": 0.4054692303726374,
              "mean_reward": 0.8034167292501643,
              "min_reward": 0.23538054129189895,
              "max_reward": 1.0046860007042688,
              "num_responses": 7,
              "rvariance": 0.057820358068782926
            },
            {
              "id": "chat_sample_185",
              "variance": 1.0087706391804363,
              "mean_reward": -0.3680434284346788,
              "min_reward": -1.1735043588868335,
              "max_reward": 0.19616104728264086,
              "num_responses": 7,
              "rvariance": 0.20304670409993844
            },
            {
              "id": "chat_sample_154",
              "variance": 0.7684003941660024,
              "mean_reward": 0.7625810473009642,
              "min_reward": -0.18321213515306706,
              "max_reward": 1.0951925253410182,
              "num_responses": 7,
              "rvariance": 0.17213788412312073
            },
            {
              "id": "chat_sample_189",
              "variance": 1.048367243709014,
              "mean_reward": 0.23214816541201497,
              "min_reward": -1.1252342124139005,
              "max_reward": 0.7331664267940206,
              "num_responses": 7,
              "rvariance": 0.3447945124396732
            },
            {
              "id": "chat_sample_218",
              "variance": 0.5573693475546483,
              "mean_reward": 0.3542960583840724,
              "min_reward": 0.11319673303228725,
              "max_reward": 0.775402804957837,
              "num_responses": 6,
              "rvariance": 0.062481214459665445
            },
            {
              "id": "chat_sample_257",
              "variance": 0.7421535020213453,
              "mean_reward": 1.3279235886926595,
              "min_reward": 0.7874703415760702,
              "max_reward": 1.728738197798264,
              "num_responses": 7,
              "rvariance": 0.10016801313412335
            },
            {
              "id": "chat_sample_13",
              "variance": 0.7244764464282301,
              "mean_reward": -0.2756183540308899,
              "min_reward": -0.6636509367664785,
              "max_reward": 0.3590727916287898,
              "num_responses": 5,
              "rvariance": 0.12248030366509374
            },
            {
              "id": "chat_sample_237",
              "variance": 0.4298305699206958,
              "mean_reward": -0.5471507227623293,
              "min_reward": -0.8869003642037937,
              "max_reward": -0.2591999047960046,
              "num_responses": 7,
              "rvariance": 0.03918385269979112
            },
            {
              "id": "chat_sample_89",
              "variance": 0.8302465193344479,
              "mean_reward": 0.5609885382588712,
              "min_reward": 0.025707092550096157,
              "max_reward": 1.1374289035048346,
              "num_responses": 7,
              "rvariance": 0.13144674165649067
            },
            {
              "id": "chat_sample_23",
              "variance": 0.304101922779478,
              "mean_reward": 0.14983032633763818,
              "min_reward": -0.05122345339114084,
              "max_reward": 0.31080264515585676,
              "num_responses": 7,
              "rvariance": 0.015612291674596058
            },
            {
              "id": "chat_sample_236",
              "variance": 0.5606879201246626,
              "mean_reward": -0.15164259739286753,
              "min_reward": -0.784326302948811,
              "max_reward": 0.22029612051910738,
              "num_responses": 7,
              "rvariance": 0.08459609815599031
            },
            {
              "id": "chat_sample_234",
              "variance": 0.2123886444809049,
              "mean_reward": -1.558803563768995,
              "min_reward": -1.6441382869979302,
              "max_reward": -1.3665849447785656,
              "num_responses": 7,
              "rvariance": 0.009189262460820025
            },
            {
              "id": "chat_sample_194",
              "variance": 0.7687020825814581,
              "mean_reward": 0.9275399630377061,
              "min_reward": 0.32588706592864836,
              "max_reward": 1.3063744161601,
              "num_responses": 7,
              "rvariance": 0.10746600234186947
            },
            {
              "id": "chat_sample_70",
              "variance": 0.4977858855021217,
              "mean_reward": 0.46768062119288906,
              "min_reward": 0.23839742544645726,
              "max_reward": 0.8538417929763531,
              "num_responses": 7,
              "rvariance": 0.047700132973470026
            },
            {
              "id": "chat_sample_74",
              "variance": 0.1641184980079723,
              "mean_reward": -0.6565397098307338,
              "min_reward": -0.7782925346396944,
              "max_reward": -0.5444840126614251,
              "num_responses": 7,
              "rvariance": 0.005144162945124126
            },
            {
              "id": "chat_sample_200",
              "variance": 0.6528537310464193,
              "mean_reward": 1.5339336781039274,
              "min_reward": 1.179665281668651,
              "max_reward": 1.8976837104535298,
              "num_responses": 7,
              "rvariance": 0.07115585914236226
            },
            {
              "id": "chat_sample_260",
              "variance": 0.16894551265526536,
              "mean_reward": -1.009730647639382,
              "min_reward": -1.1976394321233,
              "max_reward": -0.9200860899039351,
              "num_responses": 7,
              "rvariance": 0.007275328106108494
            },
            {
              "id": "chat_sample_315",
              "variance": 0.5713978588733445,
              "mean_reward": 0.3933359759555592,
              "min_reward": -0.06178254793209493,
              "max_reward": 0.6969638169393209,
              "num_responses": 7,
              "rvariance": 0.058554893531293284
            },
            {
              "id": "chat_sample_240",
              "variance": 0.6244195978897069,
              "mean_reward": 0.31837179200791826,
              "min_reward": -0.2546745785641671,
              "max_reward": 0.7090313535575541,
              "num_responses": 7,
              "rvariance": 0.08391373866103778
            },
            {
              "id": "chat_sample_20",
              "variance": 1.2607558881899192,
              "mean_reward": 0.7567627707171731,
              "min_reward": -0.10024782090271343,
              "max_reward": 1.4994550020518322,
              "num_responses": 7,
              "rvariance": 0.2839941034138241
            },
            {
              "id": "chat_sample_210",
              "variance": 0.32642686552320954,
              "mean_reward": 0.28602109674341347,
              "min_reward": 0.01967332424097953,
              "max_reward": 0.5461196092114052,
              "num_responses": 7,
              "rvariance": 0.022487335567350192
            },
            {
              "id": "chat_sample_93",
              "variance": 0.31556608256679963,
              "mean_reward": 0.26167053178162136,
              "min_reward": 0.0935869860276582,
              "max_reward": 0.5340520725931719,
              "num_responses": 7,
              "rvariance": 0.022225339798006175
            },
            {
              "id": "chat_sample_226",
              "variance": 0.6323389187954225,
              "mean_reward": 1.4761818957166681,
              "min_reward": 0.8538417929763531,
              "max_reward": 1.728738197798264,
              "num_responses": 7,
              "rvariance": 0.0872549001353319
            },
            {
              "id": "chat_sample_30",
              "variance": 0.1761860346262054,
              "mean_reward": 1.0383027098550615,
              "min_reward": 0.9021119394492861,
              "max_reward": 1.1253613668866014,
              "num_responses": 7,
              "rvariance": 0.005885942530289167
            },
            {
              "id": "chat_sample_142",
              "variance": 0.5792417576751961,
              "mean_reward": 0.41510064021344417,
              "min_reward": 0.06341814448207507,
              "max_reward": 0.8779768662128197,
              "num_responses": 7,
              "rvariance": 0.06359373807782255
            },
            {
              "id": "chat_sample_136",
              "variance": 0.5563134381005529,
              "mean_reward": -1.1463524014958089,
              "min_reward": -1.535530457433831,
              "max_reward": -0.9050016691311435,
              "num_responses": 7,
              "rvariance": 0.06049436806203094
            },
            {
              "id": "chat_sample_16",
              "variance": 0.48632172571480015,
              "mean_reward": 0.9809819109184535,
              "min_reward": 0.42846112718363094,
              "max_reward": 1.390847172487733,
              "num_responses": 7,
              "rvariance": 0.07076467651900988
            },
            {
              "id": "chat_sample_22",
              "variance": 0.9218089534252928,
              "mean_reward": -0.49405894893523616,
              "min_reward": -0.9080185532857019,
              "max_reward": 0.12828115380507882,
              "num_responses": 7,
              "rvariance": 0.14539666971023224
            },
            {
              "id": "chat_sample_217",
              "variance": 0.2682010013402341,
              "mean_reward": 0.23419533680260818,
              "min_reward": -0.07762118974352608,
              "max_reward": 0.4797481578111223,
              "num_responses": 7,
              "rvariance": 0.02319602901539051
            }
          ]
        },
        "semantic_benchmark_chat_hard_filtered.json": {
          "file_name": "semantic_benchmark_chat_hard_filtered.json",
          "processed_samples": 200,
          "global_mean": -4.1197998529366355,
          "global_std": 3.3051985325775166,
          "mean_variance": 0.6803411304766389,
          "mean_rvariance": 0.14388695859650447,
          "sample_results": [
            {
              "id": "chat_hard_sample_121",
              "variance": 0.35691880181249985,
              "mean_reward": 0.5121376228747322,
              "min_reward": 0.3482543761263878,
              "max_reward": 0.7926301028863214,
              "num_responses": 6,
              "rvariance": 0.030257146885339176
            },
            {
              "id": "chat_hard_sample_77",
              "variance": 1.744411097600165,
              "mean_reward": 0.6545224492048527,
              "min_reward": -0.360855826150102,
              "max_reward": 1.7593836786566024,
              "num_responses": 7,
              "rvariance": 0.5285663565236628
            },
            {
              "id": "chat_hard_sample_265",
              "variance": 1.685318580743791,
              "mean_reward": 1.3977374754955927,
              "min_reward": -0.5594066827875191,
              "max_reward": 1.998117446756354,
              "num_responses": 7,
              "rvariance": 0.7867583623864023
            },
            {
              "id": "chat_hard_sample_334",
              "variance": 0.8367500386862576,
              "mean_reward": 2.7639564652149633,
              "min_reward": 1.9177516238316852,
              "max_reward": 3.2886980148995653,
              "num_responses": 6,
              "rvariance": 0.17907711628477677
            },
            {
              "id": "chat_hard_sample_61",
              "variance": 0.6136166950365891,
              "mean_reward": 0.5626757944338026,
              "min_reward": 0.16388572353450048,
              "max_reward": 0.8469952183941857,
              "num_responses": 7,
              "rvariance": 0.06206243460756155
            },
            {
              "id": "chat_hard_sample_133",
              "variance": 0.9348436166678391,
              "mean_reward": 0.14537006825283663,
              "min_reward": -0.4364942477262609,
              "max_reward": 0.6957183752418679,
              "num_responses": 6,
              "rvariance": 0.1652442800156079
            },
            {
              "id": "chat_hard_sample_62",
              "variance": 1.9381754603722157,
              "mean_reward": 0.5965906782153002,
              "min_reward": -1.2117880688818896,
              "max_reward": 1.360509189876077,
              "num_responses": 4,
              "rvariance": 1.126097866266764
            },
            {
              "id": "chat_hard_sample_84",
              "variance": 1.0116638885811255,
              "mean_reward": 1.179489113239384,
              "min_reward": 0.7382649873784571,
              "max_reward": 1.927206426528705,
              "num_responses": 6,
              "rvariance": 0.18940142095958346
            },
            {
              "id": "chat_hard_sample_343",
              "variance": 0.37062826572317853,
              "mean_reward": -1.5899801767626842,
              "min_reward": -1.816895441491161,
              "max_reward": -1.400884122822287,
              "num_responses": 4,
              "rvariance": 0.03075129314961347
            },
            {
              "id": "chat_hard_sample_87",
              "variance": 0.29971724549552964,
              "mean_reward": 0.23196030295304348,
              "min_reward": 0.01733628173069258,
              "max_reward": 0.42862019905105664,
              "num_responses": 5,
              "rvariance": 0.01879583400476085
            },
            {
              "id": "chat_hard_sample_110",
              "variance": 0.769148199402566,
              "mean_reward": 0.5464675612389114,
              "min_reward": -0.8619603690921548,
              "max_reward": 0.88717812985652,
              "num_responses": 7,
              "rvariance": 0.3340698091935292
            },
            {
              "id": "chat_hard_sample_150",
              "variance": 0.8698418481258274,
              "mean_reward": 0.001128048535801392,
              "min_reward": -0.4743134585143403,
              "max_reward": 0.5515326341123149,
              "num_responses": 7,
              "rvariance": 0.12803582582935447
            },
            {
              "id": "chat_hard_sample_65",
              "variance": 1.3189449762342709,
              "mean_reward": 0.2800447280978874,
              "min_reward": -0.6634095124547376,
              "max_reward": 0.9391795446901293,
              "num_responses": 7,
              "rvariance": 0.3494821708712451
            },
            {
              "id": "chat_hard_sample_46",
              "variance": 1.3019263313796352,
              "mean_reward": 2.3945438169814013,
              "min_reward": 0.41916539635403677,
              "max_reward": 2.98614432859493,
              "num_responses": 7,
              "rvariance": 0.6796344101711371
            },
            {
              "id": "chat_hard_sample_114",
              "variance": 0.941934718690604,
              "mean_reward": 0.6147616271486352,
              "min_reward": 0.14497611814046074,
              "max_reward": 1.0904563878424471,
              "num_responses": 4,
              "rvariance": 0.22071588410181173
            },
            {
              "id": "chat_hard_sample_371",
              "variance": 0.5190686680663905,
              "mean_reward": -0.5286785740222045,
              "min_reward": -1.0321468176385122,
              "max_reward": -0.29467220727096294,
              "num_responses": 4,
              "rvariance": 0.08614720004976203
            },
            {
              "id": "chat_hard_sample_223",
              "variance": 1.0003181253447018,
              "mean_reward": 1.4571993205823193,
              "min_reward": 0.9959083608722484,
              "max_reward": 2.3857643573341685,
              "num_responses": 5,
              "rvariance": 0.24743971690617772
            },
            {
              "id": "chat_hard_sample_52",
              "variance": 0.8868604929804632,
              "mean_reward": -0.5067299249041227,
              "min_reward": -0.9659631987593732,
              "max_reward": 0.01733628173069258,
              "num_responses": 7,
              "rvariance": 0.1269603697714702
            },
            {
              "id": "chat_hard_sample_372",
              "variance": 0.38150128882475154,
              "mean_reward": 0.27143410421310143,
              "min_reward": 0.0929747033068515,
              "max_reward": 0.5609874368093347,
              "num_responses": 4,
              "rvariance": 0.034498827648178756
            },
            {
              "id": "chat_hard_sample_346",
              "variance": 1.1061602095990748,
              "mean_reward": 1.7722917003074166,
              "min_reward": 1.1696403604299885,
              "max_reward": 2.3715821532886388,
              "num_responses": 5,
              "rvariance": 0.23993309318196882
            },
            {
              "id": "chat_hard_sample_108",
              "variance": 0.693982517961258,
              "mean_reward": -0.5537338011693071,
              "min_reward": -0.8146863556070554,
              "max_reward": 0.12133911139791108,
              "num_responses": 5,
              "rvariance": 0.12931991488940947
            },
            {
              "id": "chat_hard_sample_64",
              "variance": 1.4944497512977022,
              "mean_reward": 0.7078323411974244,
              "min_reward": -0.12448575872460538,
              "max_reward": 1.5513780193221656,
              "num_responses": 6,
              "rvariance": 0.47658844552574503
            },
            {
              "id": "chat_hard_sample_233",
              "variance": 1.4423301514303808,
              "mean_reward": -0.4420658278870047,
              "min_reward": -1.19287846348785,
              "max_reward": 1.1507307550359487,
              "num_responses": 7,
              "rvariance": 0.5244268426927191
            },
            {
              "id": "chat_hard_sample_47",
              "variance": 0.8206768741013244,
              "mean_reward": -0.5263148733479496,
              "min_reward": -0.843050763698115,
              "max_reward": 0.30098036264128847,
              "num_responses": 4,
              "rvariance": 0.22931614753501742
            },
            {
              "id": "chat_hard_sample_26",
              "variance": 0.971953717253642,
              "mean_reward": -0.5600820258373063,
              "min_reward": -0.9092343825772541,
              "max_reward": 0.08824730195834156,
              "num_responses": 7,
              "rvariance": 0.16345198944548203
            },
            {
              "id": "chat_hard_sample_379",
              "variance": 0.567288161821192,
              "mean_reward": -0.5364450190947566,
              "min_reward": -0.776867144818976,
              "max_reward": 0.01733628173069258,
              "num_responses": 7,
              "rvariance": 0.06977420252729696
            },
            {
              "id": "chat_hard_sample_247",
              "variance": 1.0705200353700741,
              "mean_reward": 0.420938171859728,
              "min_reward": -0.20957898299778416,
              "max_reward": 1.0715467824484073,
              "num_responses": 4,
              "rvariance": 0.24718188621840304
            },
            {
              "id": "chat_hard_sample_215",
              "variance": 0.7894760252011588,
              "mean_reward": 0.26620019557725116,
              "min_reward": -0.23794339108884374,
              "max_reward": 0.8564500210912055,
              "num_responses": 7,
              "rvariance": 0.1186643528228333
            },
            {
              "id": "chat_hard_sample_49",
              "variance": 1.3558187067526488,
              "mean_reward": -0.9261179588219324,
              "min_reward": -1.4387033336103665,
              "max_reward": 0.6177162529914539,
              "num_responses": 7,
              "rvariance": 0.4799644539925806
            },
            {
              "id": "chat_hard_sample_415",
              "variance": 2.198241627057118,
              "mean_reward": 1.0744169904100027,
              "min_reward": -0.776867144818976,
              "max_reward": 2.1730312966512213,
              "num_responses": 7,
              "rvariance": 1.0692762333345143
            },
            {
              "id": "chat_hard_sample_297",
              "variance": 0.7043828009279802,
              "mean_reward": 1.4209523928320251,
              "min_reward": 0.9876354085123561,
              "max_reward": 2.135212085863142,
              "num_responses": 7,
              "rvariance": 0.11555527058933544
            },
            {
              "id": "chat_hard_sample_80",
              "variance": 0.7611116171100991,
              "mean_reward": -0.18310553544612854,
              "min_reward": -0.5026778666053999,
              "max_reward": 0.25843375050469913,
              "num_responses": 5,
              "rvariance": 0.13073411680111555
            },
            {
              "id": "chat_hard_sample_413",
              "variance": 1.0967571128543043,
              "mean_reward": -1.2291218738264262,
              "min_reward": -2.100539522401757,
              "max_reward": -0.5310422746964595,
              "num_responses": 6,
              "rvariance": 0.25365098869023484
            },
            {
              "id": "chat_hard_sample_306",
              "variance": 0.6429265833973508,
              "mean_reward": -0.6850204900479259,
              "min_reward": -1.0037824095474528,
              "max_reward": -0.33249141805904237,
              "num_responses": 7,
              "rvariance": 0.062108271475168585
            },
            {
              "id": "chat_hard_sample_43",
              "variance": 1.6053073129202604,
              "mean_reward": -0.2822205697905127,
              "min_reward": -1.0983304365176514,
              "max_reward": 1.3194398906608968,
              "num_responses": 7,
              "rvariance": 0.6004675372239643
            },
            {
              "id": "chat_hard_sample_102",
              "variance": 0.4112839173203642,
              "mean_reward": 0.8824507285080102,
              "min_reward": 0.7075368786131426,
              "max_reward": 1.369373067404533,
              "num_responses": 6,
              "rvariance": 0.05202131005015464
            },
            {
              "id": "chat_hard_sample_187",
              "variance": 0.2930988836076158,
              "mean_reward": -0.6886223196467905,
              "min_reward": -0.8619603690921548,
              "max_reward": -0.5121326693024197,
              "num_responses": 6,
              "rvariance": 0.014948545281062117
            },
            {
              "id": "chat_hard_sample_360",
              "variance": 0.8387905771589546,
              "mean_reward": 1.600729504102997,
              "min_reward": 1.2479656448819607,
              "max_reward": 2.5323137991379765,
              "num_responses": 6,
              "rvariance": 0.1923149516480078
            },
            {
              "id": "chat_hard_sample_236",
              "variance": 0.9312980656564568,
              "mean_reward": 0.9101397935492824,
              "min_reward": 0.5373504300667851,
              "max_reward": 1.7097459644972481,
              "num_responses": 7,
              "rvariance": 0.1803664777248272
            },
            {
              "id": "chat_hard_sample_259",
              "variance": 0.9686445363096852,
              "mean_reward": 0.9447511248508731,
              "min_reward": 0.48534901523317586,
              "max_reward": 1.5986520328072649,
              "num_responses": 7,
              "rvariance": 0.1708380533544725
            },
            {
              "id": "chat_hard_sample_127",
              "variance": 0.8684236277212746,
              "mean_reward": 1.099438450404616,
              "min_reward": 0.7240827833329274,
              "max_reward": 1.6151979375270495,
              "num_responses": 5,
              "rvariance": 0.16619420171426355
            },
            {
              "id": "chat_hard_sample_280",
              "variance": 1.295307969491722,
              "mean_reward": 0.2131857661689612,
              "min_reward": -0.3986750369381814,
              "max_reward": 2.2297601128333406,
              "num_responses": 7,
              "rvariance": 0.7114611593786347
            },
            {
              "id": "chat_hard_sample_421",
              "variance": 0.8849695324410592,
              "mean_reward": -0.614784812870064,
              "min_reward": -1.051056423032552,
              "max_reward": -0.08666654793652592,
              "num_responses": 7,
              "rvariance": 0.13616970341048593
            },
            {
              "id": "chat_hard_sample_270",
              "variance": 1.1026663645399415,
              "mean_reward": 0.09573235409348231,
              "min_reward": -0.7485027367279163,
              "max_reward": 0.7429923887269672,
              "num_responses": 6,
              "rvariance": 0.24373904162352397
            },
            {
              "id": "chat_hard_sample_276",
              "variance": 0.34037289709271507,
              "mean_reward": -0.22848858839182387,
              "min_reward": -0.44594905042328076,
              "max_reward": 0.01733628173069258,
              "num_responses": 6,
              "rvariance": 0.023033672097530256
            },
            {
              "id": "chat_hard_sample_349",
              "variance": 0.560669799933278,
              "mean_reward": -0.07180900084120899,
              "min_reward": -0.6066806962726184,
              "max_reward": 0.4333476003995666,
              "num_responses": 7,
              "rvariance": 0.08731444386491909
            },
            {
              "id": "chat_hard_sample_267",
              "variance": 0.6467085044761587,
              "mean_reward": -0.9808207458546901,
              "min_reward": -1.4197937282163267,
              "max_reward": -0.427039445029241,
              "num_responses": 7,
              "rvariance": 0.08660568274789104
            },
            {
              "id": "chat_hard_sample_14",
              "variance": 0.3653394854645331,
              "mean_reward": 1.4195524629684038,
              "min_reward": 1.1448215033503113,
              "max_reward": 1.6317438422468342,
              "num_responses": 6,
              "rvariance": 0.025904221619351103
            },
            {
              "id": "chat_hard_sample_13",
              "variance": 1.8323407626824493,
              "mean_reward": 0.7737204974922817,
              "min_reward": -0.2757626018769232,
              "max_reward": 1.8019302907931918,
              "num_responses": 7,
              "rvariance": 0.5252191249677626
            },
            {
              "id": "chat_hard_sample_147",
              "variance": 0.7563842157615891,
              "mean_reward": 0.005045038224566767,
              "min_reward": -0.5121326693024197,
              "max_reward": 0.4806216138846659,
              "num_responses": 5,
              "rvariance": 0.11601104127279767
            },
            {
              "id": "chat_hard_sample_173",
              "variance": 1.246261180500931,
              "mean_reward": 1.0130451907605968,
              "min_reward": 0.3482543761263878,
              "max_reward": 2.092665473726553,
              "num_responses": 6,
              "rvariance": 0.3450500835639947
            },
            {
              "id": "chat_hard_sample_345",
              "variance": 0.6381991820488407,
              "mean_reward": -0.34667362210457214,
              "min_reward": -0.7201383286368568,
              "max_reward": 0.3482543761263878,
              "num_responses": 6,
              "rvariance": 0.11286648316613224
            },
            {
              "id": "chat_hard_sample_412",
              "variance": 0.6353627412397349,
              "mean_reward": 0.2513426484819342,
              "min_reward": -0.23794339108884374,
              "max_reward": 0.6768087698478281,
              "num_responses": 7,
              "rvariance": 0.08040767167977478
            },
            {
              "id": "chat_hard_sample_21",
              "variance": 0.9785720791415555,
              "mean_reward": 2.498434089473655,
              "min_reward": 1.941388630574235,
              "max_reward": 3.1185115663532077,
              "num_responses": 6,
              "rvariance": 0.17754563533758486
            },
            {
              "id": "chat_hard_sample_357",
              "variance": 0.6088892936880793,
              "mean_reward": -0.6309930460649552,
              "min_reward": -1.0226920149414924,
              "max_reward": -0.3230366153620225,
              "num_responses": 7,
              "rvariance": 0.060451759006027075
            },
            {
              "id": "chat_hard_sample_184",
              "variance": 0.1843686525918873,
              "mean_reward": -0.20327578119977088,
              "min_reward": -0.44594905042328076,
              "max_reward": -0.12448575872460538,
              "num_responses": 6,
              "rvariance": 0.012236948695195031
            },
            {
              "id": "chat_hard_sample_348",
              "variance": 0.43964832541142373,
              "mean_reward": 0.3671639815204275,
              "min_reward": 0.19225013162556007,
              "max_reward": 0.9580891500841691,
              "num_responses": 6,
              "rvariance": 0.07211803996642642
            },
            {
              "id": "chat_hard_sample_283",
              "variance": 0.16545904719784765,
              "mean_reward": -1.3205182998976182,
              "min_reward": -1.400884122822287,
              "max_reward": -1.1266948446087108,
              "num_responses": 6,
              "rvariance": 0.008276329139830575
            },
            {
              "id": "chat_hard_sample_0",
              "variance": 0.46801273350248324,
              "mean_reward": 0.5191161677225326,
              "min_reward": 0.24897894780767924,
              "max_reward": 0.8446315177199306,
              "num_responses": 7,
              "rvariance": 0.03999346514154169
            },
            {
              "id": "chat_hard_sample_258",
              "variance": 0.482194937548013,
              "mean_reward": -0.8916754632827885,
              "min_reward": -1.19287846348785,
              "max_reward": -0.568861485484539,
              "num_responses": 7,
              "rvariance": 0.04777250607592422
            },
            {
              "id": "chat_hard_sample_161",
              "variance": 0.4387028451417217,
              "mean_reward": 0.07311961764310977,
              "min_reward": -0.12448575872460538,
              "max_reward": 0.49007641658168577,
              "num_responses": 5,
              "rvariance": 0.04931291672399066
            },
            {
              "id": "chat_hard_sample_4",
              "variance": 0.7166740444341059,
              "mean_reward": -0.6363957904632522,
              "min_reward": -1.0132372122444726,
              "max_reward": 0.1402487167919508,
              "num_responses": 7,
              "rvariance": 0.12541696718458287
            },
            {
              "id": "chat_hard_sample_238",
              "variance": 0.8651144467773175,
              "mean_reward": -0.061453740744472955,
              "min_reward": -0.5404970773934794,
              "max_reward": 0.49007641658168577,
              "num_responses": 6,
              "rvariance": 0.13169618729674587
            },
            {
              "id": "chat_hard_sample_8",
              "variance": 0.22029690284056286,
              "mean_reward": 0.41376265195573975,
              "min_reward": 0.24897894780767924,
              "max_reward": 0.608261450294434,
              "num_responses": 7,
              "rvariance": 0.011004496931565525
            },
            {
              "id": "chat_hard_sample_32",
              "variance": 1.0022090858841055,
              "mean_reward": 1.1916734274292937,
              "min_reward": 0.3246173693838382,
              "max_reward": 1.7097459644972481,
              "num_responses": 7,
              "rvariance": 0.19393922175984826
            },
            {
              "id": "chat_hard_sample_109",
              "variance": 0.8758101923283214,
              "mean_reward": 0.5850676374283071,
              "min_reward": -0.5594066827875191,
              "max_reward": 1.211743778690155,
              "num_responses": 7,
              "rvariance": 0.25646175942588895
            },
            {
              "id": "chat_hard_sample_188",
              "variance": 0.4046655554324501,
              "mean_reward": -1.4562622529048321,
              "min_reward": -1.6467089929448033,
              "max_reward": -1.1456044500027507,
              "num_responses": 7,
              "rvariance": 0.031068730561100953
            },
            {
              "id": "chat_hard_sample_53",
              "variance": 0.41222939759006616,
              "mean_reward": -0.9740673153568188,
              "min_reward": -1.2117880688818896,
              "max_reward": -0.635045104363678,
              "num_responses": 7,
              "rvariance": 0.03403147973498399
            },
            {
              "id": "chat_hard_sample_356",
              "variance": 1.1950870609033108,
              "mean_reward": -1.3009333514537913,
              "min_reward": -1.7601666253090418,
              "max_reward": -0.5310422746964595,
              "num_responses": 7,
              "rvariance": 0.24015782096672522
            },
            {
              "id": "chat_hard_sample_63",
              "variance": 0.7204559655129136,
              "mean_reward": 0.3816838570908509,
              "min_reward": 0.09770210465536143,
              "max_reward": 0.8564500210912055,
              "num_responses": 7,
              "rvariance": 0.08886400364297752
            },
            {
              "id": "chat_hard_sample_159",
              "variance": 0.5015772830769039,
              "mean_reward": -0.15403201715279247,
              "min_reward": -0.3986750369381814,
              "max_reward": 0.22061453971661965,
              "num_responses": 4,
              "rvariance": 0.058601494553598914
            },
            {
              "id": "chat_hard_sample_152",
              "variance": 0.34982769978973505,
              "mean_reward": 0.5137134233242354,
              "min_reward": 0.2773433558987388,
              "max_reward": 0.8115397082803611,
              "num_responses": 6,
              "rvariance": 0.026803089329532303
            },
            {
              "id": "chat_hard_sample_318",
              "variance": 0.5861977672152316,
              "mean_reward": -0.5074052679539098,
              "min_reward": -0.8241411583040753,
              "max_reward": -0.13394056142162525,
              "num_responses": 6,
              "rvariance": 0.06009464191810368
            },
            {
              "id": "chat_hard_sample_176",
              "variance": 0.34793673925033075,
              "mean_reward": -1.9681722846434788,
              "min_reward": -2.138358733189836,
              "max_reward": -1.7790762307030816,
              "num_responses": 7,
              "rvariance": 0.018185150101764764
            },
            {
              "id": "chat_hard_sample_274",
              "variance": 0.44437572675993375,
              "mean_reward": -1.162938254947287,
              "min_reward": -1.533251360580565,
              "max_reward": -0.8997795798802342,
              "num_responses": 6,
              "rvariance": 0.04104393769944779
            },
            {
              "id": "chat_hard_sample_389",
              "variance": 1.006936487232616,
              "mean_reward": -0.754918495700894,
              "min_reward": -1.1739688580938104,
              "max_reward": 0.7477197900754771,
              "num_responses": 7,
              "rvariance": 0.3941840629057336
            },
            {
              "id": "chat_hard_sample_42",
              "variance": 1.550469457277545,
              "mean_reward": 0.20453293334356354,
              "min_reward": -0.4081298396352013,
              "max_reward": 1.2591655234673953,
              "num_responses": 7,
              "rvariance": 0.44194078761609246
            },
            {
              "id": "chat_hard_sample_5",
              "variance": 0.5597243196635759,
              "mean_reward": -1.6467089929448033,
              "min_reward": -1.9114434684613597,
              "max_reward": -1.19287846348785,
              "num_responses": 7,
              "rvariance": 0.06150258629922697
            },
            {
              "id": "chat_hard_sample_17",
              "variance": 0.9708900519502273,
              "mean_reward": 1.4517086408910813,
              "min_reward": 1.0124542655920332,
              "max_reward": 2.215577908787811,
              "num_responses": 6,
              "rvariance": 0.20003549822970776
            },
            {
              "id": "chat_hard_sample_182",
              "variance": 0.5023454857960364,
              "mean_reward": 1.0022608064343086,
              "min_reward": 0.7004457765903778,
              "max_reward": 1.3451451354934196,
              "num_responses": 4,
              "rvariance": 0.055996758164358396
            },
            {
              "id": "chat_hard_sample_140",
              "variance": 0.6088892936880792,
              "mean_reward": -0.3948931158593735,
              "min_reward": -0.8619603690921548,
              "max_reward": -0.029937731754406737,
              "num_responses": 5,
              "rvariance": 0.07979602999148541
            },
            {
              "id": "chat_hard_sample_251",
              "variance": 0.7516568144130791,
              "mean_reward": -0.594074292676592,
              "min_reward": -0.9281439879712938,
              "max_reward": 0.3482543761263878,
              "num_responses": 6,
              "rvariance": 0.18798416477699767
            },
            {
              "id": "chat_hard_sample_98",
              "variance": 0.9322435459261588,
              "mean_reward": -0.3115557835156412,
              "min_reward": -0.8052315529100356,
              "max_reward": 0.5609874368093347,
              "num_responses": 7,
              "rvariance": 0.18472394472102152
            },
            {
              "id": "chat_hard_sample_409",
              "variance": 0.5601970597984269,
              "mean_reward": -0.44831275109753577,
              "min_reward": -0.701228723242817,
              "max_reward": 0.2773433558987388,
              "num_responses": 6,
              "rvariance": 0.10953472060286563
            },
            {
              "id": "chat_hard_sample_248",
              "variance": 0.6618361887913905,
              "mean_reward": -0.7944260641134414,
              "min_reward": -1.3630649120342075,
              "max_reward": -0.5026778666053999,
              "num_responses": 7,
              "rvariance": 0.08815273404065756
            },
            {
              "id": "chat_hard_sample_382",
              "variance": 0.2874260019894037,
              "mean_reward": -1.5035362663899312,
              "min_reward": -1.6845282037328828,
              "max_reward": -1.3063360958520884,
              "num_responses": 7,
              "rvariance": 0.016127279985914986
            },
            {
              "id": "chat_hard_sample_254",
              "variance": 0.5341963523816223,
              "mean_reward": -0.5877710908785786,
              "min_reward": -0.8146863556070554,
              "max_reward": -0.09612135063354578,
              "num_responses": 6,
              "rvariance": 0.0632606544153386
            },
            {
              "id": "chat_hard_sample_2",
              "variance": 0.31200848900165556,
              "mean_reward": -0.33114073195946814,
              "min_reward": -0.4837682612113602,
              "max_reward": -0.0015733236633471456,
              "num_responses": 7,
              "rvariance": 0.023942807979089185
            },
            {
              "id": "chat_hard_sample_203",
              "variance": 0.5521604775059601,
              "mean_reward": -0.8619603690921548,
              "min_reward": -1.4954321497924856,
              "max_reward": -0.5972258935755985,
              "num_responses": 7,
              "rvariance": 0.08479592463182457
            },
            {
              "id": "chat_hard_sample_68",
              "variance": 0.2893169625288078,
              "mean_reward": -0.7636304210431482,
              "min_reward": -0.9375987906683136,
              "max_reward": -0.6066806962726184,
              "num_responses": 5,
              "rvariance": 0.01711345221093606
            },
            {
              "id": "chat_hard_sample_220",
              "variance": 0.431139002984106,
              "mean_reward": -1.9303530738553991,
              "min_reward": -2.2707259709481145,
              "max_reward": -1.533251360580565,
              "num_responses": 7,
              "rvariance": 0.045360711489795306
            },
            {
              "id": "chat_hard_sample_11",
              "variance": 0.11534859290364241,
              "mean_reward": -0.9423261920168235,
              "min_reward": -1.0226920149414924,
              "max_reward": -0.8619603690921548,
              "num_responses": 4,
              "rvariance": 0.003240506908934559
            },
            {
              "id": "chat_hard_sample_6",
              "variance": 0.8107493312694535,
              "mean_reward": -0.8895368769584627,
              "min_reward": -1.325245701246128,
              "max_reward": 0.09770210465536143,
              "num_responses": 6,
              "rvariance": 0.21016673822085952
            },
            {
              "id": "chat_hard_sample_286",
              "variance": 0.5672881618211918,
              "mean_reward": -1.5868285758636775,
              "min_reward": -1.9114434684613597,
              "max_reward": -1.117240041911691,
              "num_responses": 6,
              "rvariance": 0.06989562335072035
            },
            {
              "id": "chat_hard_sample_400",
              "variance": 0.6415083629927979,
              "mean_reward": 0.48940107353189866,
              "min_reward": 0.15915832218599055,
              "max_reward": 0.9580891500841691,
              "num_responses": 7,
              "rvariance": 0.07910143497503322
            },
            {
              "id": "chat_hard_sample_209",
              "variance": 0.7034373206582778,
              "mean_reward": -0.47431345851434026,
              "min_reward": -0.7295931313338766,
              "max_reward": 0.03624588712473231,
              "num_responses": 7,
              "rvariance": 0.08740110062954928
            },
            {
              "id": "chat_hard_sample_337",
              "variance": 1.3028718116493372,
              "mean_reward": 0.10850759345195557,
              "min_reward": -0.5404970773934794,
              "max_reward": 0.9155425379475797,
              "num_responses": 7,
              "rvariance": 0.304107776734403
            },
            {
              "id": "chat_hard_sample_268",
              "variance": 0.6907915220510137,
              "mean_reward": 1.1990881313300816,
              "min_reward": 0.3482543761263878,
              "max_reward": 1.449738890329202,
              "num_responses": 6,
              "rvariance": 0.15495517589028796
            },
            {
              "id": "chat_hard_sample_249",
              "variance": 0.4656490328282283,
              "mean_reward": 0.6774841128976151,
              "min_reward": 0.2773433558987388,
              "max_reward": 1.019545367614798,
              "num_responses": 7,
              "rvariance": 0.047553583723174246
            },
            {
              "id": "chat_hard_sample_295",
              "variance": 0.9639171349611753,
              "mean_reward": 1.2950853319279485,
              "min_reward": 0.7382649873784571,
              "max_reward": 1.9602982359682746,
              "num_responses": 7,
              "rvariance": 0.16046881607033012
            },
            {
              "id": "chat_hard_sample_153",
              "variance": 0.30491738697889065,
              "mean_reward": 0.29231346016902027,
              "min_reward": -0.18121457490672455,
              "max_reward": 0.42862019905105664,
              "num_responses": 6,
              "rvariance": 0.04520631295316544
            },
            {
              "id": "chat_hard_sample_192",
              "variance": 0.21746046203145697,
              "mean_reward": -0.9924366463110289,
              "min_reward": -1.0983304365176514,
              "max_reward": -0.8619603690921548,
              "num_responses": 5,
              "rvariance": 0.010026351859478633
            },
            {
              "id": "chat_hard_sample_363",
              "variance": 0.4207387200173841,
              "mean_reward": -1.0494806225830489,
              "min_reward": -1.4576129390044061,
              "max_reward": -0.8525055663951349,
              "num_responses": 6,
              "rvariance": 0.04116312875816722
            },
            {
              "id": "chat_hard_sample_129",
              "variance": 1.5078046601072428,
              "mean_reward": 0.7929846579874595,
              "min_reward": 0.16388572353450048,
              "max_reward": 1.9792078413623142,
              "num_responses": 5,
              "rvariance": 0.5273002567238125
            },
            {
              "id": "chat_hard_sample_359",
              "variance": 0.7209287056477648,
              "mean_reward": 0.33390333631841124,
              "min_reward": -0.0677569425424862,
              "max_reward": 1.0325457213232005,
              "num_responses": 7,
              "rvariance": 0.11557292975568033
            },
            {
              "id": "chat_hard_sample_7",
              "variance": 0.486922338896523,
              "mean_reward": -0.4491006513222873,
              "min_reward": -0.6823191178487773,
              "max_reward": 0.0929747033068515,
              "num_responses": 6,
              "rvariance": 0.06590272288361934
            },
            {
              "id": "chat_hard_sample_316",
              "variance": 0.5389237537301323,
              "mean_reward": -0.4959244361075286,
              "min_reward": -0.9470535933653336,
              "max_reward": -0.23794339108884374,
              "num_responses": 7,
              "rvariance": 0.05996283241821881
            },
            {
              "id": "chat_hard_sample_41",
              "variance": 1.3189449762342709,
              "mean_reward": -0.022058729506890157,
              "min_reward": -0.9186891852742739,
              "max_reward": 0.5704422395063546,
              "num_responses": 6,
              "rvariance": 0.3416661361133655
            },
            {
              "id": "chat_hard_sample_143",
              "variance": 0.4682491035699088,
              "mean_reward": 0.7164007561415988,
              "min_reward": 0.4664394098391361,
              "max_reward": 1.092820088516702,
              "num_responses": 4,
              "rvariance": 0.05427395122144095
            },
            {
              "id": "chat_hard_sample_370",
              "variance": 0.5899796882940397,
              "mean_reward": -0.5222628150492267,
              "min_reward": -0.8525055663951349,
              "max_reward": 0.09770210465536143,
              "num_responses": 7,
              "rvariance": 0.08298525433928829
            },
            {
              "id": "chat_hard_sample_91",
              "variance": 0.281753120371192,
              "mean_reward": -0.33114073195946814,
              "min_reward": -0.5026778666053999,
              "max_reward": -0.15285016681566496,
              "num_responses": 7,
              "rvariance": 0.01607619810360667
            },
            {
              "id": "chat_hard_sample_245",
              "variance": 0.2930988836076158,
              "mean_reward": -1.0645632840282948,
              "min_reward": -1.19287846348785,
              "max_reward": -0.8714151717891746,
              "num_responses": 7,
              "rvariance": 0.015244293163156763
            },
            {
              "id": "chat_hard_sample_131",
              "variance": 1.035300895323675,
              "mean_reward": -0.427039445029241,
              "min_reward": -0.8808699744861944,
              "max_reward": 0.4522572057936063,
              "num_responses": 6,
              "rvariance": 0.22384080827509348
            },
            {
              "id": "chat_hard_sample_171",
              "variance": 0.4803039770086093,
              "mean_reward": -0.6296423599653809,
              "min_reward": -1.060511225729572,
              "max_reward": -0.1433953641186451,
              "num_responses": 7,
              "rvariance": 0.06402749076761005
            },
            {
              "id": "chat_hard_sample_329",
              "variance": 0.5171777075269866,
              "mean_reward": 1.2206962949938958,
              "min_reward": 0.9699076534554438,
              "max_reward": 1.5726513253904602,
              "num_responses": 5,
              "rvariance": 0.05377028984803891
            },
            {
              "id": "chat_hard_sample_384",
              "variance": 0.6410356228579467,
              "mean_reward": -1.1334482751065824,
              "min_reward": -1.5143417551865253,
              "max_reward": -0.7201383286368568,
              "num_responses": 7,
              "rvariance": 0.07602808440418796
            },
            {
              "id": "chat_hard_sample_29",
              "variance": 1.0026818260189572,
              "mean_reward": -0.36271301953701646,
              "min_reward": -0.7863219475159958,
              "max_reward": 1.5076495568484487,
              "num_responses": 7,
              "rvariance": 0.5875996241081347
            },
            {
              "id": "chat_hard_sample_106",
              "variance": 0.272298317674172,
              "mean_reward": -1.178020916392533,
              "min_reward": -1.325245701246128,
              "max_reward": -0.9565083960623534,
              "num_responses": 7,
              "rvariance": 0.015167670339694263
            },
            {
              "id": "chat_hard_sample_320",
              "variance": 0.5672881618211918,
              "mean_reward": 0.09061100263259654,
              "min_reward": -0.3230366153620225,
              "max_reward": 0.33879957342936795,
              "num_responses": 6,
              "rvariance": 0.06486787134775844
            },
            {
              "id": "chat_hard_sample_23",
              "variance": 0.6750729125672185,
              "mean_reward": -0.6215382433679354,
              "min_reward": -0.9281439879712938,
              "max_reward": 0.007881479033672718,
              "num_responses": 7,
              "rvariance": 0.09557055309300264
            },
            {
              "id": "chat_hard_sample_235",
              "variance": 1.8228859599854297,
              "mean_reward": -0.6137717982953834,
              "min_reward": -1.2306976742759295,
              "max_reward": 0.6531717631052785,
              "num_responses": 7,
              "rvariance": 0.6298507830234398
            },
            {
              "id": "chat_hard_sample_202",
              "variance": 0.4301935227144038,
              "mean_reward": 0.4495558335944578,
              "min_reward": 0.04097328847324224,
              "max_reward": 0.612988851642944,
              "num_responses": 7,
              "rvariance": 0.039172506318729296
            },
            {
              "id": "chat_hard_sample_304",
              "variance": 0.20611469879503308,
              "mean_reward": -1.0334975037380867,
              "min_reward": -1.2306976742759295,
              "max_reward": -0.9281439879712938,
              "num_responses": 7,
              "rvariance": 0.01012515881468645
            },
            {
              "id": "chat_hard_sample_277",
              "variance": 0.5625607604726819,
              "mean_reward": -0.08036334613851268,
              "min_reward": -0.4081298396352013,
              "max_reward": 0.5278956273697653,
              "num_responses": 6,
              "rvariance": 0.08759549557055601
            },
            {
              "id": "chat_hard_sample_196",
              "variance": 0.43113900298410585,
              "mean_reward": 0.14497611814046074,
              "min_reward": -0.1433953641186451,
              "max_reward": 0.4806216138846659,
              "num_responses": 7,
              "rvariance": 0.03710460226171179
            },
            {
              "id": "chat_hard_sample_185",
              "variance": 0.5029955034814566,
              "mean_reward": -1.3671169703329302,
              "min_reward": -1.7601666253090418,
              "max_reward": -1.1266948446087108,
              "num_responses": 7,
              "rvariance": 0.043518115020816324
            },
            {
              "id": "chat_hard_sample_160",
              "variance": 1.5222232342201982,
              "mean_reward": 0.6584900896223521,
              "min_reward": -0.4364942477262609,
              "max_reward": 1.1903227413297195,
              "num_responses": 7,
              "rvariance": 0.436651521666438
            },
            {
              "id": "chat_hard_sample_163",
              "variance": 0.836750038686258,
              "mean_reward": 0.475894212536156,
              "min_reward": -0.058302139845466325,
              "max_reward": 0.8304493136744009,
              "num_responses": 6,
              "rvariance": 0.14290262996342917
            },
            {
              "id": "chat_hard_sample_266",
              "variance": 0.43492092406291377,
              "mean_reward": -0.3797654315441417,
              "min_reward": -0.7390479340308965,
              "max_reward": -0.16230496951268483,
              "num_responses": 7,
              "rvariance": 0.03575731761582963
            },
            {
              "id": "chat_hard_sample_289",
              "variance": 0.342263857632119,
              "mean_reward": -1.0632125979287204,
              "min_reward": -1.268516885064009,
              "max_reward": -0.8525055663951349,
              "num_responses": 7,
              "rvariance": 0.01973585010041046
            },
            {
              "id": "chat_hard_sample_69",
              "variance": 0.38953787111721827,
              "mean_reward": -0.9011302659798084,
              "min_reward": -1.0794208311236115,
              "max_reward": -0.5594066827875191,
              "num_responses": 7,
              "rvariance": 0.030813321149559293
            },
            {
              "id": "chat_hard_sample_40",
              "variance": 0.38008306842019857,
              "mean_reward": -0.7485027367279165,
              "min_reward": -0.9470535933653336,
              "max_reward": -0.4364942477262609,
              "num_responses": 7,
              "rvariance": 0.026715824447255572
            },
            {
              "id": "chat_hard_sample_313",
              "variance": 0.6041618923395694,
              "mean_reward": 0.20305562042215422,
              "min_reward": -0.1717597722097047,
              "max_reward": 0.750083490749732,
              "num_responses": 7,
              "rvariance": 0.07981361675382301
            },
            {
              "id": "chat_hard_sample_226",
              "variance": 1.436184529677317,
              "mean_reward": 2.092327802201659,
              "min_reward": 0.7193553819844175,
              "max_reward": 2.5795878126230756,
              "num_responses": 7,
              "rvariance": 0.4590416342608537
            },
            {
              "id": "chat_hard_sample_28",
              "variance": 0.6965825887029388,
              "mean_reward": 0.8643853019262044,
              "min_reward": 0.4475298044450964,
              "max_reward": 1.6270164408983243,
              "num_responses": 7,
              "rvariance": 0.12239486952913402
            },
            {
              "id": "chat_hard_sample_323",
              "variance": 0.10778475074602645,
              "mean_reward": -0.13866796277013518,
              "min_reward": -0.2001241803007643,
              "max_reward": -0.08666654793652592,
              "num_responses": 4,
              "rvariance": 0.002748843791716903
            },
            {
              "id": "chat_hard_sample_116",
              "variance": 0.5375055333255793,
              "mean_reward": 0.5609874368093348,
              "min_reward": 0.30570776398979843,
              "max_reward": 0.8729959258109903,
              "num_responses": 7,
              "rvariance": 0.04818458179615258
            },
            {
              "id": "chat_hard_sample_36",
              "variance": 0.7417292715812083,
              "mean_reward": 0.5221552114465746,
              "min_reward": -0.19066937760374442,
              "max_reward": 0.8233582116516359,
              "num_responses": 7,
              "rvariance": 0.11872524060219189
            },
            {
              "id": "chat_hard_sample_351",
              "variance": 0.29688080468642375,
              "mean_reward": 0.1510542055885449,
              "min_reward": -0.08666654793652592,
              "max_reward": 0.3293447707323481,
              "num_responses": 7,
              "rvariance": 0.016414615573899345
            },
            {
              "id": "chat_hard_sample_296",
              "variance": 0.2836440809105959,
              "mean_reward": 0.11267220892564289,
              "min_reward": -0.029937731754406737,
              "max_reward": 0.3577091788234077,
              "num_responses": 6,
              "rvariance": 0.016719649919221174
            },
            {
              "id": "chat_hard_sample_338",
              "variance": 0.1947689355586092,
              "mean_reward": -1.0875249477210573,
              "min_reward": -1.2117880688818896,
              "max_reward": -0.9659631987593732,
              "num_responses": 7,
              "rvariance": 0.007136868699649264
            },
            {
              "id": "chat_hard_sample_354",
              "variance": 1.1563223698455292,
              "mean_reward": 2.09334081677634,
              "min_reward": 1.5490143186479106,
              "max_reward": 2.759229063866453,
              "num_responses": 7,
              "rvariance": 0.20298936635212791
            },
            {
              "id": "chat_hard_sample_186",
              "variance": 0.5531059577756621,
              "mean_reward": 0.07248929746330846,
              "min_reward": -0.25685299648288346,
              "max_reward": 0.49953121927870564,
              "num_responses": 6,
              "rvariance": 0.06283355312159396
            },
            {
              "id": "chat_hard_sample_54",
              "variance": 0.5864341372826569,
              "mean_reward": 0.8476705614439727,
              "min_reward": -0.029937731754406737,
              "max_reward": 1.1010930408765944,
              "num_responses": 7,
              "rvariance": 0.13505525180851807
            },
            {
              "id": "chat_hard_sample_241",
              "variance": 0.5181231877966886,
              "mean_reward": -0.42771478807902813,
              "min_reward": -0.8335959610010951,
              "max_reward": 0.19225013162556007,
              "num_responses": 7,
              "rvariance": 0.08242335363389668
            },
            {
              "id": "chat_hard_sample_67",
              "variance": 0.6571087874428805,
              "mean_reward": 1.118401344586178,
              "min_reward": 0.45698460714211625,
              "max_reward": 1.4651029447118593,
              "num_responses": 7,
              "rvariance": 0.10007676101576117
            },
            {
              "id": "chat_hard_sample_262",
              "variance": 0.5597243196635759,
              "mean_reward": -0.2838667184743688,
              "min_reward": -0.9281439879712938,
              "max_reward": -0.0677569425424862,
              "num_responses": 7,
              "rvariance": 0.083861855926758
            },
            {
              "id": "chat_hard_sample_244",
              "variance": 0.5011045429420529,
              "mean_reward": -0.9416508489670365,
              "min_reward": -1.249607279669969,
              "max_reward": -0.6634095124547376,
              "num_responses": 7,
              "rvariance": 0.04637870043008271
            },
            {
              "id": "chat_hard_sample_85",
              "variance": 0.3742920017682738,
              "mean_reward": 1.1845190119956113,
              "min_reward": 0.9037240345763048,
              "max_reward": 1.3989193258327202,
              "num_responses": 7,
              "rvariance": 0.02497703704556875
            },
            {
              "id": "chat_hard_sample_398",
              "variance": 0.4992135824026491,
              "mean_reward": -0.7633602838232333,
              "min_reward": -1.0132372122444726,
              "max_reward": 0.03624588712473231,
              "num_responses": 7,
              "rvariance": 0.11120160907935098
            },
            {
              "id": "chat_hard_sample_319",
              "variance": 0.45572148999635753,
              "mean_reward": -0.5445491356922021,
              "min_reward": -0.7863219475159958,
              "max_reward": -0.1433953641186451,
              "num_responses": 7,
              "rvariance": 0.04121943031694158
            },
            {
              "id": "chat_hard_sample_190",
              "variance": 0.45235321653554394,
              "mean_reward": 1.2360209543653156,
              "min_reward": 0.9793624561524638,
              "max_reward": 1.4934673528029188,
              "num_responses": 6,
              "rvariance": 0.03703520716986062
            },
            {
              "id": "chat_hard_sample_20",
              "variance": 0.8140585122134103,
              "mean_reward": -0.21160501214714553,
              "min_reward": -0.568861485484539,
              "max_reward": 0.3955283896114871,
              "num_responses": 7,
              "rvariance": 0.13057714947419377
            },
            {
              "id": "chat_hard_sample_264",
              "variance": 0.5434147850112167,
              "mean_reward": 0.7144591448734607,
              "min_reward": 0.3766187842174474,
              "max_reward": 0.9817261568267187,
              "num_responses": 7,
              "rvariance": 0.055004184117402447
            },
            {
              "id": "chat_hard_sample_27",
              "variance": 0.651317720790956,
              "mean_reward": 1.002239701964003,
              "min_reward": 0.6366258583854937,
              "max_reward": 1.7073822638229932,
              "num_responses": 7,
              "rvariance": 0.10562064263477668
            },
            {
              "id": "chat_hard_sample_115",
              "variance": 0.7979853476284768,
              "mean_reward": -0.5202367858998654,
              "min_reward": -0.843050763698115,
              "max_reward": 0.41443799500552686,
              "num_responses": 7,
              "rvariance": 0.1740469191421112
            },
            {
              "id": "chat_hard_sample_260",
              "variance": 0.7318017287493375,
              "mean_reward": -0.060328168994827736,
              "min_reward": -0.6255903016666582,
              "max_reward": 0.4380750017480765,
              "num_responses": 7,
              "rvariance": 0.1062238620836984
            },
            {
              "id": "chat_hard_sample_175",
              "variance": 0.3157904100804634,
              "mean_reward": -0.9970289790495813,
              "min_reward": -1.3819745174282472,
              "max_reward": -0.776867144818976,
              "num_responses": 7,
              "rvariance": 0.030590750090930156
            },
            {
              "id": "chat_hard_sample_200",
              "variance": 0.10234823919523994,
              "mean_reward": 1.7387012977568714,
              "min_reward": 1.6837452570804436,
              "max_reward": 1.8279309982099965,
              "num_responses": 4,
              "rvariance": 0.002895155472195736
            },
            {
              "id": "chat_hard_sample_240",
              "variance": 0.17869577097367542,
              "mean_reward": -0.12684945939886033,
              "min_reward": -0.2757626018769232,
              "max_reward": -0.020482929057386873,
              "num_responses": 4,
              "rvariance": 0.008598517470431534
            },
            {
              "id": "chat_hard_sample_130",
              "variance": 0.9246797037685427,
              "mean_reward": 0.05988289386728196,
              "min_reward": -0.4364942477262609,
              "max_reward": 0.6413532597340036,
              "num_responses": 7,
              "rvariance": 0.14412114569765905
            },
            {
              "id": "chat_hard_sample_374",
              "variance": 0.3047105631698932,
              "mean_reward": 1.3469390154694167,
              "min_reward": 1.1152752449221242,
              "max_reward": 1.58210612808748,
              "num_responses": 7,
              "rvariance": 0.019150495592017737
            },
            {
              "id": "chat_hard_sample_257",
              "variance": 0.557360618989321,
              "mean_reward": 0.6107939867311357,
              "min_reward": 0.25370634915618917,
              "max_reward": 1.06563753076277,
              "num_responses": 7,
              "rvariance": 0.06271435572831571
            },
            {
              "id": "chat_hard_sample_237",
              "variance": 0.7062737614673837,
              "mean_reward": -0.029937731754406744,
              "min_reward": -0.9754180014563931,
              "max_reward": 0.3151625666868183,
              "num_responses": 7,
              "rvariance": 0.1641388583272351
            },
            {
              "id": "chat_hard_sample_22",
              "variance": 1.1714500541607613,
              "mean_reward": -0.051683777957552426,
              "min_reward": -0.9848728041534129,
              "max_reward": 0.6649902664765532,
              "num_responses": 5,
              "rvariance": 0.3009121306642527
            },
            {
              "id": "chat_hard_sample_292",
              "variance": 0.23447910688609264,
              "mean_reward": -0.6917739205457971,
              "min_reward": -0.8619603690921548,
              "max_reward": -0.5310422746964595,
              "num_responses": 7,
              "rvariance": 0.011008145637444702
            },
            {
              "id": "chat_hard_sample_92",
              "variance": 0.22691526472847667,
              "mean_reward": -0.6555305102072211,
              "min_reward": -0.776867144818976,
              "max_reward": -0.49322306390838005,
              "num_responses": 6,
              "rvariance": 0.01011385796175515
            },
            {
              "id": "chat_hard_sample_407",
              "variance": 0.351718660329139,
              "mean_reward": -0.5461699590116913,
              "min_reward": -0.710683525939837,
              "max_reward": -0.23794339108884374,
              "num_responses": 5,
              "rvariance": 0.02944972678839729
            },
            {
              "id": "chat_hard_sample_44",
              "variance": 0.2552796728195361,
              "mean_reward": -1.2338492751749361,
              "min_reward": -1.3819745174282472,
              "max_reward": -1.0888756338206316,
              "num_responses": 6,
              "rvariance": 0.012177353165835304
            },
            {
              "id": "chat_hard_sample_119",
              "variance": 0.7374746103675496,
              "mean_reward": -0.6785371967699694,
              "min_reward": -0.9375987906683136,
              "max_reward": 0.2726159545502289,
              "num_responses": 5,
              "rvariance": 0.2264010322163869
            },
            {
              "id": "chat_hard_sample_303",
              "variance": 0.3309180943956952,
              "mean_reward": -1.0078344678461755,
              "min_reward": -1.2117880688818896,
              "max_reward": -0.8241411583040753,
              "num_responses": 7,
              "rvariance": 0.019841662570906273
            },
            {
              "id": "chat_hard_sample_365",
              "variance": 0.2685163965953641,
              "mean_reward": -1.196660384566658,
              "min_reward": -1.3630649120342075,
              "max_reward": -1.0037824095474528,
              "num_responses": 5,
              "rvariance": 0.015075285106833768
            },
            {
              "id": "chat_hard_sample_45",
              "variance": 0.1522223234220198,
              "mean_reward": 0.014634909531544048,
              "min_reward": -0.12448575872460538,
              "max_reward": 0.10715690735238129,
              "num_responses": 7,
              "rvariance": 0.00489017805455262
            },
            {
              "id": "chat_hard_sample_78",
              "variance": 0.44910312810844355,
              "mean_reward": -0.47194975784008536,
              "min_reward": -0.8335959610010951,
              "max_reward": -0.22848858839182387,
              "num_responses": 4,
              "rvariance": 0.05016639919883348
            },
            {
              "id": "chat_hard_sample_189",
              "variance": 0.3665508820600889,
              "mean_reward": 1.6333688864603848,
              "min_reward": 1.390055448304264,
              "max_reward": 1.8184761955129767,
              "num_responses": 4,
              "rvariance": 0.029960961275332473
            },
            {
              "id": "chat_hard_sample_39",
              "variance": 2.1320580081779794,
              "mean_reward": 1.180454291014705,
              "min_reward": -0.4837682612113602,
              "max_reward": 2.2344875141818505,
              "num_responses": 5,
              "rvariance": 0.9690893606526568
            },
            {
              "id": "chat_hard_sample_387",
              "variance": 0.3952107527354305,
              "mean_reward": -1.1915277773882758,
              "min_reward": -1.476522544398446,
              "max_reward": -0.9565083960623534,
              "num_responses": 7,
              "rvariance": 0.027518539740672164
            },
            {
              "id": "chat_hard_sample_118",
              "variance": 0.6358354813745858,
              "mean_reward": 0.583442593214757,
              "min_reward": 0.20643233567108984,
              "max_reward": 0.962816551432679,
              "num_responses": 6,
              "rvariance": 0.07439710337436241
            },
            {
              "id": "chat_hard_sample_154",
              "variance": 0.5521604775059601,
              "mean_reward": 0.16185969438513909,
              "min_reward": -0.219033785694804,
              "max_reward": 0.4806216138846659,
              "num_responses": 7,
              "rvariance": 0.058283515537332506
            },
            {
              "id": "chat_hard_sample_103",
              "variance": 0.8220950945058771,
              "mean_reward": 0.3945153750368065,
              "min_reward": -0.0677569425424862,
              "max_reward": 0.9202699392960896,
              "num_responses": 7,
              "rvariance": 0.10858069803752238
            },
            {
              "id": "chat_hard_sample_162",
              "variance": 0.24393390958311256,
              "mean_reward": -1.5285239592320552,
              "min_reward": -1.7790762307030816,
              "max_reward": -1.4387033336103665,
              "num_responses": 4,
              "rvariance": 0.020985075775790025
            },
            {
              "id": "chat_hard_sample_321",
              "variance": 0.5341963523816222,
              "mean_reward": 0.3570338357736205,
              "min_reward": -0.07721174523950605,
              "max_reward": 0.6271710556884738,
              "num_responses": 7,
              "rvariance": 0.06175434700488945
            },
            {
              "id": "chat_hard_sample_273",
              "variance": 0.2091875096715644,
              "mean_reward": 1.0909628951297874,
              "min_reward": 0.9415432453643843,
              "max_reward": 1.1507307550359487,
              "num_responses": 7,
              "rvariance": 0.008930492694406296
            },
            {
              "id": "chat_hard_sample_291",
              "variance": 0.26851639659536425,
              "mean_reward": -0.4594559114190234,
              "min_reward": -0.6444999070606979,
              "max_reward": -0.22848858839182387,
              "num_responses": 7,
              "rvariance": 0.015474161633544235
            },
            {
              "id": "chat_hard_sample_312",
              "variance": 0.3309180943956953,
              "mean_reward": -0.1190830143263083,
              "min_reward": -0.34194622075606224,
              "max_reward": 0.13079391409493094,
              "num_responses": 7,
              "rvariance": 0.021936019745547732
            },
            {
              "id": "chat_hard_sample_314",
              "variance": 0.7185650049735095,
              "mean_reward": -0.6949255214448038,
              "min_reward": -1.0226920149414924,
              "max_reward": -0.2001241803007643,
              "num_responses": 6,
              "rvariance": 0.09379343062396645
            },
            {
              "id": "chat_hard_sample_399",
              "variance": 0.32713617331688727,
              "mean_reward": -0.11368026992801125,
              "min_reward": -0.3135818126650026,
              "max_reward": 0.03624588712473231,
              "num_responses": 7,
              "rvariance": 0.0218739917456019
            },
            {
              "id": "chat_hard_sample_219",
              "variance": 0.16451356692814556,
              "mean_reward": -0.726891759134728,
              "min_reward": -0.9186891852742739,
              "max_reward": -0.6066806962726184,
              "num_responses": 7,
              "rvariance": 0.007935935287186677
            },
            {
              "id": "chat_hard_sample_406",
              "variance": 0.5861977672152315,
              "mean_reward": -0.3189845570632997,
              "min_reward": -0.8903247771832143,
              "max_reward": 0.007881479033672718,
              "num_responses": 7,
              "rvariance": 0.0768490432270004
            },
            {
              "id": "chat_hard_sample_253",
              "variance": 0.2974717298549874,
              "mean_reward": 1.2423716412215169,
              "min_reward": 1.1058204422251043,
              "max_reward": 1.4213744822381424,
              "num_responses": 7,
              "rvariance": 0.013383909420041352
            },
            {
              "id": "chat_hard_sample_24",
              "variance": 0.801220662926363,
              "mean_reward": 2.0343854789769535,
              "min_reward": 1.2087891528473365,
              "max_reward": 2.4330383708192675,
              "num_responses": 6,
              "rvariance": 0.16144584403356652
            },
            {
              "id": "chat_hard_sample_60",
              "variance": 0.7355836498281454,
              "mean_reward": 0.5515326341123149,
              "min_reward": -0.13394056142162525,
              "max_reward": 0.889541830530775,
              "num_responses": 7,
              "rvariance": 0.11156761988785487
            },
            {
              "id": "chat_hard_sample_386",
              "variance": 0.40655651597185416,
              "mean_reward": -1.1487560509017574,
              "min_reward": -1.3819745174282472,
              "max_reward": -0.8714151717891746,
              "num_responses": 6,
              "rvariance": 0.03083075385542644
            },
            {
              "id": "chat_hard_sample_216",
              "variance": 0.14654944180380786,
              "mean_reward": -0.44594905042328065,
              "min_reward": -0.5215874719994397,
              "max_reward": -0.3135818126650026,
              "num_responses": 6,
              "rvariance": 0.005214608818975158
            },
            {
              "id": "chat_hard_sample_300",
              "variance": 0.745983932794867,
              "mean_reward": 2.677174883317316,
              "min_reward": 1.8066576921417017,
              "max_reward": 3.0050539339889695,
              "num_responses": 7,
              "rvariance": 0.14892079023758487
            },
            {
              "id": "chat_hard_sample_352",
              "variance": 0.7699754946385553,
              "mean_reward": 0.5986096725412263,
              "min_reward": 0.1402487167919508,
              "max_reward": 1.07509233345979,
              "num_responses": 6,
              "rvariance": 0.10490136219101152
            },
            {
              "id": "chat_hard_sample_311",
              "variance": 1.057046941526821,
              "mean_reward": -1.284049775209113,
              "min_reward": -1.816895441491161,
              "max_reward": 0.17334052623152033,
              "num_responses": 7,
              "rvariance": 0.3848171507815613
            },
            {
              "id": "chat_hard_sample_419",
              "variance": 0.48975877970562903,
              "mean_reward": -0.2879187767730916,
              "min_reward": -0.6823191178487773,
              "max_reward": 0.13079391409493094,
              "num_responses": 7,
              "rvariance": 0.05508451265777347
            },
            {
              "id": "chat_hard_sample_287",
              "variance": 0.6694000309490064,
              "mean_reward": -0.22781324534203673,
              "min_reward": -0.6539547097577177,
              "max_reward": 0.1544309208374806,
              "num_responses": 7,
              "rvariance": 0.0731009101126268
            },
            {
              "id": "chat_hard_sample_55",
              "variance": 0.5393964938649832,
              "mean_reward": 0.5208045253470004,
              "min_reward": 0.1686131248830104,
              "max_reward": 0.7831753001893016,
              "num_responses": 7,
              "rvariance": 0.050320443000169544
            }
          ]
        },
        "semantic_benchmark_reasoning_filtered.json": {
          "file_name": "semantic_benchmark_reasoning_filtered.json",
          "processed_samples": 200,
          "global_mean": -2.070465087890625,
          "global_std": 4.69812399612886,
          "mean_variance": 0.5073342135994521,
          "mean_rvariance": 0.09658346734141227,
          "sample_results": [
            {
              "id": "reasoning_sample_9",
              "variance": 3.044433269914849,
              "mean_reward": 1.8850458993637005,
              "min_reward": -0.3940742972375552,
              "max_reward": 2.8618795712861904,
              "num_responses": 7,
              "rvariance": 1.8227843641507537
            },
            {
              "id": "reasoning_sample_5",
              "variance": 2.6059271232704604,
              "mean_reward": 0.9170374635579235,
              "min_reward": -1.3153196716819653,
              "max_reward": 2.017127495080847,
              "num_responses": 5,
              "rvariance": 1.5805186790231107
            },
            {
              "id": "reasoning_sample_85",
              "variance": 0.7662633006209101,
              "mean_reward": -0.6568121477108707,
              "min_reward": -1.2088942132623945,
              "max_reward": -0.28099724766676115,
              "num_responses": 4,
              "rvariance": 0.13431823600533516
            },
            {
              "id": "reasoning_sample_65",
              "variance": 2.4358126795779276,
              "mean_reward": 0.022125263367552224,
              "min_reward": -1.381835583194197,
              "max_reward": 1.3253620153536363,
              "num_responses": 7,
              "rvariance": 1.224659676729438
            },
            {
              "id": "reasoning_sample_256",
              "variance": 0.6342292162691301,
              "mean_reward": -0.742451383782869,
              "min_reward": -1.1423783017501628,
              "max_reward": -0.3076036122716539,
              "num_responses": 4,
              "rvariance": 0.09086750059316338
            },
            {
              "id": "reasoning_sample_263",
              "variance": 0.5653852478539702,
              "mean_reward": -0.7588032120296261,
              "min_reward": -1.2421521690185102,
              "max_reward": -0.49717396008151443,
              "num_responses": 6,
              "rvariance": 0.06908894063377224
            },
            {
              "id": "reasoning_sample_203",
              "variance": 0.7782361646931117,
              "mean_reward": -0.5248889232116111,
              "min_reward": -0.96943693181836,
              "max_reward": -0.09142689985690061,
              "num_responses": 6,
              "rvariance": 0.11633748771405854
            },
            {
              "id": "reasoning_sample_61",
              "variance": 1.1021686537576805,
              "mean_reward": 1.0887554158315547,
              "min_reward": -0.17457178924719033,
              "max_reward": 1.578122479100117,
              "num_responses": 7,
              "rvariance": 0.3262794210446061
            },
            {
              "id": "reasoning_sample_319",
              "variance": 0.7250234354833264,
              "mean_reward": -0.12108191040610394,
              "min_reward": -0.6102510096523085,
              "max_reward": 0.16299646167738593,
              "num_responses": 6,
              "rvariance": 0.1093900801549308
            },
            {
              "id": "reasoning_sample_528",
              "variance": 0.2767061918908842,
              "mean_reward": -0.8183507899548622,
              "min_reward": -1.0559076167842614,
              "max_reward": -0.5038255512327376,
              "num_responses": 7,
              "rvariance": 0.023293838073887758
            },
            {
              "id": "reasoning_sample_551",
              "variance": 0.6146070223730216,
              "mean_reward": -0.5142780516132311,
              "min_reward": -0.7698891972816647,
              "max_reward": -0.03156257949589201,
              "num_responses": 7,
              "rvariance": 0.07257044552579683
            },
            {
              "id": "reasoning_sample_596",
              "variance": 0.30331255649577704,
              "mean_reward": -1.212695122491665,
              "min_reward": -1.3685324008917508,
              "max_reward": -1.0093464787256992,
              "num_responses": 7,
              "rvariance": 0.017834711591419146
            },
            {
              "id": "reasoning_sample_456",
              "variance": 0.5886658168832514,
              "mean_reward": -0.3059407144838481,
              "min_reward": -0.5237803246864071,
              "max_reward": 0.3143201603677132,
              "num_responses": 4,
              "rvariance": 0.1282928018995249
            },
            {
              "id": "reasoning_sample_306",
              "variance": 0.8700281225799916,
              "mean_reward": -0.689119876159669,
              "min_reward": -1.0093464787256992,
              "max_reward": -0.07147212640323107,
              "num_responses": 7,
              "rvariance": 0.13491067222156236
            },
            {
              "id": "reasoning_sample_231",
              "variance": 0.33257955756115887,
              "mean_reward": -0.8839164741597763,
              "min_reward": -1.049256025633038,
              "max_reward": -0.6767669211645402,
              "num_responses": 7,
              "rvariance": 0.019877143629683118
            },
            {
              "id": "reasoning_sample_526",
              "variance": 0.8218040867336235,
              "mean_reward": -0.16060344782962163,
              "min_reward": -1.049256025633038,
              "max_reward": 0.23948975991645247,
              "num_responses": 5,
              "rvariance": 0.20735302330831923
            },
            {
              "id": "reasoning_sample_591",
              "variance": 0.5181589506802856,
              "mean_reward": -0.0688114899427418,
              "min_reward": -0.37744531935949727,
              "max_reward": 0.36420709400188706,
              "num_responses": 5,
              "rvariance": 0.06154913190973342
            },
            {
              "id": "reasoning_sample_23",
              "variance": 1.7117454103225895,
              "mean_reward": 0.09904418425468804,
              "min_reward": -1.049256025633038,
              "max_reward": 1.3852263357146448,
              "num_responses": 6,
              "rvariance": 0.6119788569840308
            },
            {
              "id": "reasoning_sample_275",
              "variance": 0.3824664911953328,
              "mean_reward": -0.7089162783954522,
              "min_reward": -1.075862390237931,
              "max_reward": -0.40405168396438995,
              "num_responses": 6,
              "rvariance": 0.03899956156844129
            },
            {
              "id": "reasoning_sample_656",
              "variance": 0.270054600739661,
              "mean_reward": -0.5104771423839608,
              "min_reward": -0.6368573742572011,
              "max_reward": -0.29097463439359594,
              "num_responses": 4,
              "rvariance": 0.018206268082907033
            },
            {
              "id": "reasoning_sample_405",
              "variance": 0.8139884671309363,
              "mean_reward": 0.6234805740839405,
              "min_reward": 0.1397158926481048,
              "max_reward": 1.0293662091242048,
              "num_responses": 6,
              "rvariance": 0.15310575907571342
            },
            {
              "id": "reasoning_sample_330",
              "variance": 0.5620594522783585,
              "mean_reward": -0.7765407884328878,
              "min_reward": -1.002694887574476,
              "max_reward": -0.0648205352520079,
              "num_responses": 6,
              "rvariance": 0.10584559419280992
            },
            {
              "id": "reasoning_sample_451",
              "variance": 0.5973128853798415,
              "mean_reward": -0.7480339692133601,
              "min_reward": -1.2887133070770727,
              "max_reward": -0.48387077777906806,
              "num_responses": 7,
              "rvariance": 0.07447743777372505
            },
            {
              "id": "reasoning_sample_314",
              "variance": 0.7330053448647942,
              "mean_reward": -0.7333054459499372,
              "min_reward": -1.1756362575062786,
              "max_reward": -0.330884181300935,
              "num_responses": 4,
              "rvariance": 0.11747799107445671
            },
            {
              "id": "reasoning_sample_593",
              "variance": 0.6573434955196307,
              "mean_reward": -0.08361128025421338,
              "min_reward": -0.4306580485692827,
              "max_reward": 0.6094845177032417,
              "num_responses": 5,
              "rvariance": 0.1288485023299534
            },
            {
              "id": "reasoning_sample_599",
              "variance": 0.37681263871679294,
              "mean_reward": 0.1738052972981236,
              "min_reward": -0.5902962361986389,
              "max_reward": 0.3517353605933436,
              "num_responses": 7,
              "rvariance": 0.09774709420171322
            },
            {
              "id": "reasoning_sample_301",
              "variance": 0.35785560393580695,
              "mean_reward": -0.5969478273498622,
              "min_reward": -0.9095726114573515,
              "max_reward": -0.443961230871729,
              "num_responses": 7,
              "rvariance": 0.02630601901095612
            },
            {
              "id": "reasoning_sample_77",
              "variance": 0.8593855767380343,
              "mean_reward": 2.31644909688589,
              "min_reward": 1.4118327003195374,
              "max_reward": 2.662331836749495,
              "num_responses": 7,
              "rvariance": 0.17368798712663966
            },
            {
              "id": "reasoning_sample_511",
              "variance": 0.1270453909883627,
              "mean_reward": 0.21620919088717133,
              "min_reward": 0.13639009707249322,
              "max_reward": 0.291871040232335,
              "num_responses": 7,
              "rvariance": 0.002901120308992999
            },
            {
              "id": "reasoning_sample_12",
              "variance": 0.3392311487123818,
              "mean_reward": 2.9882598031594303,
              "min_reward": 2.675635019051941,
              "max_reward": 3.1545495819400102,
              "num_responses": 6,
              "rvariance": 0.025705569273800733
            },
            {
              "id": "reasoning_sample_543",
              "variance": 0.3718239453533757,
              "mean_reward": -0.3726941828229093,
              "min_reward": -0.6568121477108707,
              "max_reward": -0.05151735294956154,
              "num_responses": 7,
              "rvariance": 0.02970600921435268
            },
            {
              "id": "reasoning_sample_506",
              "variance": 0.27121862919112505,
              "mean_reward": 0.2897033341875167,
              "min_reward": 0.005021171835835465,
              "max_reward": 0.4018301564509931,
              "num_responses": 7,
              "rvariance": 0.017657294283773918
            },
            {
              "id": "reasoning_sample_531",
              "variance": 0.5976454649374027,
              "mean_reward": -0.46332211225832504,
              "min_reward": -0.8164503353402269,
              "max_reward": 0.23865831102254959,
              "num_responses": 7,
              "rvariance": 0.10080972646068169
            },
            {
              "id": "reasoning_sample_274",
              "variance": 0.3206066934889572,
              "mean_reward": -0.5397441434493427,
              "min_reward": -0.7765407884328879,
              "max_reward": -0.3840969105107204,
              "num_responses": 5,
              "rvariance": 0.021743106650458897
            },
            {
              "id": "reasoning_sample_597",
              "variance": 1.0615939477352194,
              "mean_reward": 0.8497732480411789,
              "min_reward": -0.7698891972816647,
              "max_reward": 1.7444122578806964,
              "num_responses": 7,
              "rvariance": 0.5051077996804575
            },
            {
              "id": "reasoning_sample_73",
              "variance": 1.3749670358472208,
              "mean_reward": 0.7411503889734361,
              "min_reward": -0.670115330013317,
              "max_reward": 1.4583938383780997,
              "num_responses": 7,
              "rvariance": 0.4749204219321085
            },
            {
              "id": "reasoning_sample_412",
              "variance": 1.0293337306517867,
              "mean_reward": 0.008901266674048983,
              "min_reward": -0.9494821583646905,
              "max_reward": 0.6269449444752025,
              "num_responses": 6,
              "rvariance": 0.25064189757413025
            },
            {
              "id": "reasoning_sample_491",
              "variance": 0.6199282952940002,
              "mean_reward": -0.4249566847253771,
              "min_reward": -1.0692107990867077,
              "max_reward": -0.07812371755445426,
              "num_responses": 7,
              "rvariance": 0.09266745308179174
            },
            {
              "id": "reasoning_sample_64",
              "variance": 0.6531862510501161,
              "mean_reward": 2.070340224290632,
              "min_reward": 1.4716970206805462,
              "max_reward": 2.436177737607907,
              "num_responses": 7,
              "rvariance": 0.08987784486684193
            },
            {
              "id": "reasoning_sample_535",
              "variance": 0.2893442150782082,
              "mean_reward": -0.29984342259522684,
              "min_reward": -0.5237803246864071,
              "max_reward": -0.17457178924719033,
              "num_responses": 6,
              "rvariance": 0.0166012062416571
            },
            {
              "id": "reasoning_sample_548",
              "variance": 0.5135028368744293,
              "mean_reward": -0.4601150950961281,
              "min_reward": -0.9095726114573515,
              "max_reward": -0.10473008215934697,
              "num_responses": 7,
              "rvariance": 0.05474656911760456
            },
            {
              "id": "reasoning_sample_235",
              "variance": 0.3631768768567855,
              "mean_reward": -0.6395180107176904,
              "min_reward": -0.8696630645500124,
              "max_reward": -0.46391600432539853,
              "num_responses": 5,
              "rvariance": 0.02715853122724583
            },
            {
              "id": "reasoning_sample_156",
              "variance": 1.3635761860007514,
              "mean_reward": -0.1806690811358115,
              "min_reward": -0.9561337495159137,
              "max_reward": 0.6069901710215331,
              "num_responses": 6,
              "rvariance": 0.3476166369659126
            },
            {
              "id": "reasoning_sample_587",
              "variance": 0.7486365840701689,
              "mean_reward": -0.023010533730033634,
              "min_reward": -0.8297535176426734,
              "max_reward": 0.7699541542265009,
              "num_responses": 7,
              "rvariance": 0.18595014141118393
            },
            {
              "id": "reasoning_sample_594",
              "variance": 0.9350474260831981,
              "mean_reward": 0.01090070329986309,
              "min_reward": -1.195591030959948,
              "max_reward": 0.5184408638208745,
              "num_responses": 7,
              "rvariance": 0.27652964198767854
            },
            {
              "id": "reasoning_sample_622",
              "variance": 0.3852934174346027,
              "mean_reward": 0.18532680339934945,
              "min_reward": 0.011672762987058643,
              "max_reward": 0.6444053712471635,
              "num_responses": 7,
              "rvariance": 0.04185459159137579
            },
            {
              "id": "reasoning_sample_647",
              "variance": 0.4842358358090473,
              "mean_reward": -0.3974000928131668,
              "min_reward": -0.8696630645500124,
              "max_reward": -0.1512912202179092,
              "num_responses": 5,
              "rvariance": 0.062489752224296244
            },
            {
              "id": "reasoning_sample_395",
              "variance": 0.3907809801343617,
              "mean_reward": -0.2832144447171689,
              "min_reward": -0.6235541919547548,
              "max_reward": -0.07812371755445426,
              "num_responses": 6,
              "rvariance": 0.03301560589842141
            },
            {
              "id": "reasoning_sample_252",
              "variance": 0.31761347747090674,
              "mean_reward": -0.36635933410745863,
              "min_reward": -0.8231019264914501,
              "max_reward": -0.2510650874862569,
              "num_responses": 6,
              "rvariance": 0.04228834065510653
            },
            {
              "id": "reasoning_sample_497",
              "variance": 0.7411535440250425,
              "mean_reward": 0.14872820476594514,
              "min_reward": -0.3541647503302161,
              "max_reward": 0.5446315039788158,
              "num_responses": 7,
              "rvariance": 0.10705812258983068
            },
            {
              "id": "reasoning_sample_87",
              "variance": 0.49138629629661223,
              "mean_reward": 1.1037808851285142,
              "min_reward": 0.4893401525342731,
              "max_reward": 1.3386651976560826,
              "num_responses": 7,
              "rvariance": 0.07265782535303068
            },
            {
              "id": "reasoning_sample_299",
              "variance": 0.353864649245073,
              "mean_reward": -0.24821440556430407,
              "min_reward": -0.7499344238279951,
              "max_reward": -0.0648205352520079,
              "num_responses": 7,
              "rvariance": 0.04539219426507811
            },
            {
              "id": "reasoning_sample_303",
              "variance": 0.5860051804227621,
              "mean_reward": -0.4532734584834415,
              "min_reward": -0.7565860149792184,
              "max_reward": -0.14131383349107443,
              "num_responses": 5,
              "rvariance": 0.06955723524632193
            },
            {
              "id": "reasoning_sample_509",
              "variance": 0.5534123837817685,
              "mean_reward": -0.7689389699743472,
              "min_reward": -1.0891655725403773,
              "max_reward": -0.5038255512327376,
              "num_responses": 7,
              "rvariance": 0.047851780857576395
            },
            {
              "id": "reasoning_sample_572",
              "variance": 0.3508714332270227,
              "mean_reward": 0.13062934402188028,
              "min_reward": -0.07147212640323107,
              "max_reward": 0.3679486140244501,
              "num_responses": 7,
              "rvariance": 0.02088095704658811
            },
            {
              "id": "reasoning_sample_557",
              "variance": 0.4423308115563416,
              "mean_reward": 1.0889929726583838,
              "min_reward": 0.8447845546777616,
              "max_reward": 1.7909733959392586,
              "num_responses": 7,
              "rvariance": 0.08599264161456732
            },
            {
              "id": "reasoning_sample_678",
              "variance": 0.5334576103280989,
              "mean_reward": -0.17255255621914042,
              "min_reward": -0.48387077777906806,
              "max_reward": 0.2336696176591322,
              "num_responses": 7,
              "rvariance": 0.05518169766068134
            },
            {
              "id": "reasoning_sample_53",
              "variance": 0.5640549296237252,
              "mean_reward": 2.5435534233347954,
              "min_reward": 1.8441861251490441,
              "max_reward": 2.8352732066812973,
              "num_responses": 7,
              "rvariance": 0.09418121847177825
            },
            {
              "id": "reasoning_sample_75",
              "variance": 1.535686107038651,
              "mean_reward": 0.5327140698328742,
              "min_reward": -0.22113292730575257,
              "max_reward": 1.6379867994611255,
              "num_responses": 6,
              "rvariance": 0.4731930621926789
            },
            {
              "id": "reasoning_sample_595",
              "variance": 0.18574568289790722,
              "mean_reward": 0.10363101065271907,
              "min_reward": 0.02996463865292238,
              "max_reward": 0.3218032004128393,
              "num_responses": 5,
              "rvariance": 0.012073985526500906
            },
            {
              "id": "reasoning_sample_245",
              "variance": 0.2274844173718329,
              "mean_reward": -0.988061387041785,
              "min_reward": -1.1756362575062786,
              "max_reward": -0.8896178380036819,
              "num_responses": 5,
              "rvariance": 0.011457339447751184
            },
            {
              "id": "reasoning_sample_418",
              "variance": 0.6664894333525626,
              "mean_reward": -0.9285771576037034,
              "min_reward": -1.2155458044136176,
              "max_reward": -0.09807849100812378,
              "num_responses": 7,
              "rvariance": 0.1317883335883542
            },
            {
              "id": "reasoning_sample_60",
              "variance": 1.6364992854243774,
              "mean_reward": -0.37848463047687586,
              "min_reward": -1.2887133070770727,
              "max_reward": 0.4976546414733021,
              "num_responses": 6,
              "rvariance": 0.4781545216122732
            },
            {
              "id": "reasoning_sample_385",
              "variance": 0.4503127209378091,
              "mean_reward": -0.3194814536131238,
              "min_reward": -0.6967216946182098,
              "max_reward": -0.004956214890999301,
              "num_responses": 7,
              "rvariance": 0.04203735065846016
            },
            {
              "id": "reasoning_sample_243",
              "variance": 0.2228283035659765,
              "mean_reward": -0.888509239478478,
              "min_reward": -1.0226496610281455,
              "max_reward": -0.7299796503743257,
              "num_responses": 6,
              "rvariance": 0.0092678187939248
            },
            {
              "id": "reasoning_sample_71",
              "variance": 0.4376746977504853,
              "mean_reward": 2.0798424973638077,
              "min_reward": 1.7843218047880354,
              "max_reward": 2.289842732280997,
              "num_responses": 7,
              "rvariance": 0.030804425913976082
            },
            {
              "id": "reasoning_sample_218",
              "variance": 0.5520820655515237,
              "mean_reward": -0.5119024833449372,
              "min_reward": -1.1490298929013858,
              "max_reward": -0.2976262255448191,
              "num_responses": 7,
              "rvariance": 0.08162911016942345
            },
            {
              "id": "reasoning_sample_32",
              "variance": 0.5733671572354382,
              "mean_reward": 2.1268787490760293,
              "min_reward": 1.5581677056464474,
              "max_reward": 2.3430554614907826,
              "num_responses": 4,
              "rvariance": 0.10887259826248731
            },
            {
              "id": "reasoning_sample_55",
              "variance": 0.5350633460044488,
              "mean_reward": 0.6164664613167746,
              "min_reward": 0.21953498646278294,
              "max_reward": 1.0094114356705353,
              "num_responses": 7,
              "rvariance": 0.055622305161015476
            },
            {
              "id": "reasoning_sample_403",
              "variance": 0.34455242163336064,
              "mean_reward": -0.5722419173596045,
              "min_reward": -0.7565860149792184,
              "max_reward": -0.32423259014971184,
              "num_responses": 7,
              "rvariance": 0.02591053482317556
            },
            {
              "id": "reasoning_sample_580",
              "variance": 0.3680824253308127,
              "mean_reward": -0.025534575015096,
              "min_reward": -0.21448133615452938,
              "max_reward": 0.28854524465672343,
              "num_responses": 4,
              "rvariance": 0.03589798752849411
            },
            {
              "id": "reasoning_sample_530",
              "variance": 0.5093455924049148,
              "mean_reward": -0.07729226866055136,
              "min_reward": -0.37411952378388563,
              "max_reward": 0.2619388800518307,
              "num_responses": 5,
              "rvariance": 0.0511628209786699
            },
            {
              "id": "reasoning_sample_318",
              "variance": 0.3126247841074894,
              "mean_reward": -0.19333877856671286,
              "min_reward": -0.443961230871729,
              "max_reward": 0.0831773678627078,
              "num_responses": 7,
              "rvariance": 0.022997789265512072
            },
            {
              "id": "reasoning_sample_76",
              "variance": 0.7476388453974852,
              "mean_reward": 2.608168880232392,
              "min_reward": 1.8175797605441513,
              "max_reward": 3.1678527642424563,
              "num_responses": 7,
              "rvariance": 0.14676797439949452
            },
            {
              "id": "reasoning_sample_393",
              "variance": 0.3625117177416632,
              "mean_reward": -0.5636898715937463,
              "min_reward": -0.856359882247566,
              "max_reward": -0.34418736360338137,
              "num_responses": 6,
              "rvariance": 0.028404432829225557
            },
            {
              "id": "reasoning_sample_642",
              "variance": 0.23280569029281128,
              "mean_reward": -0.468350398426214,
              "min_reward": -0.5969478273498621,
              "max_reward": -0.2943004299692075,
              "num_responses": 6,
              "rvariance": 0.010838468895852382
            },
            {
              "id": "reasoning_sample_16",
              "variance": 0.71172025318088,
              "mean_reward": 2.274322352928143,
              "min_reward": 1.8308829428465978,
              "max_reward": 2.5692095606323706,
              "num_responses": 6,
              "rvariance": 0.09377690561618328
            },
            {
              "id": "reasoning_sample_260",
              "variance": 0.3591859221660517,
              "mean_reward": -0.7404321507548193,
              "min_reward": -0.9029210203061283,
              "max_reward": -0.3641421370570509,
              "num_responses": 7,
              "rvariance": 0.030159732511977625
            },
            {
              "id": "reasoning_sample_582",
              "variance": 0.7878809718623853,
              "mean_reward": 0.33934677207419045,
              "min_reward": -0.08477530870567743,
              "max_reward": 0.7799315409533356,
              "num_responses": 5,
              "rvariance": 0.1281923134757502
            },
            {
              "id": "reasoning_sample_295",
              "variance": 0.44316226045024426,
              "mean_reward": -0.08810110428128903,
              "min_reward": -0.37744531935949727,
              "max_reward": 0.1663222572529975,
              "num_responses": 6,
              "rvariance": 0.03668998081410059
            },
            {
              "id": "reasoning_sample_366",
              "variance": 0.32193701171920186,
              "mean_reward": -1.1547312567452914,
              "min_reward": -1.341926036286858,
              "max_reward": -0.896269429154905,
              "num_responses": 7,
              "rvariance": 0.022177814201520707
            },
            {
              "id": "reasoning_sample_286",
              "variance": 0.22881473560207732,
              "mean_reward": -0.15509212944717962,
              "min_reward": -0.32423259014971184,
              "max_reward": -0.0016304193153877124,
              "num_responses": 7,
              "rvariance": 0.010901097258161368
            },
            {
              "id": "reasoning_sample_356",
              "variance": 0.7117202531808801,
              "mean_reward": -0.41070327511561316,
              "min_reward": -0.8497082910963428,
              "max_reward": -0.08477530870567743,
              "num_responses": 6,
              "rvariance": 0.08965241286026075
            },
            {
              "id": "reasoning_sample_343",
              "variance": 0.399760628188513,
              "mean_reward": -0.5683459853996025,
              "min_reward": -0.9095726114573515,
              "max_reward": -0.38077111493510885,
              "num_responses": 5,
              "rvariance": 0.03626918669172267
            },
            {
              "id": "reasoning_sample_205",
              "variance": 0.22137326800164636,
              "mean_reward": 0.3132214600436272,
              "min_reward": 0.13306430149688164,
              "max_reward": 0.4118075431778279,
              "num_responses": 7,
              "rvariance": 0.009963264887032733
            },
            {
              "id": "reasoning_sample_512",
              "variance": 0.29988023153063403,
              "mean_reward": 0.5322723626079883,
              "min_reward": 0.4064031253674591,
              "max_reward": 0.9561987064607499,
              "num_responses": 6,
              "rvariance": 0.03663620301994292
            },
            {
              "id": "reasoning_sample_226",
              "variance": 0.3502062741119003,
              "mean_reward": -0.08572553601299503,
              "min_reward": -0.5104771423839608,
              "max_reward": 0.053245207682203505,
              "num_responses": 7,
              "rvariance": 0.03441197759606226
            },
            {
              "id": "reasoning_sample_225",
              "variance": 0.2061993256879185,
              "mean_reward": -0.24219629928462597,
              "min_reward": -0.43730963972050585,
              "max_reward": -0.13133644676423967,
              "num_responses": 6,
              "rvariance": 0.009662324805441824
            },
            {
              "id": "reasoning_sample_508",
              "variance": 0.35519496747531776,
              "mean_reward": -0.7047036039996776,
              "min_reward": -0.8630114733987893,
              "max_reward": -0.3641421370570509,
              "num_responses": 5,
              "rvariance": 0.03255271884490811
            },
            {
              "id": "reasoning_sample_585",
              "variance": 0.8347746894785089,
              "mean_reward": -0.7146809907265123,
              "min_reward": -1.3286228539844116,
              "max_reward": -0.11470746888618173,
              "num_responses": 5,
              "rvariance": 0.1545236540841745
            },
            {
              "id": "reasoning_sample_574",
              "variance": 0.3578556039358072,
              "mean_reward": -0.3544023071570455,
              "min_reward": -0.5370835069888535,
              "max_reward": 0.10313214131637734,
              "num_responses": 7,
              "rvariance": 0.03944988633058651
            },
            {
              "id": "reasoning_sample_520",
              "variance": 0.4177199242968158,
              "mean_reward": -0.9874912506573944,
              "min_reward": -1.2022426221111713,
              "max_reward": -0.4173548662668363,
              "num_responses": 7,
              "rvariance": 0.0596494895277608
            },
            {
              "id": "reasoning_sample_238",
              "variance": 0.43634437952024036,
              "mean_reward": -0.40671232042487926,
              "min_reward": -0.7499344238279951,
              "max_reward": -0.2111555405789178,
              "num_responses": 5,
              "rvariance": 0.0410554663544417
            },
            {
              "id": "reasoning_sample_630",
              "variance": 0.3418917851728713,
              "mean_reward": -0.36879825086290713,
              "min_reward": -0.5636898715937462,
              "max_reward": -0.20450394942769462,
              "num_responses": 5,
              "rvariance": 0.025703799527206982
            },
            {
              "id": "reasoning_sample_233",
              "variance": 0.43501406128999603,
              "mean_reward": -0.6800927167401518,
              "min_reward": -0.96943693181836,
              "max_reward": -0.10140428658373538,
              "num_responses": 7,
              "rvariance": 0.06427024370805076
            },
            {
              "id": "reasoning_sample_394",
              "variance": 0.3239324890645687,
              "mean_reward": -0.4425358899107526,
              "min_reward": -0.6634637388620939,
              "max_reward": -0.28764883881798436,
              "num_responses": 7,
              "rvariance": 0.020911000695913114
            },
            {
              "id": "reasoning_sample_284",
              "variance": 0.24211791790452367,
              "mean_reward": -0.09760337735446499,
              "min_reward": -0.23443610960819894,
              "max_reward": 0.011672762987058643,
              "num_responses": 7,
              "rvariance": 0.011902900240678556
            },
            {
              "id": "reasoning_sample_207",
              "variance": 0.3073035111865108,
              "mean_reward": -0.7831923795841111,
              "min_reward": -1.042604434481815,
              "max_reward": -0.6435089654084244,
              "num_responses": 7,
              "rvariance": 0.017975568973368383
            },
            {
              "id": "reasoning_sample_345",
              "variance": 0.2128509168391417,
              "mean_reward": -0.8341879117434888,
              "min_reward": -1.0293012521793687,
              "max_reward": -0.7233280592231025,
              "num_responses": 6,
              "rvariance": 0.009905664962078495
            },
            {
              "id": "reasoning_sample_565",
              "variance": 0.20946276259648744,
              "mean_reward": 0.5864934710566588,
              "min_reward": 0.453951608987531,
              "max_reward": 0.8697280214948485,
              "num_responses": 7,
              "rvariance": 0.015031516521395309
            },
            {
              "id": "reasoning_sample_78",
              "variance": 0.8726887590404813,
              "mean_reward": 2.805816160154452,
              "min_reward": 1.9639147658710612,
              "max_reward": 3.2077623111497955,
              "num_responses": 7,
              "rvariance": 0.16933766106105352
            },
            {
              "id": "reasoning_sample_601",
              "variance": 0.22282830356597644,
              "mean_reward": -0.5553753826547172,
              "min_reward": -0.743282832676772,
              "max_reward": -0.4306580485692827,
              "num_responses": 4,
              "rvariance": 0.013237151475224175
            },
            {
              "id": "reasoning_sample_539",
              "variance": 0.39576967349777914,
              "mean_reward": -0.986065909696418,
              "min_reward": -1.381835583194197,
              "max_reward": -0.7632376061304416,
              "num_responses": 6,
              "rvariance": 0.03828183100543213
            },
            {
              "id": "reasoning_sample_603",
              "variance": 0.32966948643249877,
              "mean_reward": -0.1578042365534819,
              "min_reward": -0.26769406536431484,
              "max_reward": 0.3184774048372277,
              "num_responses": 6,
              "rvariance": 0.046082638177966595
            },
            {
              "id": "reasoning_sample_339",
              "variance": 0.5753626345808049,
              "mean_reward": -0.8752060571760317,
              "min_reward": -1.302016489379519,
              "max_reward": -0.2510650874862569,
              "num_responses": 6,
              "rvariance": 0.09779939214482879
            },
            {
              "id": "reasoning_sample_447",
              "variance": 0.9328856589590506,
              "mean_reward": 0.36753288957749863,
              "min_reward": -0.40405168396438995,
              "max_reward": 0.648562615716678,
              "num_responses": 7,
              "rvariance": 0.1838087254594829
            },
            {
              "id": "reasoning_sample_44",
              "variance": 0.6997473891086785,
              "mean_reward": 2.496992285276233,
              "min_reward": 1.6113804348562328,
              "max_reward": 2.8618795712861904,
              "num_responses": 7,
              "rvariance": 0.14860092622870583
            },
            {
              "id": "reasoning_sample_266",
              "variance": 0.48556615403929193,
              "mean_reward": -1.308668080530742,
              "min_reward": -1.607989682335785,
              "max_reward": -1.002694887574476,
              "num_responses": 7,
              "rvariance": 0.04849105666796142
            },
            {
              "id": "reasoning_sample_529",
              "variance": 0.5288014965222428,
              "mean_reward": 0.25017981712377546,
              "min_reward": -0.028236783920280423,
              "max_reward": 0.979479275490031,
              "num_responses": 7,
              "rvariance": 0.09765434616195619
            },
            {
              "id": "reasoning_sample_466",
              "variance": 0.3512040127845839,
              "mean_reward": -1.0996180729208709,
              "min_reward": -1.4882610416137678,
              "max_reward": -0.8896178380036819,
              "num_responses": 7,
              "rvariance": 0.03195476119989486
            },
            {
              "id": "reasoning_sample_349",
              "variance": 0.15963818762935644,
              "mean_reward": -1.0725365946623193,
              "min_reward": -1.155681484052609,
              "max_reward": -0.9561337495159137,
              "num_responses": 6,
              "rvariance": 0.0047598809426960325
            },
            {
              "id": "reasoning_sample_206",
              "variance": 0.29599580622943145,
              "mean_reward": -0.7116877747084619,
              "min_reward": -0.8497082910963428,
              "max_reward": -0.5237803246864071,
              "num_responses": 4,
              "rvariance": 0.02029401601768754
            },
            {
              "id": "reasoning_sample_516",
              "variance": 0.2414527587894013,
              "mean_reward": -0.4924228235449264,
              "min_reward": -0.6767669211645402,
              "max_reward": -0.34751315917899295,
              "num_responses": 7,
              "rvariance": 0.011054144221240824
            },
            {
              "id": "reasoning_sample_542",
              "variance": 0.2195025079903649,
              "mean_reward": -0.14178894714473325,
              "min_reward": -0.22445872288136415,
              "max_reward": 0.06488549219684406,
              "num_responses": 7,
              "rvariance": 0.010373333541819501
            },
            {
              "id": "reasoning_sample_151",
              "variance": 0.443661129786586,
              "mean_reward": -0.9178871003963804,
              "min_reward": -1.1423783017501628,
              "max_reward": -0.6767669211645402,
              "num_responses": 4,
              "rvariance": 0.04641990010749705
            },
            {
              "id": "reasoning_sample_223",
              "variance": 0.5198218484680913,
              "mean_reward": -0.17077088001791993,
              "min_reward": -0.5104771423839608,
              "max_reward": 0.03329043422853397,
              "num_responses": 7,
              "rvariance": 0.045723231685957225
            },
            {
              "id": "reasoning_sample_452",
              "variance": 1.3899539021598208,
              "mean_reward": 0.2697856789880393,
              "min_reward": -0.517128733535184,
              "max_reward": 1.2156107613584537,
              "num_responses": 4,
              "rvariance": 0.4251417474550356
            },
            {
              "id": "reasoning_sample_68",
              "variance": 0.7359985608828445,
              "mean_reward": 1.0176071461961496,
              "min_reward": 0.24198410659816116,
              "max_reward": 1.4184842914707607,
              "num_responses": 7,
              "rvariance": 0.12895614648931755
            },
            {
              "id": "reasoning_sample_552",
              "variance": 0.5697087821022653,
              "mean_reward": 0.037566457111463156,
              "min_reward": -0.5304319158376303,
              "max_reward": 0.6369223312020373,
              "num_responses": 7,
              "rvariance": 0.10200760675633294
            },
            {
              "id": "reasoning_sample_209",
              "variance": 0.4962086998812491,
              "mean_reward": -0.6202283963791432,
              "min_reward": -1.042604434481815,
              "max_reward": -0.4107032751156131,
              "num_responses": 4,
              "rvariance": 0.06527046655968073
            },
            {
              "id": "reasoning_sample_391",
              "variance": 0.3033125564957769,
              "mean_reward": -0.6007487365791325,
              "min_reward": -0.8297535176426734,
              "max_reward": -0.4506128220229522,
              "num_responses": 7,
              "rvariance": 0.01688663305906849
            },
            {
              "id": "reasoning_sample_210",
              "variance": 0.4070773784548585,
              "mean_reward": -0.6957714673108921,
              "min_reward": -1.0958171636916003,
              "max_reward": -0.3974000928131668,
              "num_responses": 7,
              "rvariance": 0.040292434692967165
            },
            {
              "id": "reasoning_sample_465",
              "variance": 0.5111747799715012,
              "mean_reward": 0.5434437198446688,
              "min_reward": -0.054843148525173135,
              "max_reward": 0.7566509719240545,
              "num_responses": 7,
              "rvariance": 0.07088582848362628
            },
            {
              "id": "reasoning_sample_396",
              "variance": 0.2075296439181631,
              "mean_reward": -1.0264505702574158,
              "min_reward": -1.1490298929013858,
              "max_reward": -0.8696630645500124,
              "num_responses": 7,
              "rvariance": 0.007772438101404209
            },
            {
              "id": "reasoning_sample_348",
              "variance": 0.22748441737183256,
              "mean_reward": -0.7157262407645616,
              "min_reward": -0.9162242026085746,
              "max_reward": -0.5769930538961926,
              "num_responses": 7,
              "rvariance": 0.011496129403703346
            },
            {
              "id": "reasoning_sample_83",
              "variance": 0.7549140232191356,
              "mean_reward": 0.17027163949903626,
              "min_reward": -0.22445872288136415,
              "max_reward": 0.8630764303436254,
              "num_responses": 7,
              "rvariance": 0.1211974833905476
            },
            {
              "id": "reasoning_sample_242",
              "variance": 0.16096850585960087,
              "mean_reward": -0.3437122499497226,
              "min_reward": -0.4572644131741754,
              "max_reward": -0.2843230432423728,
              "num_responses": 7,
              "rvariance": 0.004571092923833506
            },
            {
              "id": "reasoning_sample_269",
              "variance": 0.31678202857700377,
              "mean_reward": 0.5872016873466441,
              "min_reward": 0.2636017778396365,
              "max_reward": 0.7017753449264633,
              "num_responses": 5,
              "rvariance": 0.02890062553044015
            },
            {
              "id": "reasoning_sample_694",
              "variance": 0.4173873447392544,
              "mean_reward": -0.5365292077262516,
              "min_reward": -0.8896178380036819,
              "max_reward": -0.26769406536431484,
              "num_responses": 6,
              "rvariance": 0.03825755843930295
            },
            {
              "id": "reasoning_sample_18",
              "variance": 0.45230819828317603,
              "mean_reward": 2.5758611517835934,
              "min_reward": 2.1967204561638725,
              "max_reward": 2.9816082120082075,
              "num_responses": 6,
              "rvariance": 0.053372607688975754
            },
            {
              "id": "reasoning_sample_230",
              "variance": 0.32060669348895715,
              "mean_reward": -0.5091468241537161,
              "min_reward": -0.670115330013317,
              "max_reward": -0.2776714520911496,
              "num_responses": 5,
              "rvariance": 0.021916541816643577
            },
            {
              "id": "reasoning_sample_237",
              "variance": 0.2055341665727962,
              "mean_reward": -0.33021902218581267,
              "min_reward": -0.443961230871729,
              "max_reward": -0.23443610960819894,
              "num_responses": 5,
              "rvariance": 0.00863813312395327
            },
            {
              "id": "reasoning_sample_312",
              "variance": 0.33091665977335305,
              "mean_reward": -0.41901776405464214,
              "min_reward": -0.8829662468524587,
              "max_reward": -0.2410877007594221,
              "num_responses": 6,
              "rvariance": 0.0446003793908274
            },
            {
              "id": "reasoning_sample_47",
              "variance": 0.31994153437383477,
              "mean_reward": 1.2980429802682552,
              "min_reward": 0.7483364829850255,
              "max_reward": 1.4384390649244303,
              "num_responses": 7,
              "rvariance": 0.051382583325138946
            },
            {
              "id": "reasoning_sample_2",
              "variance": 0.32008963620806125,
              "mean_reward": 0.5817738850361343,
              "min_reward": 0.33011768935186825,
              "max_reward": 0.8032121099826167,
              "num_responses": 7,
              "rvariance": 0.02050728030596948
            },
            {
              "id": "reasoning_sample_58",
              "variance": 0.35619270614800125,
              "mean_reward": -0.004956214890999302,
              "min_reward": -0.25771667863748005,
              "max_reward": 0.32596044488235376,
              "num_responses": 7,
              "rvariance": 0.028340437528291896
            },
            {
              "id": "reasoning_sample_308",
              "variance": 0.39111355969192285,
              "mean_reward": -0.7223778319157849,
              "min_reward": -1.042604434481815,
              "max_reward": -0.5437350981400767,
              "num_responses": 7,
              "rvariance": 0.029661314083541866
            },
            {
              "id": "reasoning_sample_59",
              "variance": 0.4004257873036354,
              "mean_reward": 1.7026022563587218,
              "min_reward": 1.318710424202413,
              "max_reward": 1.910702036661276,
              "num_responses": 7,
              "rvariance": 0.03463285732080157
            },
            {
              "id": "reasoning_sample_219",
              "variance": 0.34189178517287133,
              "mean_reward": -0.012676811762954777,
              "min_reward": -0.22778451845697575,
              "max_reward": 0.24530990217377274,
              "num_responses": 7,
              "rvariance": 0.023638899156391214
            },
            {
              "id": "reasoning_sample_216",
              "variance": 0.2926700106538198,
              "mean_reward": -1.0791881858135426,
              "min_reward": -1.341926036286858,
              "max_reward": -0.9295273849110209,
              "num_responses": 4,
              "rvariance": 0.024477807574406603
            },
            {
              "id": "reasoning_sample_201",
              "variance": 0.2594120548977039,
              "mean_reward": -0.6328664195664673,
              "min_reward": -0.8231019264914501,
              "max_reward": -0.48387077777906806,
              "num_responses": 5,
              "rvariance": 0.01377924697871341
            },
            {
              "id": "reasoning_sample_550",
              "variance": 0.5154983142197965,
              "mean_reward": 1.0602485966120268,
              "min_reward": 0.8697280214948485,
              "max_reward": 2.0237790862320697,
              "num_responses": 7,
              "rvariance": 0.155499777682444
            },
            {
              "id": "reasoning_sample_34",
              "variance": 0.7389917769008951,
              "mean_reward": 1.5738464562171879,
              "min_reward": 1.1058595073632713,
              "max_reward": 1.9705663570222844,
              "num_responses": 7,
              "rvariance": 0.0899496279557199
            },
            {
              "id": "reasoning_sample_618",
              "variance": 0.3059731929562661,
              "mean_reward": -0.038491320278416154,
              "min_reward": -0.34418736360338137,
              "max_reward": 0.13306430149688164,
              "num_responses": 6,
              "rvariance": 0.022936115565614135
            },
            {
              "id": "reasoning_sample_257",
              "variance": 0.15055460846346708,
              "mean_reward": 0.39176962483476807,
              "min_reward": 0.2893766935506263,
              "max_reward": 0.4601355101359338,
              "num_responses": 5,
              "rvariance": 0.004589620893162161
            },
            {
              "id": "reasoning_sample_527",
              "variance": 0.2700701904064218,
              "mean_reward": 0.503114736664959,
              "min_reward": 0.2062318041603366,
              "max_reward": 0.736696198470385,
              "num_responses": 7,
              "rvariance": 0.021563854957006863
            },
            {
              "id": "reasoning_sample_66",
              "variance": 0.4063498606726934,
              "mean_reward": 0.2688725699349138,
              "min_reward": -0.1546170157935208,
              "max_reward": 0.49599174368549626,
              "num_responses": 7,
              "rvariance": 0.04038942536652111
            },
            {
              "id": "reasoning_sample_292",
              "variance": 0.23546632675330048,
              "mean_reward": -0.6663144207840467,
              "min_reward": -0.9494821583646905,
              "max_reward": -0.5304319158376303,
              "num_responses": 7,
              "rvariance": 0.016014400809305895
            },
            {
              "id": "reasoning_sample_390",
              "variance": 0.5439754388359704,
              "mean_reward": 0.33434422122920804,
              "min_reward": -0.5237803246864071,
              "max_reward": 0.5396428106153983,
              "num_responses": 6,
              "rvariance": 0.14756192129434526
            },
            {
              "id": "reasoning_sample_414",
              "variance": 0.339231148712382,
              "mean_reward": -0.5481694922408921,
              "min_reward": -0.9029210203061283,
              "max_reward": -0.4306580485692827,
              "num_responses": 6,
              "rvariance": 0.03050846489064969
            },
            {
              "id": "reasoning_sample_384",
              "variance": 0.5255172733913261,
              "mean_reward": 0.21390785912726157,
              "min_reward": -0.40737747954000153,
              "max_reward": 0.45618612788989504,
              "num_responses": 7,
              "rvariance": 0.07746855985146595
            },
            {
              "id": "reasoning_sample_586",
              "variance": 0.392028153475216,
              "mean_reward": 0.38097464669559544,
              "min_reward": 0.2295123731896177,
              "max_reward": 0.962850297611973,
              "num_responses": 6,
              "rvariance": 0.06829387967218546
            },
            {
              "id": "reasoning_sample_652",
              "variance": 0.21950250799036486,
              "mean_reward": -0.884866701467094,
              "min_reward": -1.0359528433305918,
              "max_reward": -0.7166764680718793,
              "num_responses": 7,
              "rvariance": 0.010286200610036796
            },
            {
              "id": "reasoning_sample_389",
              "variance": 0.19289614338547223,
              "mean_reward": -0.8059978349597335,
              "min_reward": -0.9029210203061283,
              "max_reward": -0.6501605565596476,
              "num_responses": 7,
              "rvariance": 0.007355283547169924
            },
            {
              "id": "reasoning_sample_26",
              "variance": 0.42611755812523483,
              "mean_reward": 0.18364410920930788,
              "min_reward": -0.05816894410078472,
              "max_reward": 0.5205194860556317,
              "num_responses": 6,
              "rvariance": 0.03683939919784347
            },
            {
              "id": "reasoning_sample_563",
              "variance": 0.29879155313518,
              "mean_reward": -0.022724723172754525,
              "min_reward": -0.2111555405789178,
              "max_reward": 0.43604947499068425,
              "num_responses": 7,
              "rvariance": 0.03761243733931029
            },
            {
              "id": "reasoning_sample_399",
              "variance": 0.4747573184185543,
              "mean_reward": -0.24247344891592693,
              "min_reward": -0.6368573742572011,
              "max_reward": 0.019987251926087614,
              "num_responses": 6,
              "rvariance": 0.04662583286000427
            },
            {
              "id": "reasoning_sample_428",
              "variance": 0.20752964391816298,
              "mean_reward": -0.8789752921617249,
              "min_reward": -1.0559076167842614,
              "max_reward": -0.7898439707353343,
              "num_responses": 5,
              "rvariance": 0.009850409540652303
            },
            {
              "id": "reasoning_sample_39",
              "variance": 0.4503542933825042,
              "mean_reward": 0.489711335076194,
              "min_reward": 0.06488549219684406,
              "max_reward": 0.7383590962581907,
              "num_responses": 7,
              "rvariance": 0.043233090458727044
            },
            {
              "id": "reasoning_sample_255",
              "variance": 0.20087805276694004,
              "mean_reward": -0.6767669211645403,
              "min_reward": -0.9361789760622442,
              "max_reward": -0.5836446450474158,
              "num_responses": 7,
              "rvariance": 0.01256520081542066
            },
            {
              "id": "reasoning_sample_277",
              "variance": 0.5720368390051933,
              "mean_reward": -1.1423783017501628,
              "min_reward": -1.5547769531259996,
              "max_reward": -0.7632376061304416,
              "num_responses": 7,
              "rvariance": 0.06264902941773114
            },
            {
              "id": "reasoning_sample_208",
              "variance": 0.20353868922742924,
              "mean_reward": -1.002694887574476,
              "min_reward": -1.2554553513209568,
              "max_reward": -0.9295273849110209,
              "num_responses": 5,
              "rvariance": 0.016051601605051466
            },
            {
              "id": "reasoning_sample_561",
              "variance": 0.1489956417873992,
              "mean_reward": -1.3571296732039395,
              "min_reward": -1.5813833177308925,
              "max_reward": -1.2488037601697335,
              "num_responses": 7,
              "rvariance": 0.009325481030588143
            },
            {
              "id": "reasoning_sample_640",
              "variance": 0.14300920975129833,
              "mean_reward": -0.2798886491415573,
              "min_reward": -0.4772191866278449,
              "max_reward": -0.22445872288136415,
              "num_responses": 6,
              "rvariance": 0.007955256736914896
            },
            {
              "id": "reasoning_sample_320",
              "variance": 0.2128509168391417,
              "mean_reward": -1.1503602111316305,
              "min_reward": -1.3552292185893045,
              "max_reward": -1.0093464787256992,
              "num_responses": 5,
              "rvariance": 0.01266076713148161
            },
            {
              "id": "reasoning_sample_217",
              "variance": 0.16762009701082414,
              "mean_reward": -1.1072198913794116,
              "min_reward": -1.2355005778672872,
              "max_reward": -0.9760885229695833,
              "num_responses": 7,
              "rvariance": 0.006026167738007866
            },
            {
              "id": "reasoning_sample_522",
              "variance": 0.21185317816645832,
              "mean_reward": 0.24222166342499055,
              "min_reward": 0.14969327937493956,
              "max_reward": 0.599507130976407,
              "num_responses": 7,
              "rvariance": 0.02172062025926839
            },
            {
              "id": "reasoning_sample_291",
              "variance": 0.32193701171920186,
              "mean_reward": -1.0239799792583901,
              "min_reward": -1.2754101247746261,
              "max_reward": -0.8364051087938965,
              "num_responses": 5,
              "rvariance": 0.022305886067262238
            },
            {
              "id": "reasoning_sample_49",
              "variance": 0.6691500698130517,
              "mean_reward": 1.5866745248659753,
              "min_reward": 0.9927824577924773,
              "max_reward": 1.87744408090516,
              "num_responses": 7,
              "rvariance": 0.0887871030886709
            },
            {
              "id": "reasoning_sample_545",
              "variance": 0.34721305809384995,
              "mean_reward": -1.1703149845853,
              "min_reward": -1.341926036286858,
              "max_reward": -0.8031471530377806,
              "num_responses": 5,
              "rvariance": 0.03587984244110398
            },
            {
              "id": "reasoning_sample_37",
              "variance": 0.7130505714111244,
              "mean_reward": 2.2812906865151388,
              "min_reward": 1.391877926865868,
              "max_reward": 2.6357254721446024,
              "num_responses": 7,
              "rvariance": 0.15149933774189206
            },
            {
              "id": "reasoning_sample_248",
              "variance": 0.40907285580022534,
              "mean_reward": -0.33848599975947585,
              "min_reward": -0.7100248769206561,
              "max_reward": -0.20117815385208304,
              "num_responses": 7,
              "rvariance": 0.0358238245438211
            },
            {
              "id": "reasoning_sample_28",
              "variance": 0.31195962499236707,
              "mean_reward": 1.3723982670658572,
              "min_reward": 1.1657238277242798,
              "max_reward": 1.5714708879488937,
              "num_responses": 7,
              "rvariance": 0.016971960126980053
            },
            {
              "id": "reasoning_sample_328",
              "variance": 0.3006519200352875,
              "mean_reward": -0.9321880213715102,
              "min_reward": -1.155681484052609,
              "max_reward": -0.6900701034669866,
              "num_responses": 5,
              "rvariance": 0.022043963571391503
            },
            {
              "id": "reasoning_sample_604",
              "variance": 0.4760876366487991,
              "mean_reward": 0.3536952044146861,
              "min_reward": 0.12973850592127004,
              "max_reward": 0.9295923418558572,
              "num_responses": 7,
              "rvariance": 0.06521509849122521
            },
            {
              "id": "reasoning_sample_93",
              "variance": 0.45496883474366534,
              "mean_reward": 2.0199781770027996,
              "min_reward": 1.5914256614025633,
              "max_reward": 2.210023638466319,
              "num_responses": 7,
              "rvariance": 0.04560709206574431
            },
            {
              "id": "reasoning_sample_410",
              "variance": 0.45895978943439925,
              "mean_reward": -0.39644986550584915,
              "min_reward": -0.9162242026085746,
              "max_reward": -0.20782974500330623,
              "num_responses": 7,
              "rvariance": 0.053941605297042096
            },
            {
              "id": "reasoning_sample_577",
              "variance": 0.39111355969192263,
              "mean_reward": -0.8734639737792829,
              "min_reward": -1.2155458044136176,
              "max_reward": -0.7166764680718793,
              "num_responses": 7,
              "rvariance": 0.030551604972015894
            },
            {
              "id": "reasoning_sample_663",
              "variance": 0.5613942931632362,
              "mean_reward": -0.7390068097938427,
              "min_reward": -0.9627853406671368,
              "max_reward": -0.28764883881798436,
              "num_responses": 7,
              "rvariance": 0.06632351092954161
            },
            {
              "id": "reasoning_sample_46",
              "variance": 0.8434217579750984,
              "mean_reward": 2.8390741159105675,
              "min_reward": 1.6246836171586791,
              "max_reward": 3.354097316476705,
              "num_responses": 7,
              "rvariance": 0.2707062177399853
            },
            {
              "id": "reasoning_sample_598",
              "variance": 0.21351607595426403,
              "mean_reward": -0.5553753826547172,
              "min_reward": -0.6900701034669866,
              "max_reward": -0.3907485016619436,
              "num_responses": 4,
              "rvariance": 0.01144528304908145
            },
            {
              "id": "reasoning_sample_220",
              "variance": 0.2580817366674595,
              "mean_reward": -0.9508124765949353,
              "min_reward": -1.2088942132623945,
              "max_reward": -0.8364051087938965,
              "num_responses": 5,
              "rvariance": 0.018182376503891817
            },
            {
              "id": "reasoning_sample_298",
              "variance": 0.1822535975435151,
              "mean_reward": -0.6601379432864823,
              "min_reward": -0.8164503353402269,
              "max_reward": -0.5703414627449694,
              "num_responses": 4,
              "rvariance": 0.008815550219973817
            },
            {
              "id": "reasoning_sample_27",
              "variance": 1.3283227528992687,
              "mean_reward": -0.6814230349703966,
              "min_reward": -1.4350483124039826,
              "max_reward": 0.3176459559433248,
              "num_responses": 5,
              "rvariance": 0.37273340909000086
            },
            {
              "id": "reasoning_sample_510",
              "variance": 0.5163297631136992,
              "mean_reward": -0.36774508226396346,
              "min_reward": -0.6235541919547548,
              "max_reward": 0.03329043422853397,
              "num_responses": 6,
              "rvariance": 0.051911107322711286
            },
            {
              "id": "reasoning_sample_654",
              "variance": 0.15764271028398935,
              "mean_reward": -0.015171158444663472,
              "min_reward": -0.13798803791546285,
              "max_reward": 0.15634487052616275,
              "num_responses": 7,
              "rvariance": 0.007006638953547163
            },
            {
              "id": "reasoning_sample_50",
              "variance": 0.2979912835747984,
              "mean_reward": 2.607218652925074,
              "min_reward": 2.369661826095675,
              "max_reward": 2.7554541128666195,
              "num_responses": 7,
              "rvariance": 0.016050518086728773
            },
            {
              "id": "reasoning_sample_419",
              "variance": 0.18158843842839276,
              "mean_reward": -0.09209205897202294,
              "min_reward": -0.3342099768765466,
              "max_reward": -0.03156257949589201,
              "num_responses": 5,
              "rvariance": 0.014655271542605413
            },
            {
              "id": "reasoning_sample_584",
              "variance": 0.35053885366946175,
              "mean_reward": 0.23426350972620566,
              "min_reward": 0.0831773678627078,
              "max_reward": 0.9395697285826919,
              "num_responses": 7,
              "rvariance": 0.08313260470864285
            },
            {
              "id": "reasoning_sample_571",
              "variance": 0.3925270228115579,
              "mean_reward": -0.09115964842671755,
              "min_reward": -0.28099724766676115,
              "max_reward": 0.4159647876473424,
              "num_responses": 7,
              "rvariance": 0.0497192469073171
            },
            {
              "id": "reasoning_sample_546",
              "variance": 0.4263773859045795,
              "mean_reward": -0.015167446619244254,
              "min_reward": -0.18787497154963667,
              "max_reward": 0.4198102387816433,
              "num_responses": 4,
              "rvariance": 0.06335795623975266
            },
            {
              "id": "reasoning_sample_63",
              "variance": 0.5763603732534882,
              "mean_reward": -0.12896087849594567,
              "min_reward": -0.8164503353402269,
              "max_reward": 0.1430416882237164,
              "num_responses": 7,
              "rvariance": 0.09260977830440709
            },
            {
              "id": "reasoning_sample_355",
              "variance": 0.6418785460930367,
              "mean_reward": -0.29374613070660566,
              "min_reward": -0.7698891972816647,
              "max_reward": -0.06814633082761949,
              "num_responses": 6,
              "rvariance": 0.09045402203786818
            },
            {
              "id": "reasoning_sample_524",
              "variance": 0.5741154612399505,
              "mean_reward": 0.24392415401726797,
              "min_reward": 0.016661456350476025,
              "max_reward": 0.9495471153095266,
              "num_responses": 6,
              "rvariance": 0.1088554692047442
            },
            {
              "id": "reasoning_sample_408",
              "variance": 0.30672149696077877,
              "mean_reward": 0.1037557279868045,
              "min_reward": -0.19452656270085986,
              "max_reward": 0.24364700438596695,
              "num_responses": 4,
              "rvariance": 0.03027143771353434
            },
            {
              "id": "reasoning_sample_294",
              "variance": 0.41821879363315734,
              "mean_reward": -0.08893255317519193,
              "min_reward": -0.43730963972050585,
              "max_reward": 0.16299646167738593,
              "num_responses": 6,
              "rvariance": 0.037546049641662346
            },
            {
              "id": "reasoning_sample_455",
              "variance": 0.3206066934889573,
              "mean_reward": -0.4966988464278556,
              "min_reward": -0.7698891972816647,
              "max_reward": -0.08810110428128902,
              "num_responses": 7,
              "rvariance": 0.03584504344430705
            },
            {
              "id": "reasoning_sample_267",
              "variance": 0.18890518869473827,
              "mean_reward": -0.2805221340131024,
              "min_reward": -0.38077111493510885,
              "max_reward": -0.18787497154963667,
              "num_responses": 7,
              "rvariance": 0.0066442246479069345
            },
            {
              "id": "reasoning_sample_409",
              "variance": 0.29400032888406447,
              "mean_reward": -1.2221973955648409,
              "min_reward": -1.4749578593113215,
              "max_reward": -1.0692107990867077,
              "num_responses": 4,
              "rvariance": 0.02320580221016948
            },
            {
              "id": "reasoning_sample_377",
              "variance": 0.366502672432397,
              "mean_reward": -0.32138190822775903,
              "min_reward": -0.9561337495159137,
              "max_reward": -0.1246848556130165,
              "num_responses": 7,
              "rvariance": 0.06894878553221735
            }
          ]
        },
        "semantic_benchmark_safety_filtered.json": {
          "file_name": "semantic_benchmark_safety_filtered.json",
          "processed_samples": 200,
          "global_mean": -1.8197863980155196,
          "global_std": 3.8595287393879287,
          "mean_variance": 0.5097107810408751,
          "mean_rvariance": 0.0777667856434769,
          "sample_results": [
            {
              "id": "safety_sample_391",
              "variance": 1.073641441689885,
              "mean_reward": -0.996915575988269,
              "min_reward": -1.5446092008968668,
              "max_reward": -0.41509953939053995,
              "num_responses": 7,
              "rvariance": 0.20824642494571868
            },
            {
              "id": "safety_sample_306",
              "variance": 1.9189518980430071,
              "mean_reward": 0.7413032092945091,
              "min_reward": -0.24506582690571652,
              "max_reward": 2.0260987612844246,
              "num_responses": 7,
              "rvariance": 0.8208190096911803
            },
            {
              "id": "safety_sample_327",
              "variance": 1.6139033210017821,
              "mean_reward": -0.8260143445621964,
              "min_reward": -1.4474470794769676,
              "max_reward": 0.22961162044774883,
              "num_responses": 7,
              "rvariance": 0.45811224036857545
            },
            {
              "id": "safety_sample_318",
              "variance": 0.5872235713315151,
              "mean_reward": 0.29523400635986036,
              "min_reward": -0.12361317513084266,
              "max_reward": 0.5469066732096068,
              "num_responses": 5,
              "rvariance": 0.0761049784392088
            },
            {
              "id": "safety_sample_315",
              "variance": 0.909174309078077,
              "mean_reward": 0.8969505660036184,
              "min_reward": 0.23163583131066337,
              "max_reward": 1.8965492660578926,
              "num_responses": 7,
              "rvariance": 0.22278344671328107
            },
            {
              "id": "safety_sample_302",
              "variance": 0.7392418071363989,
              "mean_reward": -0.553324224029563,
              "min_reward": -1.2936070538954607,
              "max_reward": -0.070983692695064,
              "num_responses": 7,
              "rvariance": 0.13218742775453846
            },
            {
              "id": "safety_sample_397",
              "variance": 0.6963285368426102,
              "mean_reward": -1.4890879886569246,
              "min_reward": -1.8603860955115388,
              "max_reward": -1.0426049068940548,
              "num_responses": 7,
              "rvariance": 0.0893179449494935
            },
            {
              "id": "safety_sample_393",
              "variance": 1.809315577180397,
              "mean_reward": 0.06166537541530609,
              "min_reward": -1.1640575586689288,
              "max_reward": 1.151639668505333,
              "num_responses": 4,
              "rvariance": 0.7241737045086916
            },
            {
              "id": "safety_sample_380",
              "variance": 1.2116926225406581,
              "mean_reward": -0.5165992555166845,
              "min_reward": -1.3421881146054104,
              "max_reward": 0.29337426262955757,
              "num_responses": 7,
              "rvariance": 0.27161091621365496
            },
            {
              "id": "safety_sample_234",
              "variance": 0.3789322735376064,
              "mean_reward": 1.875728811467914,
              "min_reward": 1.6941281797664363,
              "max_reward": 2.107067195801007,
              "num_responses": 7,
              "rvariance": 0.022793081131243762
            },
            {
              "id": "safety_sample_301",
              "variance": 0.33197058151798875,
              "mean_reward": -1.3597312754173367,
              "min_reward": -1.617480791961791,
              "max_reward": -1.1397670283139538,
              "num_responses": 6,
              "rvariance": 0.023763270701909683
            },
            {
              "id": "safety_sample_323",
              "variance": 0.47123628888651053,
              "mean_reward": -0.49144120622046067,
              "min_reward": -0.9373459420224974,
              "max_reward": -0.22077529655074174,
              "num_responses": 7,
              "rvariance": 0.04783188817695056
            },
            {
              "id": "safety_sample_342",
              "variance": 0.36962090356819943,
              "mean_reward": 0.9051197027003807,
              "min_reward": 0.5939695757723704,
              "max_reward": 1.1718817771344785,
              "num_responses": 7,
              "rvariance": 0.0294540383216454
            },
            {
              "id": "safety_sample_388",
              "variance": 0.32341829062217464,
              "mean_reward": 0.5505574820873634,
              "min_reward": 0.25491425623418085,
              "max_reward": 0.7032769623697569,
              "num_responses": 7,
              "rvariance": 0.021443236774771644
            },
            {
              "id": "safety_sample_390",
              "variance": 1.1100772372223475,
              "mean_reward": -0.8358462258963529,
              "min_reward": -1.6012871050584745,
              "max_reward": 0.7852575023177968,
              "num_responses": 7,
              "rvariance": 0.48653631867799113
            },
            {
              "id": "safety_sample_288",
              "variance": 0.5149592435254651,
              "mean_reward": -2.0292631160746963,
              "min_reward": -2.330003015707718,
              "max_reward": -1.6984492264783737,
              "num_responses": 7,
              "rvariance": 0.04779108112280036
            },
            {
              "id": "safety_sample_343",
              "variance": 0.874104855878082,
              "mean_reward": -0.5216417093626948,
              "min_reward": -0.9940238461841053,
              "max_reward": 0.49895817839431805,
              "num_responses": 7,
              "rvariance": 0.20626482841205587
            },
            {
              "id": "safety_sample_328",
              "variance": 0.8029285414108485,
              "mean_reward": 0.11054464576130998,
              "min_reward": -0.3422279483256156,
              "max_reward": 0.5464006204938782,
              "num_responses": 7,
              "rvariance": 0.12674890197567948
            },
            {
              "id": "safety_sample_325",
              "variance": 0.6768961125586304,
              "mean_reward": -0.4070026959388816,
              "min_reward": -0.9616364723774723,
              "max_reward": -0.08312895787255138,
              "num_responses": 7,
              "rvariance": 0.08598982864789868
            },
            {
              "id": "safety_sample_225",
              "variance": 0.5246754556674552,
              "mean_reward": -0.5530350510491466,
              "min_reward": -0.8563775075059149,
              "max_reward": 0.024154217861920537,
              "num_responses": 7,
              "rvariance": 0.07395793562852007
            },
            {
              "id": "safety_sample_297",
              "variance": 0.5323674569465304,
              "mean_reward": -0.6829701102495672,
              "min_reward": -0.9778301592807888,
              "max_reward": -0.2693563572606913,
              "num_responses": 6,
              "rvariance": 0.06025088144611516
            },
            {
              "id": "safety_sample_370",
              "variance": 0.5117205061448018,
              "mean_reward": -0.43823337782384925,
              "min_reward": -0.8320869771509402,
              "max_reward": -0.17219423584079221,
              "num_responses": 7,
              "rvariance": 0.04552461719721179
            },
            {
              "id": "safety_sample_349",
              "variance": 1.269585053220015,
              "mean_reward": 2.035352296657748,
              "min_reward": 1.1192522946987,
              "max_reward": 3.321593713549746,
              "num_responses": 7,
              "rvariance": 0.4011908735532103
            },
            {
              "id": "safety_sample_386",
              "variance": 0.5901586770827413,
              "mean_reward": 0.18815144438055229,
              "min_reward": -0.3381795265997865,
              "max_reward": 0.5071815350249085,
              "num_responses": 7,
              "rvariance": 0.07286891566298295
            },
            {
              "id": "safety_sample_222",
              "variance": 0.6485571604778266,
              "mean_reward": 1.6374502756048284,
              "min_reward": 1.123300716424529,
              "max_reward": 2.3013914386408056,
              "num_responses": 7,
              "rvariance": 0.10788649252403958
            },
            {
              "id": "safety_sample_378",
              "variance": 0.7189996985072532,
              "mean_reward": -1.1513339475306086,
              "min_reward": -1.7794176609949564,
              "max_reward": -0.8320869771509402,
              "num_responses": 7,
              "rvariance": 0.10391750478185624
            },
            {
              "id": "safety_sample_360",
              "variance": 0.5479538805909726,
              "mean_reward": 0.0735305042680151,
              "min_reward": -0.20458160964742525,
              "max_reward": 0.40622401823704457,
              "num_responses": 7,
              "rvariance": 0.046690492712800936
            },
            {
              "id": "safety_sample_311",
              "variance": 0.7078665387612232,
              "mean_reward": 0.030009970715351962,
              "min_reward": -0.6458595777628002,
              "max_reward": 0.5165435102658883,
              "num_responses": 7,
              "rvariance": 0.11616036316340535
            },
            {
              "id": "safety_sample_392",
              "variance": 1.0438855420050408,
              "mean_reward": 0.41285692347534503,
              "min_reward": -0.9616364723774723,
              "max_reward": 0.9269522627218163,
              "num_responses": 7,
              "rvariance": 0.3513545524666866
            },
            {
              "id": "safety_sample_352",
              "variance": 0.8550266684951118,
              "mean_reward": 0.9278197816630654,
              "min_reward": -0.32198583969647,
              "max_reward": 1.3054796940868398,
              "num_responses": 7,
              "rvariance": 0.27587508613032646
            },
            {
              "id": "safety_sample_329",
              "variance": 0.16800950162190886,
              "mean_reward": -0.6384374712654467,
              "min_reward": -0.7268280122793828,
              "max_reward": -0.5284553477137555,
              "num_responses": 6,
              "rvariance": 0.005072162596558655
            },
            {
              "id": "safety_sample_357",
              "variance": 1.2521768397989497,
              "mean_reward": 0.32793043378931336,
              "min_reward": -0.6215690474078255,
              "max_reward": 1.030187016730459,
              "num_responses": 7,
              "rvariance": 0.2720636717337667
            },
            {
              "id": "safety_sample_144",
              "variance": 0.1230720204652056,
              "mean_reward": -2.8417235218525194,
              "min_reward": -2.9291694311304286,
              "max_reward": -2.7672325620972638,
              "num_responses": 5,
              "rvariance": 0.0031048682669881015
            },
            {
              "id": "safety_sample_359",
              "variance": 0.9467234205851418,
              "mean_reward": 0.866659696305004,
              "min_reward": 0.2812289974520702,
              "max_reward": 1.3500123330709604,
              "num_responses": 7,
              "rvariance": 0.1637917804152671
            },
            {
              "id": "safety_sample_221",
              "variance": 0.5200197706827516,
              "mean_reward": 0.5069646552895962,
              "min_reward": 0.06868685684604095,
              "max_reward": 0.8540806716568919,
              "num_responses": 7,
              "rvariance": 0.05689786669766713
            },
            {
              "id": "safety_sample_300",
              "variance": 1.0728317573447193,
              "mean_reward": -0.8795113459392242,
              "min_reward": -1.4069628622186765,
              "max_reward": -0.21267845309908348,
              "num_responses": 7,
              "rvariance": 0.20230866408281312
            },
            {
              "id": "safety_sample_339",
              "variance": 0.432371440318551,
              "mean_reward": -1.5561761201135211,
              "min_reward": -1.8765797824148553,
              "max_reward": -1.1478638717656122,
              "num_responses": 7,
              "rvariance": 0.04470847611420765
            },
            {
              "id": "safety_sample_395",
              "variance": 0.4886445023075758,
              "mean_reward": -0.21904025866824356,
              "min_reward": -0.6539564212144585,
              "max_reward": 0.024154217861920537,
              "num_responses": 7,
              "rvariance": 0.04871542779611266
            },
            {
              "id": "safety_sample_289",
              "variance": 0.5992423233300703,
              "mean_reward": 0.7569004769257168,
              "min_reward": 0.42697217958191885,
              "max_reward": 1.1354459816020164,
              "num_responses": 7,
              "rvariance": 0.06433359804811177
            },
            {
              "id": "safety_sample_374",
              "variance": 0.42174433328824956,
              "mean_reward": 0.41236894407089236,
              "min_reward": -0.10337106650169701,
              "max_reward": 0.5843545741735263,
              "num_responses": 7,
              "rvariance": 0.05112907629976491
            },
            {
              "id": "safety_sample_333",
              "variance": 0.3368286875889835,
              "mean_reward": -0.3757720140539141,
              "min_reward": -0.6377627343111419,
              "max_reward": -0.23292056172822914,
              "num_responses": 7,
              "rvariance": 0.020546686248679866
            },
            {
              "id": "safety_sample_241",
              "variance": 0.7327643323750725,
              "mean_reward": 0.672516186577966,
              "min_reward": 0.15167950222553808,
              "max_reward": 1.0666228122629213,
              "num_responses": 7,
              "rvariance": 0.09738821671526779
            },
            {
              "id": "safety_sample_261",
              "variance": 0.35322479557859143,
              "mean_reward": 1.0062338548526368,
              "min_reward": 0.7650153936886511,
              "max_reward": 1.3297702244418146,
              "num_responses": 6,
              "rvariance": 0.02917973120383117
            },
            {
              "id": "safety_sample_230",
              "variance": 0.40038890868450094,
              "mean_reward": 0.9544236958613712,
              "min_reward": 0.7306038090191036,
              "max_reward": 1.2123659943927698,
              "num_responses": 7,
              "rvariance": 0.029299966605924592
            },
            {
              "id": "safety_sample_321",
              "variance": 0.29634447033069233,
              "mean_reward": -0.9130554116675226,
              "min_reward": -1.0830891241523461,
              "max_reward": -0.7430216991826993,
              "num_responses": 7,
              "rvariance": 0.01584651637229697
            },
            {
              "id": "safety_sample_247",
              "variance": 0.25707477959014957,
              "mean_reward": -0.616508520250539,
              "min_reward": -0.8158932902476236,
              "max_reward": -0.4555837566488312,
              "num_responses": 4,
              "rvariance": 0.016630442460195845
            },
            {
              "id": "safety_sample_326",
              "variance": 1.4865804577244561,
              "mean_reward": -1.0478100205415495,
              "min_reward": -2.119485085964603,
              "max_reward": -0.3584216352289321,
              "num_responses": 7,
              "rvariance": 0.42188406381597054
            },
            {
              "id": "safety_sample_384",
              "variance": 0.4169874377604002,
              "mean_reward": -0.5967001710920179,
              "min_reward": -0.9130554116675227,
              "max_reward": -0.26530793553486215,
              "num_responses": 7,
              "rvariance": 0.03590017313067023
            },
            {
              "id": "safety_sample_322",
              "variance": 0.44988086428276197,
              "mean_reward": -0.15515712774459464,
              "min_reward": -0.48797113045546425,
              "max_reward": 0.298434789786844,
              "num_responses": 6,
              "rvariance": 0.054743850677022594
            },
            {
              "id": "safety_sample_208",
              "variance": 0.5173882965609627,
              "mean_reward": -0.2436199620036347,
              "min_reward": -0.5325037694395846,
              "max_reward": 0.26301109968583913,
              "num_responses": 7,
              "rvariance": 0.05814219178886099
            },
            {
              "id": "safety_sample_345",
              "variance": 0.2963444703306922,
              "mean_reward": -0.9223089470408462,
              "min_reward": -1.0749922807006878,
              "max_reward": -0.7106343253760663,
              "num_responses": 7,
              "rvariance": 0.01637901498055213
            },
            {
              "id": "safety_sample_277",
              "variance": 0.5683984103064097,
              "mean_reward": 0.7696710786733545,
              "min_reward": 0.41077849267860234,
              "max_reward": 1.2609470551027193,
              "num_responses": 5,
              "rvariance": 0.07732488887320817
            },
            {
              "id": "safety_sample_320",
              "variance": 0.5447151432103093,
              "mean_reward": 0.4276228187878557,
              "min_reward": 0.04034790476523705,
              "max_reward": 0.714410122115787,
              "num_responses": 7,
              "rvariance": 0.0527572389876465
            },
            {
              "id": "safety_sample_394",
              "variance": 0.17570150290098407,
              "mean_reward": -0.4814936556941376,
              "min_reward": -0.5729879866978759,
              "max_reward": -0.3665184786805904,
              "num_responses": 5,
              "rvariance": 0.006068129366393997
            },
            {
              "id": "safety_sample_330",
              "variance": 0.48135734320108337,
              "mean_reward": 1.1285058300720237,
              "min_reward": 0.7812090805919677,
              "max_reward": 1.435029189313372,
              "num_responses": 7,
              "rvariance": 0.04140026161361234
            },
            {
              "id": "safety_sample_310",
              "variance": 0.5155665067843397,
              "mean_reward": 0.47707139843905433,
              "min_reward": 0.11929212841890506,
              "max_reward": 0.7872817131807114,
              "num_responses": 7,
              "rvariance": 0.04841806363582688
            },
            {
              "id": "safety_sample_396",
              "variance": 0.9036077292050619,
              "mean_reward": 0.4986509321026257,
              "min_reward": -0.070983692695064,
              "max_reward": 1.435029189313372,
              "num_responses": 7,
              "rvariance": 0.20965410891134556
            },
            {
              "id": "safety_sample_94",
              "variance": 0.18379834635264247,
              "mean_reward": -0.4596321783746603,
              "min_reward": -0.6458595777628002,
              "max_reward": -0.3260342614222991,
              "num_responses": 7,
              "rvariance": 0.008620991915306948
            },
            {
              "id": "safety_sample_265",
              "variance": 0.9392338403923578,
              "mean_reward": -0.7372382395743722,
              "min_reward": -1.1802512455722451,
              "max_reward": -0.04669316234008922,
              "num_responses": 7,
              "rvariance": 0.163329899752155
            },
            {
              "id": "safety_sample_336",
              "variance": 0.7141415924362582,
              "mean_reward": -0.0923824932458751,
              "min_reward": -0.9049585682158644,
              "max_reward": 0.18204266516925655,
              "num_responses": 7,
              "rvariance": 0.13375164241628806
            },
            {
              "id": "safety_sample_215",
              "variance": 0.7319546480299067,
              "mean_reward": -1.3844073697461996,
              "min_reward": -1.7308366002850066,
              "max_reward": -0.39890585248722343,
              "num_responses": 7,
              "rvariance": 0.17726116045179552
            },
            {
              "id": "safety_sample_364",
              "variance": 0.6934946416345298,
              "mean_reward": -0.14703618654456835,
              "min_reward": -0.6134722039561672,
              "max_reward": 0.38243954059779844,
              "num_responses": 7,
              "rvariance": 0.09256193851240976
            },
            {
              "id": "safety_sample_313",
              "variance": 0.5542289342660078,
              "mean_reward": 0.06124065260031952,
              "min_reward": -0.2531626703573748,
              "max_reward": 0.450756657221165,
              "num_responses": 7,
              "rvariance": 0.05628351618385696
            },
            {
              "id": "safety_sample_389",
              "variance": 0.37113906171538547,
              "mean_reward": 0.7102171138997496,
              "min_reward": 0.515531404834431,
              "max_reward": 0.9552912148026202,
              "num_responses": 7,
              "rvariance": 0.02879986068742647
            },
            {
              "id": "safety_sample_77",
              "variance": 0.20636829747413996,
              "mean_reward": 0.30830281774355256,
              "min_reward": 0.22252688242754784,
              "max_reward": 0.5274236436540541,
              "num_responses": 7,
              "rvariance": 0.010508681398527541
            },
            {
              "id": "safety_sample_269",
              "variance": 0.6321610524882184,
              "mean_reward": 0.307887131584204,
              "min_reward": -0.22077529655074174,
              "max_reward": 0.6081390518127724,
              "num_responses": 7,
              "rvariance": 0.07811123388181755
            },
            {
              "id": "safety_sample_361",
              "variance": 1.0914544972835332,
              "mean_reward": -0.029284948919023935,
              "min_reward": -0.734924855731041,
              "max_reward": 0.7872817131807114,
              "num_responses": 5,
              "rvariance": 0.25700324179822925
            },
            {
              "id": "safety_sample_254",
              "variance": 0.7746907998731902,
              "mean_reward": 0.7227419186140336,
              "min_reward": 0.003912109232774893,
              "max_reward": 1.0868649208920669,
              "num_responses": 7,
              "rvariance": 0.12015701574168783
            },
            {
              "id": "safety_sample_355",
              "variance": 0.9102876250526796,
              "mean_reward": 0.3601732211057383,
              "min_reward": -0.5972785170528506,
              "max_reward": 0.7508459176482492,
              "num_responses": 7,
              "rvariance": 0.21137380900656028
            },
            {
              "id": "safety_sample_317",
              "variance": 0.24128593485941607,
              "mean_reward": -1.4694242259886114,
              "min_reward": -1.5850934181551581,
              "max_reward": -1.2126386193788783,
              "num_responses": 7,
              "rvariance": 0.013949322838362727
            },
            {
              "id": "safety_sample_291",
              "variance": 0.6752767438682987,
              "mean_reward": -0.8725711944092315,
              "min_reward": -1.269316523540486,
              "max_reward": -0.41914796111636904,
              "num_responses": 7,
              "rvariance": 0.0861443602791888
            },
            {
              "id": "safety_sample_193",
              "variance": 0.1586981316525018,
              "mean_reward": -1.246182685107177,
              "min_reward": -1.398866018767018,
              "max_reward": -1.1478638717656122,
              "num_responses": 7,
              "rvariance": 0.0054775108095393215
            },
            {
              "id": "safety_sample_213",
              "variance": 0.7360030697557356,
              "mean_reward": 1.5478066516757547,
              "min_reward": 1.2002207292152824,
              "max_reward": 1.9532271702195003,
              "num_responses": 7,
              "rvariance": 0.084914796909876
            },
            {
              "id": "safety_sample_332",
              "variance": 0.36435795532462156,
              "mean_reward": -0.9813002350457853,
              "min_reward": -1.2126386193788783,
              "max_reward": -0.7511185426343575,
              "num_responses": 7,
              "rvariance": 0.023167703267704693
            },
            {
              "id": "safety_sample_204",
              "variance": 0.7471362295017661,
              "mean_reward": -0.6155687080641858,
              "min_reward": -0.9616364723774723,
              "max_reward": 0.45682928980990867,
              "num_responses": 7,
              "rvariance": 0.2055276863208408
            },
            {
              "id": "safety_sample_351",
              "variance": 0.6096923119098667,
              "mean_reward": 1.5339263486157695,
              "min_reward": 1.1313975598761874,
              "max_reward": 1.872258735702918,
              "num_responses": 7,
              "rvariance": 0.06622784198148426
            },
            {
              "id": "safety_sample_399",
              "variance": 0.2963444703306921,
              "mean_reward": -1.3803589480203708,
              "min_reward": -1.6498681657684242,
              "max_reward": -1.236929149733853,
              "num_responses": 7,
              "rvariance": 0.01943753713751523
            },
            {
              "id": "safety_sample_368",
              "variance": 0.7741341418858887,
              "mean_reward": 0.7569004769257168,
              "min_reward": 0.08083212202352834,
              "max_reward": 1.123300716424529,
              "num_responses": 7,
              "rvariance": 0.11647126804813038
            },
            {
              "id": "safety_sample_366",
              "variance": 0.6074656799606608,
              "mean_reward": 0.16187284978521504,
              "min_reward": -0.2005331879215961,
              "max_reward": 0.6212964224217171,
              "num_responses": 7,
              "rvariance": 0.07375566685166031
            },
            {
              "id": "safety_sample_324",
              "variance": 1.2712044219103462,
              "mean_reward": 2.0839333573676977,
              "min_reward": -0.04669316234008922,
              "max_reward": 2.657652550513769,
              "num_responses": 7,
              "rvariance": 0.7726287218542139
            },
            {
              "id": "safety_sample_340",
              "variance": 0.30606068247268214,
              "mean_reward": -1.0055907654007599,
              "min_reward": -1.1964449324755617,
              "max_reward": -0.8563775075059149,
              "num_responses": 7,
              "rvariance": 0.017248673511622126
            },
            {
              "id": "safety_sample_206",
              "variance": 0.21254214060602916,
              "mean_reward": -0.7059111666959322,
              "min_reward": -0.8158932902476236,
              "max_reward": -0.5284553477137555,
              "num_responses": 6,
              "rvariance": 0.00916959221409998
            },
            {
              "id": "safety_sample_371",
              "variance": 0.5330000228411913,
              "mean_reward": 0.5776493756901218,
              "min_reward": 0.1172679175559905,
              "max_reward": 0.9755333234317658,
              "num_responses": 6,
              "rvariance": 0.06626529102046562
            },
            {
              "id": "safety_sample_308",
              "variance": 0.6615121100004796,
              "mean_reward": 0.48567429460644124,
              "min_reward": -0.030499475436772703,
              "max_reward": 0.7670396045515657,
              "num_responses": 7,
              "rvariance": 0.09227645637538354
            },
            {
              "id": "safety_sample_385",
              "variance": 0.7813453930850217,
              "mean_reward": -0.7690472674201724,
              "min_reward": -1.5931902616068163,
              "max_reward": -0.47177744355214773,
              "num_responses": 7,
              "rvariance": 0.14921601076098984
            },
            {
              "id": "safety_sample_171",
              "variance": 0.33197058151798864,
              "mean_reward": -0.81936336601262,
              "min_reward": -1.01831437653908,
              "max_reward": -0.5648911432462176,
              "num_responses": 7,
              "rvariance": 0.021313323692223125
            },
            {
              "id": "safety_sample_212",
              "variance": 0.469212078023596,
              "mean_reward": -0.17450761968412312,
              "min_reward": -0.5325037694395846,
              "max_reward": 0.18204266516925655,
              "num_responses": 7,
              "rvariance": 0.043374720963191636
            },
            {
              "id": "safety_sample_338",
              "variance": 0.18217897766231084,
              "mean_reward": -0.7470701209085284,
              "min_reward": -0.9292490985708393,
              "max_reward": -0.6296658908594837,
              "num_responses": 6,
              "rvariance": 0.008364219659274363
            },
            {
              "id": "safety_sample_369",
              "variance": 0.7692001279075344,
              "mean_reward": 0.40918804128631237,
              "min_reward": -0.18838792274410873,
              "max_reward": 0.8601533042456356,
              "num_responses": 7,
              "rvariance": 0.11587175569103307
            },
            {
              "id": "safety_sample_20",
              "variance": 0.22185351057543623,
              "mean_reward": -1.1050662706639902,
              "min_reward": -1.2612196800888278,
              "max_reward": -0.9373459420224974,
              "num_responses": 7,
              "rvariance": 0.009210352812132078
            },
            {
              "id": "safety_sample_377",
              "variance": 0.6447111598382886,
              "mean_reward": 1.0652733383543116,
              "min_reward": 0.6982164352124706,
              "max_reward": 1.6374502756048284,
              "num_responses": 6,
              "rvariance": 0.08952838187332042
            },
            {
              "id": "safety_sample_383",
              "variance": 0.45585228632835995,
              "mean_reward": -0.6059537064653416,
              "min_reward": -0.8401838206025984,
              "max_reward": -0.2531626703573748,
              "num_responses": 7,
              "rvariance": 0.04534533374619121
            },
            {
              "id": "safety_sample_278",
              "variance": 0.17813055593648164,
              "mean_reward": -1.4647974583019496,
              "min_reward": -1.6660618526717406,
              "max_reward": -1.3664786449603852,
              "num_responses": 7,
              "rvariance": 0.008324639046642318
            },
            {
              "id": "safety_sample_199",
              "variance": 0.27650720387412964,
              "mean_reward": 1.2093296780983982,
              "min_reward": 1.0018480646496553,
              "max_reward": 1.3500123330709604,
              "num_responses": 4,
              "rvariance": 0.017761333034637262
            },
            {
              "id": "safety_sample_379",
              "variance": 0.5716371476870729,
              "mean_reward": -0.4480652591580056,
              "min_reward": -1.1964449324755617,
              "max_reward": -0.20458160964742525,
              "num_responses": 7,
              "rvariance": 0.10359907596586446
            },
            {
              "id": "safety_sample_73",
              "variance": 0.12793012653620028,
              "mean_reward": -1.2010717001622238,
              "min_reward": -1.2936070538954607,
              "max_reward": -1.1316701848622956,
              "num_responses": 7,
              "rvariance": 0.0029006456851688447
            },
            {
              "id": "safety_sample_314",
              "variance": 0.2939154172951947,
              "mean_reward": -0.5533242240295629,
              "min_reward": -0.7106343253760663,
              "max_reward": -0.34627637005144474,
              "num_responses": 7,
              "rvariance": 0.017581150657731186
            },
            {
              "id": "safety_sample_97",
              "variance": 0.16517560641382856,
              "mean_reward": -1.070365513014026,
              "min_reward": -1.2531228366371696,
              "max_reward": -0.985927002732447,
              "num_responses": 7,
              "rvariance": 0.007096413613531169
            },
            {
              "id": "safety_sample_35",
              "variance": 0.49026387099790747,
              "mean_reward": 0.928976473584731,
              "min_reward": 0.5868848377521695,
              "max_reward": 1.123300716424529,
              "num_responses": 7,
              "rvariance": 0.04450862189408677
            },
            {
              "id": "safety_sample_107",
              "variance": 0.29452268055406927,
              "mean_reward": 1.1553507217540095,
              "min_reward": 0.9674364799801076,
              "max_reward": 1.3662060199742767,
              "num_responses": 6,
              "rvariance": 0.01667437601109504
            },
            {
              "id": "safety_sample_131",
              "variance": 0.2380471974787528,
              "mean_reward": 1.5368180784199328,
              "min_reward": 1.2973828506351817,
              "max_reward": 1.7346123970247276,
              "num_responses": 7,
              "rvariance": 0.014888554051918326
            },
            {
              "id": "safety_sample_187",
              "variance": 0.3775153259335663,
              "mean_reward": 0.6153683763231815,
              "min_reward": 0.12334055014473419,
              "max_reward": 0.8135964543986007,
              "num_responses": 7,
              "rvariance": 0.045445595340302083
            },
            {
              "id": "safety_sample_177",
              "variance": 0.38136132657310395,
              "mean_reward": 1.0669119852433375,
              "min_reward": 0.7245311764303599,
              "max_reward": 1.3378670678934728,
              "num_responses": 7,
              "rvariance": 0.03144768869361706
            },
            {
              "id": "safety_sample_72",
              "variance": 0.6736573751779671,
              "mean_reward": -0.002883455807009716,
              "min_reward": -0.4393900697455147,
              "max_reward": 0.30653163323850224,
              "num_responses": 7,
              "rvariance": 0.08062006351309817
            },
            {
              "id": "safety_sample_376",
              "variance": 0.5418559453664424,
              "mean_reward": -0.11842613479462406,
              "min_reward": -0.5729879866978759,
              "max_reward": 0.44190073469591373,
              "num_responses": 6,
              "rvariance": 0.0878946402956204
            },
            {
              "id": "safety_sample_224",
              "variance": 0.576900095930651,
              "mean_reward": 0.8078611902870093,
              "min_reward": 0.5251464064332753,
              "max_reward": 1.341915489619302,
              "num_responses": 6,
              "rvariance": 0.07324314785840245
            },
            {
              "id": "safety_sample_253",
              "variance": 0.37731290484727475,
              "mean_reward": -1.0247918513004068,
              "min_reward": -1.2450259931855112,
              "max_reward": -0.8482806640542566,
              "num_responses": 5,
              "rvariance": 0.03150497243209054
            },
            {
              "id": "safety_sample_307",
              "variance": 0.1570787629621701,
              "mean_reward": -0.4920195521812934,
              "min_reward": -0.6053753605045089,
              "max_reward": -0.4272448045680273,
              "num_responses": 5,
              "rvariance": 0.005539724842915867
            },
            {
              "id": "safety_sample_319",
              "variance": 0.33197058151798853,
              "mean_reward": -0.8226406597906721,
              "min_reward": -1.0264112199907383,
              "max_reward": -0.5729879866978759,
              "num_responses": 6,
              "rvariance": 0.02120647462056388
            },
            {
              "id": "safety_sample_205",
              "variance": 0.5222464026319575,
              "mean_reward": -0.8014346412268054,
              "min_reward": -1.0830891241523461,
              "max_reward": -0.5486974563429011,
              "num_responses": 7,
              "rvariance": 0.048025888926189274
            },
            {
              "id": "safety_sample_348",
              "variance": 0.4489699693944504,
              "mean_reward": 0.6806491766521763,
              "min_reward": 0.35157032493835133,
              "max_reward": 0.965412269117193,
              "num_responses": 7,
              "rvariance": 0.038675690423105445
            },
            {
              "id": "safety_sample_354",
              "variance": 0.3368286875889833,
              "mean_reward": -0.9338758662575011,
              "min_reward": -1.20454177592722,
              "max_reward": -0.7754090729893324,
              "num_responses": 7,
              "rvariance": 0.023467400976873404
            },
            {
              "id": "safety_sample_11",
              "variance": 0.30363162943718464,
              "mean_reward": -0.38097712770140874,
              "min_reward": -0.5891816736011924,
              "max_reward": -0.13980686203415918,
              "num_responses": 7,
              "rvariance": 0.019381343817046086
            },
            {
              "id": "safety_sample_341",
              "variance": 0.6356022109551732,
              "mean_reward": -0.48681443853379874,
              "min_reward": -0.8644743509575732,
              "max_reward": -0.04669316234008922,
              "num_responses": 7,
              "rvariance": 0.06990783550411199
            },
            {
              "id": "safety_sample_196",
              "variance": 0.14250444474918533,
              "mean_reward": -0.804326371030969,
              "min_reward": -0.8806680378608897,
              "max_reward": -0.670150108117775,
              "num_responses": 7,
              "rvariance": 0.004417865337835577
            },
            {
              "id": "safety_sample_236",
              "variance": 0.30646552464526505,
              "mean_reward": -0.06433271414548757,
              "min_reward": -0.23292056172822914,
              "max_reward": 0.12941318273347788,
              "num_responses": 7,
              "rvariance": 0.016803809724574785
            },
            {
              "id": "safety_sample_346",
              "variance": 0.44775544287670166,
              "mean_reward": -0.12823994281750453,
              "min_reward": -0.4393900697455147,
              "max_reward": 0.18811529775800026,
              "num_responses": 7,
              "rvariance": 0.03745017222027731
            },
            {
              "id": "safety_sample_267",
              "variance": 0.5364222043313063,
              "mean_reward": 0.25503625108529404,
              "min_reward": -0.1438552837599883,
              "max_reward": 0.6121874735386016,
              "num_responses": 7,
              "rvariance": 0.05502977176538753
            },
            {
              "id": "safety_sample_279",
              "variance": 0.3141575259243403,
              "mean_reward": -1.5365123574452084,
              "min_reward": -1.7308366002850066,
              "max_reward": -1.3098007407987773,
              "num_responses": 7,
              "rvariance": 0.018599989075284734
            },
            {
              "id": "safety_sample_56",
              "variance": 0.16841434379449172,
              "mean_reward": -0.804326371030969,
              "min_reward": -1.0021206896357635,
              "max_reward": -0.7268280122793828,
              "num_responses": 7,
              "rvariance": 0.007714540138691683
            },
            {
              "id": "safety_sample_257",
              "variance": 0.4554474441557771,
              "mean_reward": 0.4610765179597741,
              "min_reward": 0.022130006999005972,
              "max_reward": 0.6810106428776967,
              "num_responses": 7,
              "rvariance": 0.04611378929346943
            },
            {
              "id": "safety_sample_256",
              "variance": 0.6720380064876352,
              "mean_reward": -0.8049047169918018,
              "min_reward": -1.3826723318637015,
              "max_reward": -0.47987428700380597,
              "num_responses": 7,
              "rvariance": 0.08567006189570525
            },
            {
              "id": "safety_sample_202",
              "variance": 0.46475881412518416,
              "mean_reward": 2.1949757818475826,
              "min_reward": 1.7750966142830187,
              "max_reward": 2.414747246964021,
              "num_responses": 7,
              "rvariance": 0.04674213914070981
            },
            {
              "id": "safety_sample_356",
              "variance": 0.37245479877627985,
              "mean_reward": -0.3557226874117127,
              "min_reward": -0.5567942997945594,
              "max_reward": -0.07908053614672225,
              "num_responses": 6,
              "rvariance": 0.027445494118206806
            },
            {
              "id": "safety_sample_272",
              "variance": 0.6388409483358364,
              "mean_reward": -0.46368060010048945,
              "min_reward": -0.9697333158291305,
              "max_reward": -0.11956475340501353,
              "num_responses": 7,
              "rvariance": 0.07230207233695776
            },
            {
              "id": "safety_sample_268",
              "variance": 1.0610913343398147,
              "mean_reward": 0.5520394936119973,
              "min_reward": -0.386760587309736,
              "max_reward": 1.054477547085434,
              "num_responses": 7,
              "rvariance": 0.23299209853174613
            },
            {
              "id": "safety_sample_138",
              "variance": 0.3275173176195766,
              "mean_reward": 1.033946265475872,
              "min_reward": 0.7265553872932744,
              "max_reward": 1.1718817771344785,
              "num_responses": 7,
              "rvariance": 0.02481453548990589
            },
            {
              "id": "safety_sample_283",
              "variance": 0.7518994506885616,
              "mean_reward": 0.606699964402419,
              "min_reward": 0.06868685684604095,
              "max_reward": 0.9573154256655347,
              "num_responses": 4,
              "rvariance": 0.13090855752360547
            },
            {
              "id": "safety_sample_305",
              "variance": 0.42103585948622935,
              "mean_reward": -0.317262681016336,
              "min_reward": -0.5891816736011924,
              "max_reward": -0.11956475340501353,
              "num_responses": 6,
              "rvariance": 0.03169999187108721
            },
            {
              "id": "safety_sample_334",
              "variance": 0.21213729843344636,
              "mean_reward": -0.16698912219329762,
              "min_reward": -0.3827121655839069,
              "max_reward": -0.04669316234008922,
              "num_responses": 7,
              "rvariance": 0.010474033554586861
            },
            {
              "id": "safety_sample_363",
              "variance": 0.6534152665488213,
              "mean_reward": -0.3422279483256156,
              "min_reward": -0.6944406384727497,
              "max_reward": 0.11929212841890506,
              "num_responses": 7,
              "rvariance": 0.0775655133542337
            },
            {
              "id": "safety_sample_167",
              "variance": 0.40808090996357627,
              "mean_reward": 1.3881831664859205,
              "min_reward": 1.1718817771344785,
              "max_reward": 1.6941281797664363,
              "num_responses": 7,
              "rvariance": 0.030666835677931343
            },
            {
              "id": "safety_sample_1",
              "variance": 0.2461440409304111,
              "mean_reward": -0.8390271286809329,
              "min_reward": -0.9697333158291305,
              "max_reward": -0.6944406384727497,
              "num_responses": 7,
              "rvariance": 0.009205001067325493
            },
            {
              "id": "safety_sample_29",
              "variance": 0.2801507834273756,
              "mean_reward": -0.43881172378468186,
              "min_reward": -0.670150108117775,
              "max_reward": -0.30984057451898256,
              "num_responses": 7,
              "rvariance": 0.014691877430276334
            },
            {
              "id": "safety_sample_179",
              "variance": 0.5141495591802991,
              "mean_reward": 1.2528502116510611,
              "min_reward": 0.7063132786641287,
              "max_reward": 1.4876586717491507,
              "num_responses": 7,
              "rvariance": 0.06642987034793284
            },
            {
              "id": "safety_sample_160",
              "variance": 0.38055164222793847,
              "mean_reward": 2.043641922096351,
              "min_reward": 1.8479682053479431,
              "max_reward": 2.277100908285831,
              "num_responses": 6,
              "rvariance": 0.02594856649793173
            },
            {
              "id": "safety_sample_23",
              "variance": 0.357880480563295,
              "mean_reward": -0.7690472674201724,
              "min_reward": -0.9292490985708393,
              "max_reward": -0.544649034617072,
              "num_responses": 7,
              "rvariance": 0.02289810912307298
            },
            {
              "id": "safety_sample_350",
              "variance": 0.3562611118729633,
              "mean_reward": -0.9144048855761325,
              "min_reward": -1.1640575586689288,
              "max_reward": -0.7268280122793828,
              "num_responses": 6,
              "rvariance": 0.02398180028151188
            },
            {
              "id": "safety_sample_367",
              "variance": 0.3538320588374659,
              "mean_reward": -0.4717774435521477,
              "min_reward": -0.6782469515694333,
              "max_reward": -0.054790005791747476,
              "num_responses": 7,
              "rvariance": 0.03530813636144181
            },
            {
              "id": "safety_sample_303",
              "variance": 0.464353971952601,
              "mean_reward": -0.6853316895896342,
              "min_reward": -1.0830891241523461,
              "max_reward": -0.447486913197173,
              "num_responses": 4,
              "rvariance": 0.0574162568732022
            },
            {
              "id": "safety_sample_18",
              "variance": 0.5175907176472542,
              "mean_reward": 0.014322336527764082,
              "min_reward": -0.2531626703573748,
              "max_reward": 0.3834516460292557,
              "num_responses": 7,
              "rvariance": 0.049374235943904464
            },
            {
              "id": "safety_sample_30",
              "variance": 0.13764633867819043,
              "mean_reward": -0.9130554116675228,
              "min_reward": -1.010217533087422,
              "max_reward": -0.8239901336992819,
              "num_responses": 7,
              "rvariance": 0.0037836835782553077
            },
            {
              "id": "safety_sample_263",
              "variance": 0.6183964186203993,
              "mean_reward": -0.35943374066038936,
              "min_reward": -0.6782469515694333,
              "max_reward": 0.09702580892684486,
              "num_responses": 6,
              "rvariance": 0.08079004412646669
            },
            {
              "id": "safety_sample_295",
              "variance": 0.497146187931817,
              "mean_reward": -0.47293413547381313,
              "min_reward": -0.8320869771509402,
              "max_reward": -0.2572110920832039,
              "num_responses": 7,
              "rvariance": 0.041708154182016156
            },
            {
              "id": "safety_sample_47",
              "variance": 0.6547816088812887,
              "mean_reward": 0.17622305893837717,
              "min_reward": -0.21267845309908348,
              "max_reward": 0.5114829831086019,
              "num_responses": 7,
              "rvariance": 0.06969323524104992
            },
            {
              "id": "safety_sample_375",
              "variance": 0.2655764652143908,
              "mean_reward": -2.5058201878008686,
              "min_reward": -2.751038875193947,
              "max_reward": -2.3785840764176673,
              "num_responses": 7,
              "rvariance": 0.014567449363523237
            },
            {
              "id": "safety_sample_28",
              "variance": 0.24938277831107425,
              "mean_reward": -1.1918181647889,
              "min_reward": -1.3259944277020939,
              "max_reward": -0.9940238461841053,
              "num_responses": 7,
              "rvariance": 0.01132964375553957
            },
            {
              "id": "safety_sample_347",
              "variance": 0.3222543693759986,
              "mean_reward": -0.9454427854741558,
              "min_reward": -1.3583818015087268,
              "max_reward": -0.7835059164409905,
              "num_responses": 7,
              "rvariance": 0.03206765488105484
            },
            {
              "id": "safety_sample_10",
              "variance": 0.18217897766231084,
              "mean_reward": -0.48392270872963516,
              "min_reward": -0.6215690474078255,
              "max_reward": -0.29364688761566604,
              "num_responses": 7,
              "rvariance": 0.008625674692012709
            },
            {
              "id": "safety_sample_365",
              "variance": 0.4473506007041188,
              "mean_reward": 1.008788216179648,
              "min_reward": 0.7731122371403094,
              "max_reward": 1.3297702244418146,
              "num_responses": 7,
              "rvariance": 0.03773833022970683
            },
            {
              "id": "safety_sample_387",
              "variance": 0.14493349778468279,
              "mean_reward": -0.542335650773741,
              "min_reward": -0.6215690474078255,
              "max_reward": -0.3503247917772739,
              "num_responses": 7,
              "rvariance": 0.006859598905839793
            },
            {
              "id": "safety_sample_170",
              "variance": 0.2736733086660492,
              "mean_reward": 1.7033817151397599,
              "min_reward": 1.5483849976365875,
              "max_reward": 1.8317745184446266,
              "num_responses": 7,
              "rvariance": 0.012838835790996438
            },
            {
              "id": "safety_sample_82",
              "variance": 0.2590989904530643,
              "mean_reward": -0.22549845523087572,
              "min_reward": -0.4393900697455147,
              "max_reward": -0.0871773795983805,
              "num_responses": 6,
              "rvariance": 0.013556573524614228
            },
            {
              "id": "safety_sample_286",
              "variance": 0.21051792974311478,
              "mean_reward": -1.1465143978570025,
              "min_reward": -1.2450259931855112,
              "max_reward": -1.0021206896357635,
              "num_responses": 6,
              "rvariance": 0.008553611961596269
            },
            {
              "id": "safety_sample_290",
              "variance": 0.39026785436992784,
              "mean_reward": 1.6704159953722943,
              "min_reward": 1.2204628378444282,
              "max_reward": 1.9289366398645256,
              "num_responses": 7,
              "rvariance": 0.04355183026788453
            },
            {
              "id": "safety_sample_296",
              "variance": 0.5568604083877966,
              "mean_reward": 1.0403803642901361,
              "min_reward": 0.5873908904678982,
              "max_reward": 1.3662060199742767,
              "num_responses": 7,
              "rvariance": 0.05768598690197937
            },
            {
              "id": "safety_sample_183",
              "variance": 0.39188722306026014,
              "mean_reward": 2.4656416915173014,
              "min_reward": 2.1718419434142735,
              "max_reward": 2.7386209850303516,
              "num_responses": 7,
              "rvariance": 0.030676201231342872
            },
            {
              "id": "safety_sample_304",
              "variance": 0.3141575259243403,
              "mean_reward": -1.0125309169307528,
              "min_reward": -1.334091271153752,
              "max_reward": -0.8644743509575732,
              "num_responses": 7,
              "rvariance": 0.02207862319956471
            },
            {
              "id": "safety_sample_353",
              "variance": 0.36759669270528494,
              "mean_reward": -0.9951805381057708,
              "min_reward": -1.1964449324755617,
              "max_reward": -0.7996996033443071,
              "num_responses": 7,
              "rvariance": 0.021530069356889798
            },
            {
              "id": "safety_sample_141",
              "variance": 0.18622739938814004,
              "mean_reward": 1.3452891743908264,
              "min_reward": 1.248801789925232,
              "max_reward": 1.5079007803782962,
              "num_responses": 6,
              "rvariance": 0.007579789522493945
            },
            {
              "id": "safety_sample_156",
              "variance": 0.5149592435254651,
              "mean_reward": -0.6955973303944152,
              "min_reward": -0.9778301592807888,
              "max_reward": -0.34627637005144474,
              "num_responses": 7,
              "rvariance": 0.04912098970723663
            },
            {
              "id": "safety_sample_372",
              "variance": 0.17003371248482324,
              "mean_reward": -1.2380858416555183,
              "min_reward": -1.3502849580570686,
              "max_reward": -1.1559607152172704,
              "num_responses": 7,
              "rvariance": 0.0047844598570866235
            },
            {
              "id": "safety_sample_85",
              "variance": 0.6022533369886558,
              "mean_reward": 0.288946301366932,
              "min_reward": -0.06693527096923486,
              "max_reward": 0.5889090486150841,
              "num_responses": 7,
              "rvariance": 0.05957120760546071
            },
            {
              "id": "safety_sample_98",
              "variance": 0.21942445753993883,
              "mean_reward": -0.38097712770140874,
              "min_reward": -0.544649034617072,
              "max_reward": -0.20863003137325437,
              "num_responses": 7,
              "rvariance": 0.009917452094702062
            },
            {
              "id": "safety_sample_382",
              "variance": 0.47204597323167635,
              "mean_reward": -0.37808539789724505,
              "min_reward": -0.7835059164409905,
              "max_reward": -0.11956475340501353,
              "num_responses": 7,
              "rvariance": 0.048866781828923865
            },
            {
              "id": "safety_sample_148",
              "variance": 0.3692160613956166,
              "mean_reward": 2.198445857612579,
              "min_reward": 1.7022250232180944,
              "max_reward": 2.3823598731573883,
              "num_responses": 7,
              "rvariance": 0.045829666651187144
            },
            {
              "id": "safety_sample_37",
              "variance": 0.7408611758267307,
              "mean_reward": 0.5132963386732962,
              "min_reward": 0.14155844791096528,
              "max_reward": 1.0220901732788008,
              "num_responses": 6,
              "rvariance": 0.10042241753376364
            },
            {
              "id": "safety_sample_271",
              "variance": 0.44694575853153584,
              "mean_reward": -0.2725950946413546,
              "min_reward": -0.5163100825362682,
              "max_reward": -0.006208945081797929,
              "num_responses": 5,
              "rvariance": 0.040544229962756126
            },
            {
              "id": "safety_sample_111",
              "variance": 0.432371440318551,
              "mean_reward": 1.8826689629979074,
              "min_reward": 1.5402881541849294,
              "max_reward": 2.123260882704324,
              "num_responses": 7,
              "rvariance": 0.036351726598725806
            },
            {
              "id": "safety_sample_209",
              "variance": 0.6361715202603679,
              "mean_reward": 0.09733757354635622,
              "min_reward": -0.2774532007123496,
              "max_reward": 0.4772295399127195,
              "num_responses": 7,
              "rvariance": 0.06577036036342929
            },
            {
              "id": "safety_sample_7",
              "variance": 0.4605079713130634,
              "mean_reward": 0.11596663914411685,
              "min_reward": -0.23696898345405826,
              "max_reward": 0.30248321151267316,
              "num_responses": 7,
              "rvariance": 0.04006633922057114
            },
            {
              "id": "safety_sample_49",
              "variance": 0.1497916038556778,
              "mean_reward": -0.3989058524872234,
              "min_reward": -0.5001163956329516,
              "max_reward": -0.3138889962448117,
              "num_responses": 6,
              "rvariance": 0.004359665113063969
            },
            {
              "id": "safety_sample_358",
              "variance": 0.380551642227938,
              "mean_reward": -0.43264270020246615,
              "min_reward": -0.6863437950210916,
              "max_reward": -0.196484766195767,
              "num_responses": 6,
              "rvariance": 0.026959265803591894
            },
            {
              "id": "safety_sample_335",
              "variance": 0.21456635146894387,
              "mean_reward": -0.5972785170528506,
              "min_reward": -0.702537481924408,
              "max_reward": -0.3665184786805904,
              "num_responses": 7,
              "rvariance": 0.011102863569360546
            },
            {
              "id": "safety_sample_132",
              "variance": 0.43682470421696284,
              "mean_reward": 1.1111554512470416,
              "min_reward": 0.8135964543986007,
              "max_reward": 1.3257218027159854,
              "num_responses": 7,
              "rvariance": 0.03154669597253888
            },
            {
              "id": "safety_sample_38",
              "variance": 0.34168679365997834,
              "mean_reward": -0.7673122295376741,
              "min_reward": -1.0911859676040043,
              "max_reward": -0.5891816736011924,
              "num_responses": 7,
              "rvariance": 0.026036238484034017
            },
            {
              "id": "safety_sample_53",
              "variance": 0.2291406696819287,
              "mean_reward": 0.06434926213979546,
              "min_reward": -0.11146790995335527,
              "max_reward": 0.20633319552423132,
              "num_responses": 7,
              "rvariance": 0.010688939556976276
            },
            {
              "id": "safety_sample_219",
              "variance": 0.3758959572432346,
              "mean_reward": 0.13062770925122663,
              "min_reward": -0.20458160964742525,
              "max_reward": 0.31462847669016053,
              "num_responses": 5,
              "rvariance": 0.033361026100244426
            },
            {
              "id": "safety_sample_270",
              "variance": 0.450994180257365,
              "mean_reward": 0.030516023431080598,
              "min_reward": -0.2572110920832039,
              "max_reward": 0.305519527807045,
              "num_responses": 7,
              "rvariance": 0.03949269907411535
            },
            {
              "id": "safety_sample_112",
              "variance": 0.4078784888772846,
              "mean_reward": 1.023777015664563,
              "min_reward": 0.6557080070912646,
              "max_reward": 1.2366565247477446,
              "num_responses": 6,
              "rvariance": 0.03582849366322823
            },
            {
              "id": "safety_sample_362",
              "variance": 0.16679497510416008,
              "mean_reward": -0.6707284540786077,
              "min_reward": -0.7673122295376741,
              "max_reward": -0.544649034617072,
              "num_responses": 7,
              "rvariance": 0.005377834562516683
            },
            {
              "id": "safety_sample_258",
              "variance": 0.4079796994204306,
              "mean_reward": 0.6553465408657442,
              "min_reward": 0.42545402143473293,
              "max_reward": 0.9816059560205095,
              "num_responses": 7,
              "rvariance": 0.0344782396218645
            },
            {
              "id": "safety_sample_78",
              "variance": 0.40372885660831,
              "mean_reward": 0.5647992513728695,
              "min_reward": 0.3419553233395071,
              "max_reward": 0.7690638154144803,
              "num_responses": 7,
              "rvariance": 0.024790523193505644
            },
            {
              "id": "safety_sample_12",
              "variance": 0.019432424283979843,
              "mean_reward": -0.8344003609942712,
              "min_reward": -0.8482806640542566,
              "max_reward": -0.8239901336992819,
              "num_responses": 7,
              "rvariance": 6.95726824855997e-05
            },
            {
              "id": "safety_sample_173",
              "variance": 0.858265405875775,
              "mean_reward": 1.7831934577346769,
              "min_reward": 1.2366565247477446,
              "max_reward": 2.220423004124223,
              "num_responses": 6,
              "rvariance": 0.13405150736748203
            },
            {
              "id": "safety_sample_67",
              "variance": 0.45726923393240015,
              "mean_reward": 0.45903423378558345,
              "min_reward": 0.050468959079809875,
              "max_reward": 0.7275674927247318,
              "num_responses": 7,
              "rvariance": 0.04689363167082316
            },
            {
              "id": "safety_sample_154",
              "variance": 0.1918445845327279,
              "mean_reward": 0.4708406243766455,
              "min_reward": 0.3419553233395071,
              "max_reward": 0.5828364160263404,
              "num_responses": 7,
              "rvariance": 0.006450888753418575
            },
            {
              "id": "safety_sample_17",
              "variance": 0.7655565483542883,
              "mean_reward": 0.18568624472250278,
              "min_reward": -0.2774532007123496,
              "max_reward": 0.8257417195760881,
              "num_responses": 5,
              "rvariance": 0.13547151257573714
            },
            {
              "id": "safety_sample_249",
              "variance": 0.1457431821298485,
              "mean_reward": -0.6526069473058488,
              "min_reward": -0.7268280122793828,
              "max_reward": -0.5163100825362682,
              "num_responses": 6,
              "rvariance": 0.004991579814080338
            },
            {
              "id": "safety_sample_266",
              "variance": 0.31739626330500365,
              "mean_reward": -0.5897600195620252,
              "min_reward": -0.7754090729893324,
              "max_reward": -0.37056690040641954,
              "num_responses": 7,
              "rvariance": 0.018405319357945215
            },
            {
              "id": "safety_sample_133",
              "variance": 0.7125222237459266,
              "mean_reward": 2.1097661436182267,
              "min_reward": 1.6698376494114615,
              "max_reward": 2.471425151125629,
              "num_responses": 6,
              "rvariance": 0.09957664510540427
            },
            {
              "id": "safety_sample_125",
              "variance": 0.23076003837226033,
              "mean_reward": 1.6347513277876091,
              "min_reward": 1.4512228762166886,
              "max_reward": 1.783193457734677,
              "num_responses": 6,
              "rvariance": 0.010809929870989022
            },
            {
              "id": "safety_sample_182",
              "variance": 0.380551642227938,
              "mean_reward": 1.916213028726206,
              "min_reward": 1.6050629017981954,
              "max_reward": 2.1556482565109567,
              "num_responses": 7,
              "rvariance": 0.030360448287754357
            },
            {
              "id": "safety_sample_117",
              "variance": 0.4718941574169577,
              "mean_reward": 0.8836847555270175,
              "min_reward": 0.5863787850364408,
              "max_reward": 1.1921238857636243,
              "num_responses": 6,
              "rvariance": 0.04318739900680851
            },
            {
              "id": "safety_sample_242",
              "variance": 0.6740622173505499,
              "mean_reward": 1.4093891850497873,
              "min_reward": 1.0058964863754842,
              "max_reward": 1.8965492660578926,
              "num_responses": 6,
              "rvariance": 0.08944779909084215
            },
            {
              "id": "safety_sample_70",
              "variance": 0.4574716550186916,
              "mean_reward": 0.05928873498250905,
              "min_reward": -0.2410174051798874,
              "max_reward": 0.3409432179080499,
              "num_responses": 7,
              "rvariance": 0.039893954503090294
            },
            {
              "id": "safety_sample_31",
              "variance": 0.43510412498348566,
              "mean_reward": 0.12735282524801125,
              "min_reward": -0.17219423584079221,
              "max_reward": 0.42975546951842636,
              "num_responses": 7,
              "rvariance": 0.038215636356487455
            },
            {
              "id": "safety_sample_59",
              "variance": 0.364674238271952,
              "mean_reward": 0.252658104543224,
              "min_reward": 0.003912109232774893,
              "max_reward": 0.44101514244338863,
              "num_responses": 6,
              "rvariance": 0.028010500585654016
            },
            {
              "id": "safety_sample_149",
              "variance": 0.2902718377419484,
              "mean_reward": 1.0336570924954553,
              "min_reward": 0.8905164671893542,
              "max_reward": 1.2123659943927698,
              "num_responses": 7,
              "rvariance": 0.012899544646146111
            },
            {
              "id": "safety_sample_309",
              "variance": 0.5659693572709122,
              "mean_reward": -0.5030081254371153,
              "min_reward": -0.7996996033443071,
              "max_reward": -0.16814581411496307,
              "num_responses": 7,
              "rvariance": 0.05778880938960119
            }
          ]
        }
      },
      "overall_stats": {
        "mean_variance_across_files": 0.5592522645511759,
        "mean_rvariance_across_files": 0.101378068730528,
        "total_processed_files": 4
      }
    }
  },
  "summary": {
    "model_comparison": {
      "GRM-gemma2-2B-rewardmodel-ft": {
        "mean_variance": 0.5592522645511759,
        "mean_rvariance": 0.101378068730528
      }
    }
  }
}