{
  "models": {
    "Eurus-RM-7b": {
      "model_name": "Eurus-RM-7b",
      "model_path": "openbmb/Eurus-RM-7b",
      "files": {
        "semantic_benchmark_chat_filtered.json": {
          "file_name": "semantic_benchmark_chat_filtered.json",
          "processed_samples": 200,
          "global_mean": -2.62361664539602,
          "global_std": 4.547933775340323,
          "mean_variance": 0.5579957609990567,
          "mean_rvariance": 0.13023354532967765,
          "sample_results": [
            {
              "id": "chat_sample_306",
              "variance": 0.8854467377767972,
              "mean_reward": 0.8870076198396916,
              "min_reward": 0.5012972391457958,
              "max_reward": 1.9580027074448036,
              "num_responses": 7,
              "rvariance": 0.22262433784958674
            },
            {
              "id": "chat_sample_202",
              "variance": 0.3463111113314623,
              "mean_reward": -0.47736539690144875,
              "min_reward": -0.6393306275411632,
              "max_reward": -0.08275919861559884,
              "num_responses": 7,
              "rvariance": 0.031739442488067385
            },
            {
              "id": "chat_sample_298",
              "variance": 0.773702998728624,
              "mean_reward": -0.9239967904836915,
              "min_reward": -1.402039622735455,
              "max_reward": -0.5912318620784601,
              "num_responses": 7,
              "rvariance": 0.09707027671927394
            },
            {
              "id": "chat_sample_268",
              "variance": 0.42945326305984904,
              "mean_reward": -0.14361886103779462,
              "min_reward": -0.5019055833620115,
              "max_reward": 0.05123021945907404,
              "num_responses": 7,
              "rvariance": 0.03516680122911339
            },
            {
              "id": "chat_sample_303",
              "variance": 0.42679065282887807,
              "mean_reward": 1.1785757102242531,
              "min_reward": 0.614458173962066,
              "max_reward": 1.635053853623797,
              "num_responses": 7,
              "rvariance": 0.07563257860770121
            },
            {
              "id": "chat_sample_65",
              "variance": 0.20201481494335294,
              "mean_reward": 1.2114902353144832,
              "min_reward": 1.0990961813251054,
              "max_reward": 1.4083025307281969,
              "num_responses": 7,
              "rvariance": 0.008902268037257277
            },
            {
              "id": "chat_sample_212",
              "variance": 0.4418215170359726,
              "mean_reward": 1.0260891266049312,
              "min_reward": 0.7855952992914158,
              "max_reward": 1.2846199909669602,
              "num_responses": 7,
              "rvariance": 0.030560806144231584
            },
            {
              "id": "chat_sample_262",
              "variance": 0.35867936530758593,
              "mean_reward": 1.6512503766877684,
              "min_reward": 1.4460944178774635,
              "max_reward": 1.9923589684895915,
              "num_responses": 7,
              "rvariance": 0.028755799996740713
            },
            {
              "id": "chat_sample_178",
              "variance": 0.4754906528598649,
              "mean_reward": -0.6452202722916983,
              "min_reward": -1.1684170476308973,
              "max_reward": -0.41257930464556286,
              "num_responses": 7,
              "rvariance": 0.05849731491956804
            },
            {
              "id": "chat_sample_290",
              "variance": 0.3887551851569695,
              "mean_reward": 0.37160570880533905,
              "min_reward": 0.21270464636957728,
              "max_reward": 0.6473113485861445,
              "num_responses": 7,
              "rvariance": 0.02594994984101898
            },
            {
              "id": "chat_sample_292",
              "variance": 0.24461657863889,
              "mean_reward": -0.12251430068171058,
              "min_reward": -0.3095105215111991,
              "max_reward": 0.013438332309807333,
              "num_responses": 7,
              "rvariance": 0.012069467413646992
            },
            {
              "id": "chat_sample_116",
              "variance": 0.29752522064786335,
              "mean_reward": 1.4799598751930403,
              "min_reward": 1.3017981214893544,
              "max_reward": 1.669410114668585,
              "num_responses": 7,
              "rvariance": 0.01458385949538991
            },
            {
              "id": "chat_sample_106",
              "variance": 0.4625211643154573,
              "mean_reward": 0.8440009430675554,
              "min_reward": 0.6511764279536831,
              "max_reward": 1.4323519134595484,
              "num_responses": 6,
              "rvariance": 0.07245293647234653
            },
            {
              "id": "chat_sample_251",
              "variance": 0.26488677265531485,
              "mean_reward": 0.13196743291432564,
              "min_reward": -0.010611050421544211,
              "max_reward": 0.31405561645170166,
              "num_responses": 7,
              "rvariance": 0.011881092762571792
            },
            {
              "id": "chat_sample_280",
              "variance": 0.5283992948688382,
              "mean_reward": -0.34435758628519825,
              "min_reward": -0.8866957070636363,
              "max_reward": -0.12742233797382313,
              "num_responses": 7,
              "rvariance": 0.06279957996842114
            },
            {
              "id": "chat_sample_58",
              "variance": 0.1985791888388742,
              "mean_reward": 0.007303285694666632,
              "min_reward": -0.10680858134695038,
              "max_reward": 0.14227431122776205,
              "num_responses": 7,
              "rvariance": 0.006845925059119846
            },
            {
              "id": "chat_sample_90",
              "variance": 0.5909276899703523,
              "mean_reward": -0.8443229851083979,
              "min_reward": -1.1959020564667275,
              "max_reward": -0.48816307894409633,
              "num_responses": 6,
              "rvariance": 0.06398167239023646
            },
            {
              "id": "chat_sample_180",
              "variance": 0.6410019404431305,
              "mean_reward": 0.9058422129481736,
              "min_reward": 0.6254092321700921,
              "max_reward": 1.2949268692803966,
              "num_responses": 5,
              "rvariance": 0.08754919223213746
            },
            {
              "id": "chat_sample_291",
              "variance": 0.36975925949453003,
              "mean_reward": 0.22659030187517903,
              "min_reward": 0.01000270620532854,
              "max_reward": 0.46865879115324727,
              "num_responses": 6,
              "rvariance": 0.02743789215814786
            },
            {
              "id": "chat_sample_129",
              "variance": 0.5357858909934674,
              "mean_reward": 0.7519752438404448,
              "min_reward": 0.02374521062324371,
              "max_reward": 0.9651067632504327,
              "num_responses": 7,
              "rvariance": 0.09664694564199351
            },
            {
              "id": "chat_sample_31",
              "variance": 0.6458977076420129,
              "mean_reward": -1.12260869957118,
              "min_reward": -1.5257221624966917,
              "max_reward": -0.7561419150934421,
              "num_responses": 6,
              "rvariance": 0.07545863488048879
            },
            {
              "id": "chat_sample_294",
              "variance": 0.9722821875674982,
              "mean_reward": 0.4713275364308335,
              "min_reward": -0.39196554801869016,
              "max_reward": 0.9359039413623629,
              "num_responses": 7,
              "rvariance": 0.18975794649562258
            },
            {
              "id": "chat_sample_128",
              "variance": 0.3353171077971302,
              "mean_reward": -1.2292767100530928,
              "min_reward": -1.402039622735455,
              "max_reward": -0.9347944725263394,
              "num_responses": 7,
              "rvariance": 0.024381750234306523
            },
            {
              "id": "chat_sample_173",
              "variance": 0.6158359792278234,
              "mean_reward": 0.6984776373564178,
              "min_reward": -0.39196554801869016,
              "max_reward": 0.9788492676683478,
              "num_responses": 7,
              "rvariance": 0.2009381502823583
            },
            {
              "id": "chat_sample_174",
              "variance": 0.3449368608896707,
              "mean_reward": -0.00594841499403728,
              "min_reward": -0.20987736448131414,
              "max_reward": 0.19380870279494392,
              "num_responses": 7,
              "rvariance": 0.02186916481481816
            },
            {
              "id": "chat_sample_297",
              "variance": 1.4192571437601889,
              "mean_reward": 0.4603151277566559,
              "min_reward": -1.2508720741383883,
              "max_reward": 1.1300168162654147,
              "num_responses": 7,
              "rvariance": 0.5706747423365105
            },
            {
              "id": "chat_sample_264",
              "variance": 0.37104761928370955,
              "mean_reward": -1.465255143057865,
              "min_reward": -1.8143147552729102,
              "max_reward": -1.2233870653025578,
              "num_responses": 5,
              "rvariance": 0.037061185367220265
            },
            {
              "id": "chat_sample_275",
              "variance": 0.4452571431404515,
              "mean_reward": -2.142171646386029,
              "min_reward": -2.432727454079093,
              "max_reward": -1.6906322155116735,
              "num_responses": 7,
              "rvariance": 0.04772286300998791
            },
            {
              "id": "chat_sample_172",
              "variance": 1.121216579196654,
              "mean_reward": 0.003990360522490648,
              "min_reward": -0.5156480877799267,
              "max_reward": 0.9255970630489265,
              "num_responses": 7,
              "rvariance": 0.24415489651910383
            },
            {
              "id": "chat_sample_145",
              "variance": 0.765457496077875,
              "mean_reward": 0.8262093078836471,
              "min_reward": 0.3346693730785744,
              "max_reward": 1.5113713138625606,
              "num_responses": 7,
              "rvariance": 0.12152778632412156
            },
            {
              "id": "chat_sample_270",
              "variance": 0.46020211669493427,
              "mean_reward": 0.4161427921276429,
              "min_reward": 0.17834838532478936,
              "max_reward": 0.7297663750936355,
              "num_responses": 7,
              "rvariance": 0.04080193135626633
            },
            {
              "id": "chat_sample_278",
              "variance": 0.5809643742673638,
              "mean_reward": 0.0384693224995814,
              "min_reward": -0.33699553034702945,
              "max_reward": 0.48927254778012,
              "num_responses": 7,
              "rvariance": 0.0678229441451433
            },
            {
              "id": "chat_sample_165",
              "variance": 0.24324232819709848,
              "mean_reward": 0.07331638727358057,
              "min_reward": -0.02435355483945938,
              "max_reward": 0.22301152468301366,
              "num_responses": 7,
              "rvariance": 0.010113454412712665
            },
            {
              "id": "chat_sample_127",
              "variance": 1.8060227524718893,
              "mean_reward": 1.346890714110638,
              "min_reward": 0.5545494437652171,
              "max_reward": 2.693226693803265,
              "num_responses": 7,
              "rvariance": 0.6290363392819641
            },
            {
              "id": "chat_sample_256",
              "variance": 0.3868514993643122,
              "mean_reward": -0.2550313075687497,
              "min_reward": -0.46754932231722357,
              "max_reward": 0.26767466404123796,
              "num_responses": 7,
              "rvariance": 0.05116130261286185
            },
            {
              "id": "chat_sample_114",
              "variance": 0.3944098767941655,
              "mean_reward": -0.8729532026457212,
              "min_reward": -1.2371295697204732,
              "max_reward": -0.6118456187053328,
              "num_responses": 7,
              "rvariance": 0.037636388086943307
            },
            {
              "id": "chat_sample_119",
              "variance": 0.606044444830059,
              "mean_reward": 0.026321930201602794,
              "min_reward": -0.2682830082574536,
              "max_reward": 0.7237540294107976,
              "num_responses": 7,
              "rvariance": 0.10057342494189865
            },
            {
              "id": "chat_sample_179",
              "variance": 0.574436684668854,
              "mean_reward": -1.955666229285752,
              "min_reward": -2.309044914317856,
              "max_reward": -1.4295246315712855,
              "num_responses": 7,
              "rvariance": 0.07212773852115276
            },
            {
              "id": "chat_sample_191",
              "variance": 0.3493172841728812,
              "mean_reward": 0.43853571227290644,
              "min_reward": 0.2436252813098864,
              "max_reward": 0.7606870100339446,
              "num_responses": 7,
              "rvariance": 0.026075699347457883
            },
            {
              "id": "chat_sample_156",
              "variance": 0.45135537947590126,
              "mean_reward": -0.27014397239737964,
              "min_reward": -0.4538068178993084,
              "max_reward": 0.35957766233604566,
              "num_responses": 6,
              "rvariance": 0.08073573347922447
            },
            {
              "id": "chat_sample_166",
              "variance": 0.3703604940628138,
              "mean_reward": 0.1349122552895932,
              "min_reward": -0.07588794640664126,
              "max_reward": 0.324362494765138,
              "num_responses": 7,
              "rvariance": 0.02432261215650734
            },
            {
              "id": "chat_sample_245",
              "variance": 0.5551971784837728,
              "mean_reward": 1.730269777090781,
              "min_reward": 1.4289162873550696,
              "max_reward": 2.0748139949970823,
              "num_responses": 7,
              "rvariance": 0.047826926755850395
            },
            {
              "id": "chat_sample_161",
              "variance": 0.21060388020454995,
              "mean_reward": 0.3089021772949835,
              "min_reward": 0.18350182448150754,
              "max_reward": 0.43687924968681846,
              "num_responses": 7,
              "rvariance": 0.008392939836659917
            },
            {
              "id": "chat_sample_296",
              "variance": 0.31813897727473606,
              "mean_reward": -1.214798000041361,
              "min_reward": -1.4432671359892006,
              "max_reward": -1.0447345078696608,
              "num_responses": 4,
              "rvariance": 0.022836873340434348
            },
            {
              "id": "chat_sample_130",
              "variance": 0.5634426811345221,
              "mean_reward": -1.8516158386929653,
              "min_reward": -2.1716198701387044,
              "max_reward": -1.484494649242946,
              "num_responses": 7,
              "rvariance": 0.059771132253181425
            },
            {
              "id": "chat_sample_18",
              "variance": 0.17195308652916363,
              "mean_reward": 0.7009316560024742,
              "min_reward": 0.5665741351308928,
              "max_reward": 0.8173748407578447,
              "num_responses": 7,
              "rvariance": 0.00601154820789001
            },
            {
              "id": "chat_sample_44",
              "variance": 1.6671375671983344,
              "mean_reward": 1.195048310385906,
              "min_reward": 0.6619127595301794,
              "max_reward": 3.0505318086690596,
              "num_responses": 7,
              "rvariance": 0.7374037729398587
            },
            {
              "id": "chat_sample_215",
              "variance": 0.2860158731978595,
              "mean_reward": 0.22988277689197123,
              "min_reward": 0.08215085439938317,
              "max_reward": 0.43258471705622,
              "num_responses": 6,
              "rvariance": 0.015306223286837181
            },
            {
              "id": "chat_sample_300",
              "variance": 0.8507469141215607,
              "mean_reward": 0.6756552639480945,
              "min_reward": -0.1480360946006959,
              "max_reward": 1.0990961813251054,
              "num_responses": 6,
              "rvariance": 0.17329987126018667
            },
            {
              "id": "chat_sample_169",
              "variance": 0.7524021168808555,
              "mean_reward": -0.36791616528733856,
              "min_reward": -0.7698844195113572,
              "max_reward": 0.04435896725011646,
              "num_responses": 6,
              "rvariance": 0.09850436506889164
            },
            {
              "id": "chat_sample_82",
              "variance": 0.5400804236240662,
              "mean_reward": 0.051475621323679666,
              "min_reward": -0.3988368002276477,
              "max_reward": 0.33295156002633497,
              "num_responses": 7,
              "rvariance": 0.05965032677042666
            },
            {
              "id": "chat_sample_77",
              "variance": 0.22675132289560027,
              "mean_reward": 0.02832604542921543,
              "min_reward": -0.16864985122756865,
              "max_reward": 0.13368524596656506,
              "num_responses": 6,
              "rvariance": 0.010696618223117115
            },
            {
              "id": "chat_sample_277",
              "variance": 1.018319577367514,
              "mean_reward": -1.8294315101326166,
              "min_reward": -2.377757436407432,
              "max_reward": -1.0928332733323638,
              "num_responses": 5,
              "rvariance": 0.20926047612257803
            },
            {
              "id": "chat_sample_73",
              "variance": 0.30233509719413343,
              "mean_reward": -2.068551087004341,
              "min_reward": -2.281559905482026,
              "max_reward": -1.7730872420191646,
              "num_responses": 6,
              "rvariance": 0.023213602568559713
            },
            {
              "id": "chat_sample_6",
              "variance": 0.2099167549836542,
              "mean_reward": 0.09393014390045332,
              "min_reward": -0.09306607692903522,
              "max_reward": 0.1972443288994227,
              "num_responses": 7,
              "rvariance": 0.009173387819591209
            },
            {
              "id": "chat_sample_80",
              "variance": 1.8770543221819884,
              "mean_reward": -0.9858994108304613,
              "min_reward": -1.8143147552729102,
              "max_reward": 0.8671914192727872,
              "num_responses": 4,
              "rvariance": 1.1612993832443865
            },
            {
              "id": "chat_sample_224",
              "variance": 0.5442031749494407,
              "mean_reward": -1.7809401016865445,
              "min_reward": -2.1716198701387044,
              "max_reward": -1.5119796580787765,
              "num_responses": 7,
              "rvariance": 0.05130728092303007
            },
            {
              "id": "chat_sample_267",
              "variance": 0.5128423504144951,
              "mean_reward": 0.3888495034985357,
              "min_reward": 0.006567080100849749,
              "max_reward": 0.7143060576234809,
              "num_responses": 7,
              "rvariance": 0.05030222330155939
            },
            {
              "id": "chat_sample_308",
              "variance": 1.0770687837541013,
              "mean_reward": 1.214189655825145,
              "min_reward": 0.4772478564144443,
              "max_reward": 1.8274489154746094,
              "num_responses": 7,
              "rvariance": 0.20946116980134638
            },
            {
              "id": "chat_sample_252",
              "variance": 0.7049904766390485,
              "mean_reward": 0.23994425334080197,
              "min_reward": -0.12742233797382313,
              "max_reward": 1.2846199909669602,
              "num_responses": 7,
              "rvariance": 0.1949794469454141
            },
            {
              "id": "chat_sample_159",
              "variance": 0.2717580248642725,
              "mean_reward": 0.1631334697192404,
              "min_reward": -0.031224807048416965,
              "max_reward": 0.30546655119050464,
              "num_responses": 7,
              "rvariance": 0.013771704589891133
            },
            {
              "id": "chat_sample_188",
              "variance": 0.40879656110667034,
              "mean_reward": 0.46402683095881603,
              "min_reward": 0.17147713311583176,
              "max_reward": 0.7280485620413961,
              "num_responses": 7,
              "rvariance": 0.031125265772690685
            },
            {
              "id": "chat_sample_88",
              "variance": 0.15529029992244137,
              "mean_reward": -0.36938857647497236,
              "min_reward": -0.46067807010826595,
              "max_reward": -0.2270554950037081,
              "num_responses": 7,
              "rvariance": 0.0052031872931258
            },
            {
              "id": "chat_sample_27",
              "variance": 0.48579753117330116,
              "mean_reward": -0.38264027716367627,
              "min_reward": -0.7011718974217814,
              "max_reward": -0.048402937570810926,
              "num_responses": 7,
              "rvariance": 0.04720977092969354
            },
            {
              "id": "chat_sample_167",
              "variance": 0.22537707245380867,
              "mean_reward": 1.6134584895385018,
              "min_reward": 1.4564012961908999,
              "max_reward": 1.7106376279223305,
              "num_responses": 7,
              "rvariance": 0.00838291286114712
            },
            {
              "id": "chat_sample_76",
              "variance": 0.5960811291270705,
              "mean_reward": 0.05981928472027103,
              "min_reward": -0.2373623733171445,
              "max_reward": 0.7589691969817052,
              "num_responses": 6,
              "rvariance": 0.10622682243184768
            },
            {
              "id": "chat_sample_209",
              "variance": 0.19651781317618688,
              "mean_reward": -1.1586009730466722,
              "min_reward": -1.2783570829742186,
              "max_reward": -0.9828932379890425,
              "num_responses": 7,
              "rvariance": 0.007957022345672747
            },
            {
              "id": "chat_sample_61",
              "variance": 0.36134197553855696,
              "mean_reward": 0.34675541491040157,
              "min_reward": 0.1165071154441711,
              "max_reward": 0.5811755460749277,
              "num_responses": 7,
              "rvariance": 0.023442669777665685
            },
            {
              "id": "chat_sample_118",
              "variance": 0.5391785717716405,
              "mean_reward": 0.691851787012066,
              "min_reward": 0.43859706273905785,
              "max_reward": 1.239956851608736,
              "num_responses": 7,
              "rvariance": 0.06784861945049633
            },
            {
              "id": "chat_sample_150",
              "variance": 0.2748500883583034,
              "mean_reward": -0.3203082035538468,
              "min_reward": -0.5225193399888842,
              "max_reward": -0.1446004684962171,
              "num_responses": 7,
              "rvariance": 0.01429720241766678
            },
            {
              "id": "chat_sample_120",
              "variance": 2.49976155361877,
              "mean_reward": 2.5219361923085364,
              "min_reward": 1.4186094090416332,
              "max_reward": 4.69963233881888,
              "num_responses": 7,
              "rvariance": 1.2566049009817697
            },
            {
              "id": "chat_sample_244",
              "variance": 0.26282539699262764,
              "mean_reward": 0.9625300436720736,
              "min_reward": 0.8397064104369568,
              "max_reward": 1.126581190160936,
              "num_responses": 6,
              "rvariance": 0.013562989932933365
            },
            {
              "id": "chat_sample_8",
              "variance": 0.4115021166639474,
              "mean_reward": 0.9391248408353119,
              "min_reward": 0.6148876272251259,
              "max_reward": 1.3189762520117483,
              "num_responses": 7,
              "rvariance": 0.04013100286281834
            },
            {
              "id": "chat_sample_40",
              "variance": 0.515000353061371,
              "mean_reward": -0.03380152662677606,
              "min_reward": -0.29920364319776277,
              "max_reward": 0.4317258105301003,
              "num_responses": 7,
              "rvariance": 0.05756010887501629
            },
            {
              "id": "chat_sample_286",
              "variance": 0.6307809527823063,
              "mean_reward": 0.6308694236575674,
              "min_reward": 0.10620023713073472,
              "max_reward": 1.044126163653445,
              "num_responses": 7,
              "rvariance": 0.0821598027992976
            },
            {
              "id": "chat_sample_307",
              "variance": 0.4728280426288938,
              "mean_reward": 0.5774331676396918,
              "min_reward": 0.13712087207104384,
              "max_reward": 0.9307505022056447,
              "num_responses": 7,
              "rvariance": 0.05391570224736335
            },
            {
              "id": "chat_sample_206",
              "variance": 0.659983774670376,
              "mean_reward": 0.6597654932148801,
              "min_reward": 0.21957589857853485,
              "max_reward": 1.1506305728922874,
              "num_responses": 7,
              "rvariance": 0.08331630000275565
            },
            {
              "id": "chat_sample_261",
              "variance": 0.6871252208957586,
              "mean_reward": -2.578005357925625,
              "min_reward": -2.9686851263777845,
              "max_reward": -2.0754223392132984,
              "num_responses": 7,
              "rvariance": 0.08373662750403787
            },
            {
              "id": "chat_sample_79",
              "variance": 0.45590758406433585,
              "mean_reward": 1.0835131629226482,
              "min_reward": 0.7563924774033461,
              "max_reward": 1.3189762520117483,
              "num_responses": 7,
              "rvariance": 0.038182813085834204
            },
            {
              "id": "chat_sample_69",
              "variance": 0.1498791888078873,
              "mean_reward": 0.4942112603053083,
              "min_reward": 0.4179833061121851,
              "max_reward": 0.6052249288062793,
              "num_responses": 6,
              "rvariance": 0.004550981905573878
            },
            {
              "id": "chat_sample_203",
              "variance": 0.3461393300262383,
              "mean_reward": 0.22301152468301363,
              "min_reward": 0.05466584556355284,
              "max_reward": 0.44031487579129724,
              "num_responses": 6,
              "rvariance": 0.02171922690320867
            },
            {
              "id": "chat_sample_168",
              "variance": 0.6156641979225995,
              "mean_reward": -0.5313538071146867,
              "min_reward": -0.9210519681084242,
              "max_reward": -0.17552110343652624,
              "num_responses": 7,
              "rvariance": 0.07294531341341519
            },
            {
              "id": "chat_sample_265",
              "variance": 0.6424620815375339,
              "mean_reward": -1.4581548491086087,
              "min_reward": -1.8692847729445707,
              "max_reward": -1.0653482644965335,
              "num_responses": 6,
              "rvariance": 0.07866525964207792
            },
            {
              "id": "chat_sample_301",
              "variance": 1.0932162264451522,
              "mean_reward": -0.5816611893588407,
              "min_reward": -1.072219516705491,
              "max_reward": 0.9393395674668417,
              "num_responses": 7,
              "rvariance": 0.4121318188527128
            },
            {
              "id": "chat_sample_196",
              "variance": 0.5411970021080218,
              "mean_reward": 1.0729302075115306,
              "min_reward": 0.6307773979583403,
              "max_reward": 1.3498968869520573,
              "num_responses": 7,
              "rvariance": 0.05655249381491269
            },
            {
              "id": "chat_sample_225",
              "variance": 0.569483209687748,
              "mean_reward": 0.8333192517499751,
              "min_reward": 0.4746711368360852,
              "max_reward": 1.239956851608736,
              "num_responses": 7,
              "rvariance": 0.06160434306810051
            },
            {
              "id": "chat_sample_126",
              "variance": 0.26523033526576273,
              "mean_reward": -0.49896076098674397,
              "min_reward": -0.6874293930038663,
              "max_reward": -0.30263926930224155,
              "num_responses": 7,
              "rvariance": 0.01356875619662917
            },
            {
              "id": "chat_sample_162",
              "variance": 0.3861643741434162,
              "mean_reward": 0.792405201034222,
              "min_reward": 0.5214815425096088,
              "max_reward": 1.006334276504178,
              "num_responses": 7,
              "rvariance": 0.026603169448194738
            },
            {
              "id": "chat_sample_49",
              "variance": 0.384102998480729,
              "mean_reward": -0.40080001514449276,
              "min_reward": -0.5912318620784601,
              "max_reward": -0.0999373291379928,
              "num_responses": 7,
              "rvariance": 0.02598076677374028
            },
            {
              "id": "chat_sample_177",
              "variance": 0.48923315727777994,
              "mean_reward": -1.8775302755953198,
              "min_reward": -2.281559905482026,
              "max_reward": -1.5394646669146068,
              "num_responses": 5,
              "rvariance": 0.05723105184306169
            },
            {
              "id": "chat_sample_273",
              "variance": 0.5002271608121123,
              "mean_reward": -1.8575054834435005,
              "min_reward": -2.0891648436312136,
              "max_reward": -1.3745546138996247,
              "num_responses": 7,
              "rvariance": 0.05484544828235567
            },
            {
              "id": "chat_sample_285",
              "variance": 0.6493333337464917,
              "mean_reward": 0.0457086775054474,
              "min_reward": -0.2751542604664112,
              "max_reward": 0.4489039410524942,
              "num_responses": 7,
              "rvariance": 0.08284302224189612
            },
            {
              "id": "chat_sample_293",
              "variance": 0.4136493829792468,
              "mean_reward": -0.901419818939974,
              "min_reward": -1.2371295697204732,
              "max_reward": -0.6462018797501208,
              "num_responses": 7,
              "rvariance": 0.03203043555520148
            },
            {
              "id": "chat_sample_233",
              "variance": 0.8327957677256591,
              "mean_reward": 0.4302533993424665,
              "min_reward": 0.0271808367277225,
              "max_reward": 0.9444930066235598,
              "num_responses": 7,
              "rvariance": 0.11387172379902048
            },
            {
              "id": "chat_sample_235",
              "variance": 2.8769932998905405,
              "mean_reward": -0.6449135199609412,
              "min_reward": -1.883027277362486,
              "max_reward": 1.2124718427729058,
              "num_responses": 7,
              "rvariance": 1.7927818717053072
            },
            {
              "id": "chat_sample_158",
              "variance": 0.3684708997053504,
              "mean_reward": 0.5229386160807046,
              "min_reward": 0.30031311203378647,
              "max_reward": 0.8311173451757599,
              "num_responses": 7,
              "rvariance": 0.02735328949998255
            },
            {
              "id": "chat_sample_216",
              "variance": 0.5230740744068959,
              "mean_reward": 0.7589691969817052,
              "min_reward": 0.44289159536965633,
              "max_reward": 1.0303836592355298,
              "num_responses": 7,
              "rvariance": 0.04610647240187279
            },
            {
              "id": "chat_sample_242",
              "variance": 0.8767717818629881,
              "mean_reward": -0.2525772889226935,
              "min_reward": -0.5568756010336722,
              "max_reward": 1.0784824246982327,
              "num_responses": 7,
              "rvariance": 0.3105570513562254
            },
            {
              "id": "chat_sample_92",
              "variance": 0.26110758394038824,
              "mean_reward": -0.044721909601726506,
              "min_reward": -0.1480360946006959,
              "max_reward": 0.19037307669046513,
              "num_responses": 7,
              "rvariance": 0.014312980601356587
            },
            {
              "id": "chat_sample_250",
              "variance": 3.143168432335035,
              "mean_reward": 4.636789011324455,
              "min_reward": 0.6395811898510672,
              "max_reward": 6.183822815953718,
              "num_responses": 6,
              "rvariance": 3.3595621762608303
            },
            {
              "id": "chat_sample_283",
              "variance": 0.7201072314987549,
              "mean_reward": 0.234668113251781,
              "min_reward": -0.47442057452618114,
              "max_reward": 0.7151649641496006,
              "num_responses": 7,
              "rvariance": 0.12097558000601605
            },
            {
              "id": "chat_sample_140",
              "variance": 0.85375308696298,
              "mean_reward": 0.10742724645376286,
              "min_reward": -0.5774893576605449,
              "max_reward": 1.044126163653445,
              "num_responses": 7,
              "rvariance": 0.2039790338561169
            },
            {
              "id": "chat_sample_232",
              "variance": 0.30010194022622255,
              "mean_reward": 0.36608081174809476,
              "min_reward": 0.2539321596233228,
              "max_reward": 0.6498880681645036,
              "num_responses": 7,
              "rvariance": 0.0190576069032381
            },
            {
              "id": "chat_sample_0",
              "variance": 0.36142786619116907,
              "mean_reward": -0.13036716034909068,
              "min_reward": -0.38509429580973253,
              "max_reward": 0.26080341183228034,
              "num_responses": 7,
              "rvariance": 0.0345048401790435
            },
            {
              "id": "chat_sample_34",
              "variance": 0.29567857161670613,
              "mean_reward": 0.6559004138473414,
              "min_reward": 0.4343025301084594,
              "max_reward": 0.862037980116069,
              "num_responses": 7,
              "rvariance": 0.017885570522450996
            },
            {
              "id": "chat_sample_68",
              "variance": 0.2693530865911373,
              "mean_reward": -0.06950749792689492,
              "min_reward": -0.2270554950037081,
              "max_reward": 0.1165071154441711,
              "num_responses": 7,
              "rvariance": 0.012219781713226185
            },
            {
              "id": "chat_sample_149",
              "variance": 0.2830955910090527,
              "mean_reward": 1.6860974414617675,
              "min_reward": 1.504500061653603,
              "max_reward": 1.8824189331462702,
              "num_responses": 7,
              "rvariance": 0.014297202417666785
            },
            {
              "id": "chat_sample_309",
              "variance": 0.666511464268886,
              "mean_reward": -1.1536929357545596,
              "min_reward": -1.4432671359892006,
              "max_reward": -0.6324593753322055,
              "num_responses": 7,
              "rvariance": 0.08307563000717044
            },
            {
              "id": "chat_sample_243",
              "variance": 0.4273918873971617,
              "mean_reward": -0.29969444692697395,
              "min_reward": -0.6943006452128239,
              "max_reward": -0.02778918094393817,
              "num_responses": 7,
              "rvariance": 0.041327278628854096
            },
            {
              "id": "chat_sample_281",
              "variance": 0.3009608467523422,
              "mean_reward": -0.45920565892063214,
              "min_reward": -0.8592106982278058,
              "max_reward": -0.29233239098880515,
              "num_responses": 7,
              "rvariance": 0.02984557866868983
            },
            {
              "id": "chat_sample_99",
              "variance": 2.1809354511231374,
              "mean_reward": 1.0647399202803176,
              "min_reward": -0.1033729552424716,
              "max_reward": 2.597029162877859,
              "num_responses": 7,
              "rvariance": 0.9568006215880691
            },
            {
              "id": "chat_sample_43",
              "variance": 0.2081989419314148,
              "mean_reward": 0.25785858945701284,
              "min_reward": 0.10963586323521352,
              "max_reward": 0.39307501685471385,
              "num_responses": 7,
              "rvariance": 0.00764254266922943
            },
            {
              "id": "chat_sample_148",
              "variance": 0.3418447973956398,
              "mean_reward": 1.2975035888587558,
              "min_reward": 1.0235124070265722,
              "max_reward": 1.4838863050267301,
              "num_responses": 4,
              "rvariance": 0.028944460702672856
            },
            {
              "id": "chat_sample_249",
              "variance": 0.5300312172684657,
              "mean_reward": 0.40912583256157575,
              "min_reward": 0.04435896725011646,
              "max_reward": 0.719459496780199,
              "num_responses": 7,
              "rvariance": 0.057286438476081426
            },
            {
              "id": "chat_sample_100",
              "variance": 0.46681569694605585,
              "mean_reward": 0.5904803667745577,
              "min_reward": 0.3724612602278411,
              "max_reward": 1.0132055287131356,
              "num_responses": 6,
              "rvariance": 0.05002246511473322
            },
            {
              "id": "chat_sample_141",
              "variance": 0.475490652859865,
              "mean_reward": 0.3491480830903065,
              "min_reward": 0.16117025480239539,
              "max_reward": 1.2159074688773845,
              "num_responses": 7,
              "rvariance": 0.1261762078609479
            },
            {
              "id": "chat_sample_97",
              "variance": 0.26780705484412193,
              "mean_reward": 0.399578166266763,
              "min_reward": 0.18350182448150754,
              "max_reward": 0.7125882445712415,
              "num_responses": 7,
              "rvariance": 0.021782535359712123
            },
            {
              "id": "chat_sample_137",
              "variance": 0.5417982366763054,
              "mean_reward": 0.12362376951773431,
              "min_reward": -0.3644805391828598,
              "max_reward": 0.4669409781010079,
              "num_responses": 7,
              "rvariance": 0.06443918618650725
            },
            {
              "id": "chat_sample_207",
              "variance": 0.19802089959689645,
              "mean_reward": 0.5097329282416142,
              "min_reward": 0.3741790732800805,
              "max_reward": 0.7246129359369173,
              "num_responses": 7,
              "rvariance": 0.010602263823141857
            },
            {
              "id": "chat_sample_190",
              "variance": 0.4930123459927067,
              "mean_reward": -0.020917928734980596,
              "min_reward": -0.39196554801869016,
              "max_reward": 0.30718436424274403,
              "num_responses": 7,
              "rvariance": 0.048633059453834
            },
            {
              "id": "chat_sample_254",
              "variance": 0.2140395063090288,
              "mean_reward": 1.0352916965276422,
              "min_reward": 0.853448914854872,
              "max_reward": 1.1952937122505116,
              "num_responses": 7,
              "rvariance": 0.010067083414845678
            },
            {
              "id": "chat_sample_171",
              "variance": 0.5634426811345219,
              "mean_reward": -1.720080439264349,
              "min_reward": -2.0754223392132984,
              "max_reward": -1.3470696050637945,
              "num_responses": 7,
              "rvariance": 0.06558328517024341
            },
            {
              "id": "chat_sample_131",
              "variance": 0.1471306879243044,
              "mean_reward": 0.6734159719335681,
              "min_reward": 0.5620648758687644,
              "max_reward": 0.7933254580264931,
              "num_responses": 7,
              "rvariance": 0.004605112455092851
            },
            {
              "id": "chat_sample_272",
              "variance": 0.4741164024180733,
              "mean_reward": -0.9917277051148451,
              "min_reward": -1.6219196934220979,
              "max_reward": -0.7355281584665694,
              "num_responses": 7,
              "rvariance": 0.07421672186402255
            },
            {
              "id": "chat_sample_317",
              "variance": 0.5996885365367732,
              "mean_reward": 0.4716649639946663,
              "min_reward": -0.12055108576486556,
              "max_reward": 0.975413641563869,
              "num_responses": 7,
              "rvariance": 0.09383324231898617
            },
            {
              "id": "chat_sample_221",
              "variance": 0.9949573198570584,
              "mean_reward": -1.1478032910040243,
              "min_reward": -1.8143147552729102,
              "max_reward": -0.6462018797501208,
              "num_responses": 7,
              "rvariance": 0.17146814658535345
            },
            {
              "id": "chat_sample_263",
              "variance": 0.6644500886061984,
              "mean_reward": -0.40472644497818283,
              "min_reward": -0.9966357424069576,
              "max_reward": -0.031224807048416965,
              "num_responses": 7,
              "rvariance": 0.09256229306170193
            },
            {
              "id": "chat_sample_112",
              "variance": 0.7628807764995159,
              "mean_reward": 0.15515790911955749,
              "min_reward": -0.15834297291413227,
              "max_reward": 0.8276817190712811,
              "num_responses": 7,
              "rvariance": 0.13202940212222594
            },
            {
              "id": "chat_sample_138",
              "variance": 0.555197178483773,
              "mean_reward": -0.6736868885859512,
              "min_reward": -0.9347944725263394,
              "max_reward": -0.24766925163058087,
              "num_responses": 7,
              "rvariance": 0.05360824597043466
            },
            {
              "id": "chat_sample_1",
              "variance": 0.6785361556345615,
              "mean_reward": 0.26309382923526625,
              "min_reward": -0.20644173837683535,
              "max_reward": 0.6511764279536831,
              "num_responses": 6,
              "rvariance": 0.0922310160265886
            },
            {
              "id": "chat_sample_42",
              "variance": 0.2968380954269676,
              "mean_reward": -1.472715359741876,
              "min_reward": -1.7043747199295889,
              "max_reward": -1.2920995873921337,
              "num_responses": 7,
              "rvariance": 0.017343957643752673
            },
            {
              "id": "chat_sample_101",
              "variance": 0.5495283954113829,
              "mean_reward": 0.5490432394281284,
              "min_reward": 0.16975932006359237,
              "max_reward": 1.0372549114444873,
              "num_responses": 7,
              "rvariance": 0.06523518322695179
            },
            {
              "id": "chat_sample_21",
              "variance": 0.5551971784837728,
              "mean_reward": 0.06031008844948228,
              "min_reward": -0.21674861669027173,
              "max_reward": 0.43945596926517755,
              "num_responses": 7,
              "rvariance": 0.060083925711520485
            },
            {
              "id": "chat_sample_66",
              "variance": 1.243009524600427,
              "mean_reward": 0.6665753949576861,
              "min_reward": 0.09589335881729834,
              "max_reward": 1.4770150528177726,
              "num_responses": 7,
              "rvariance": 0.27536992517674824
            },
            {
              "id": "chat_sample_151",
              "variance": 0.8396670199346168,
              "mean_reward": -1.6562759544668857,
              "min_reward": -1.9517397994520618,
              "max_reward": -1.0172494990338303,
              "num_responses": 7,
              "rvariance": 0.1318622557526418
            },
            {
              "id": "chat_sample_33",
              "variance": 0.4342631396061192,
              "mean_reward": -2.348309212654757,
              "min_reward": -2.61138001151199,
              "max_reward": -2.144134861302874,
              "num_responses": 7,
              "rvariance": 0.03158912818848819
            },
            {
              "id": "chat_sample_219",
              "variance": 0.3930356263523742,
              "mean_reward": -2.3640149319895167,
              "min_reward": -2.625122515929905,
              "max_reward": -2.116649852467044,
              "num_responses": 4,
              "rvariance": 0.03427744162326987
            },
            {
              "id": "chat_sample_5",
              "variance": 0.28721834233442706,
              "mean_reward": -0.45282521044088586,
              "min_reward": -0.6049743664963753,
              "max_reward": -0.2682830082574536,
              "num_responses": 7,
              "rvariance": 0.014291421098452198
            },
            {
              "id": "chat_sample_86",
              "variance": 0.24461657863889008,
              "mean_reward": -0.382149473434465,
              "min_reward": -0.5156480877799267,
              "max_reward": -0.15147172070517467,
              "num_responses": 7,
              "rvariance": 0.012826820230757529
            },
            {
              "id": "chat_sample_108",
              "variance": 0.30439647285682114,
              "mean_reward": 1.16339146985178,
              "min_reward": 0.8895229889518992,
              "max_reward": 1.356768139161015,
              "num_responses": 7,
              "rvariance": 0.019855940842489508
            },
            {
              "id": "chat_sample_28",
              "variance": 0.5538229280419812,
              "mean_reward": -1.2547985039720781,
              "min_reward": -1.5806921801683522,
              "max_reward": -0.8866957070636363,
              "num_responses": 7,
              "rvariance": 0.05754532435556648
            },
            {
              "id": "chat_sample_255",
              "variance": 0.39217671982625407,
              "mean_reward": 0.5092727997454787,
              "min_reward": 0.33295156002633497,
              "max_reward": 0.7400732534070719,
              "num_responses": 7,
              "rvariance": 0.029438356996512555
            },
            {
              "id": "chat_sample_29",
              "variance": 0.20338906538514454,
              "mean_reward": -0.11171661863906295,
              "min_reward": -0.22361986889922933,
              "max_reward": 0.0271808367277225,
              "num_responses": 7,
              "rvariance": 0.007294097742400427
            },
            {
              "id": "chat_sample_60",
              "variance": 0.28721834233442706,
              "mean_reward": -0.1735578885196812,
              "min_reward": -0.3644805391828598,
              "max_reward": 0.013438332309807333,
              "num_responses": 7,
              "rvariance": 0.016821230031434008
            },
            {
              "id": "chat_sample_125",
              "variance": 0.6472719580838047,
              "mean_reward": -1.4285430241128627,
              "min_reward": -1.9792248082878923,
              "max_reward": -1.0309920034517455,
              "num_responses": 7,
              "rvariance": 0.08385803520754417
            },
            {
              "id": "chat_sample_314",
              "variance": 0.5613813054718346,
              "mean_reward": -0.41994136058373177,
              "min_reward": -0.708043149630739,
              "max_reward": -0.1033729552424716,
              "num_responses": 7,
              "rvariance": 0.04861174083923022
            },
            {
              "id": "chat_sample_310",
              "variance": 0.2267513228956004,
              "mean_reward": -0.6746684960443735,
              "min_reward": -0.8179831849740603,
              "max_reward": -0.3644805391828598,
              "num_responses": 7,
              "rvariance": 0.018014590672644437
            },
            {
              "id": "chat_sample_222",
              "variance": 0.3476853617732538,
              "mean_reward": -0.6383490200827406,
              "min_reward": -0.9279232203173818,
              "max_reward": -0.44006431348139324,
              "num_responses": 7,
              "rvariance": 0.022803450088725037
            },
            {
              "id": "chat_sample_143",
              "variance": 0.2824084657881567,
              "mean_reward": -0.23687156958793323,
              "min_reward": -0.5843606098695024,
              "max_reward": -0.07932357251112006,
              "num_responses": 7,
              "rvariance": 0.023423014797887977
            },
            {
              "id": "chat_sample_12",
              "variance": 0.36280211663296047,
              "mean_reward": -0.3477932123896771,
              "min_reward": -0.5912318620784601,
              "max_reward": -0.1480360946006959,
              "num_responses": 7,
              "rvariance": 0.0234331321065135
            },
            {
              "id": "chat_sample_248",
              "variance": 0.4425086422568685,
              "mean_reward": -0.4895373293858878,
              "min_reward": -0.6943006452128239,
              "max_reward": -0.1995704861678778,
              "num_responses": 5,
              "rvariance": 0.03898752092951972
            },
            {
              "id": "chat_sample_64",
              "variance": 0.27275650370088667,
              "mean_reward": 0.2692582729487711,
              "min_reward": 0.08558648050386197,
              "max_reward": 0.5742237713791464,
              "num_responses": 7,
              "rvariance": 0.020459545613740714
            },
            {
              "id": "chat_sample_4",
              "variance": 0.11354744275302409,
              "mean_reward": 0.4041181007619671,
              "min_reward": 0.3295159339218562,
              "max_reward": 0.4652231650487685,
              "num_responses": 7,
              "rvariance": 0.00259138600482465
            },
            {
              "id": "chat_sample_311",
              "variance": 0.3682991184001265,
              "mean_reward": -0.4484079768779846,
              "min_reward": -0.6599443841680359,
              "max_reward": -0.12055108576486556,
              "num_responses": 7,
              "rvariance": 0.027808627198751323
            },
            {
              "id": "chat_sample_117",
              "variance": 0.549013051495711,
              "mean_reward": -0.5338078257607431,
              "min_reward": -0.8385969416009331,
              "max_reward": -0.2339267472126657,
              "num_responses": 7,
              "rvariance": 0.04745258633670608
            },
            {
              "id": "chat_sample_39",
              "variance": 0.4167414464732775,
              "mean_reward": 0.04362276165629957,
              "min_reward": -0.22361986889922933,
              "max_reward": 0.27454591625019553,
              "num_responses": 7,
              "rvariance": 0.03331617685969492
            },
            {
              "id": "chat_sample_287",
              "variance": 0.1747874780653585,
              "mean_reward": 0.34798242423342973,
              "min_reward": 0.2041155811083803,
              "max_reward": 0.4652231650487685,
              "num_responses": 6,
              "rvariance": 0.006575978352624803
            },
            {
              "id": "chat_sample_313",
              "variance": 0.685750970453967,
              "mean_reward": -0.43024823889716807,
              "min_reward": -0.8866957070636363,
              "max_reward": -0.0587098158842473,
              "num_responses": 7,
              "rvariance": 0.08025193734744725
            },
            {
              "id": "chat_sample_3",
              "variance": 0.34905961221504545,
              "mean_reward": -0.9985989573238025,
              "min_reward": -1.3058420918100488,
              "max_reward": -0.7630131673023997,
              "num_responses": 7,
              "rvariance": 0.02564015071668103
            },
            {
              "id": "chat_sample_170",
              "variance": 0.591357143233412,
              "mean_reward": 0.14728459929679363,
              "min_reward": -0.673686888585951,
              "max_reward": 0.40939424085098813,
              "num_responses": 6,
              "rvariance": 0.1381726781735425
            },
            {
              "id": "chat_sample_83",
              "variance": 0.23499682554634943,
              "mean_reward": -0.5686548905347423,
              "min_reward": -0.673686888585951,
              "max_reward": -0.3644805391828598,
              "num_responses": 7,
              "rvariance": 0.010410228799061325
            },
            {
              "id": "chat_sample_279",
              "variance": 0.3147033511702575,
              "mean_reward": -1.1419136462534893,
              "min_reward": -1.3333271006458793,
              "max_reward": -0.8454681938098907,
              "num_responses": 7,
              "rvariance": 0.02203453463318534
            },
            {
              "id": "chat_sample_55",
              "variance": 0.36997398612605986,
              "mean_reward": 0.4621454166635062,
              "min_reward": 0.2779815423546743,
              "max_reward": 0.6859621422615308,
              "num_responses": 6,
              "rvariance": 0.024985755587563163
            },
            {
              "id": "chat_sample_103",
              "variance": 0.6665114642688856,
              "mean_reward": -0.22656469127449688,
              "min_reward": -0.6462018797501208,
              "max_reward": 0.0718439760859468,
              "num_responses": 7,
              "rvariance": 0.06956131456647859
            },
            {
              "id": "chat_sample_113",
              "variance": 0.1195597884358619,
              "mean_reward": -0.987801275281155,
              "min_reward": -1.0997045255413214,
              "max_reward": -0.9141807158994666,
              "num_responses": 7,
              "rvariance": 0.003193215312855351
            },
            {
              "id": "chat_sample_104",
              "variance": 0.6943400357151639,
              "mean_reward": 0.6071881437231242,
              "min_reward": 0.14742775038448022,
              "max_reward": 0.9736958285116296,
              "num_responses": 7,
              "rvariance": 0.08991604474641383
            },
            {
              "id": "chat_sample_282",
              "variance": 0.519069422728863,
              "mean_reward": 0.3669780623155591,
              "min_reward": 0.07527960219042559,
              "max_reward": 0.6649189323715983,
              "num_responses": 7,
              "rvariance": 0.053242676214332985
            },
            {
              "id": "chat_sample_62",
              "variance": 3.0501488555562717,
              "mean_reward": 1.1624098623933576,
              "min_reward": -1.3745546138996247,
              "max_reward": 3.091759321922805,
              "num_responses": 7,
              "rvariance": 1.8784329966172213
            },
            {
              "id": "chat_sample_91",
              "variance": 0.2384324516508281,
              "mean_reward": 0.27650913116704057,
              "min_reward": 0.09245773271281955,
              "max_reward": 0.415406586533826,
              "num_responses": 7,
              "rvariance": 0.01081997979839498
            },
            {
              "id": "chat_sample_284",
              "variance": 0.9289932986510657,
              "mean_reward": -0.2685284101220593,
              "min_reward": -0.6668156363769935,
              "max_reward": 1.0114877156608963,
              "num_responses": 7,
              "rvariance": 0.29861103919663995
            },
            {
              "id": "chat_sample_84",
              "variance": 1.2856112882959638,
              "mean_reward": 0.8782345031800405,
              "min_reward": 0.14055649817552263,
              "max_reward": 1.4632725483998574,
              "num_responses": 7,
              "rvariance": 0.37502068770524444
            },
            {
              "id": "chat_sample_175",
              "variance": 0.5455774253912322,
              "mean_reward": 0.986702127335728,
              "min_reward": 0.7314841881458749,
              "max_reward": 1.3945600263102818,
              "num_responses": 7,
              "rvariance": 0.053286900977423994
            },
            {
              "id": "chat_sample_185",
              "variance": 0.26660458570755435,
              "mean_reward": -0.1490177020591184,
              "min_reward": -0.3232530259291143,
              "max_reward": 0.09589335881729834,
              "num_responses": 7,
              "rvariance": 0.015862976371616676
            },
            {
              "id": "chat_sample_154",
              "variance": 0.43808527364735195,
              "mean_reward": 0.755686947042605,
              "min_reward": 0.4574930063136912,
              "max_reward": 0.9616711371459539,
              "num_responses": 7,
              "rvariance": 0.03162337008403159
            },
            {
              "id": "chat_sample_189",
              "variance": 0.44937989446582605,
              "mean_reward": -1.373573006441202,
              "min_reward": -1.5944346845862674,
              "max_reward": -1.058477012287576,
              "num_responses": 7,
              "rvariance": 0.034080876769973976
            },
            {
              "id": "chat_sample_218",
              "variance": 0.17435802480229867,
              "mean_reward": 0.1296770155113398,
              "min_reward": 0.02374521062324371,
              "max_reward": 0.25908559878004095,
              "num_responses": 6,
              "rvariance": 0.00586110677281883
            },
            {
              "id": "chat_sample_257",
              "variance": 0.44018959463634527,
              "mean_reward": 0.4273852650498883,
              "min_reward": 0.17491275922031055,
              "max_reward": 0.6692134650021968,
              "num_responses": 7,
              "rvariance": 0.03534506751077736
            },
            {
              "id": "chat_sample_13",
              "variance": 0.2923717814911451,
              "mean_reward": 0.5326473273491648,
              "min_reward": 0.35871875580992596,
              "max_reward": 0.6790908900525733,
              "num_responses": 5,
              "rvariance": 0.01665846481781716
            },
            {
              "id": "chat_sample_237",
              "variance": 0.21919294546574697,
              "mean_reward": -0.18680958920838514,
              "min_reward": -0.3301242781380719,
              "max_reward": -0.07588794640664126,
              "num_responses": 7,
              "rvariance": 0.00838628529735563
            },
            {
              "id": "chat_sample_89",
              "variance": 0.31332910072846587,
              "mean_reward": -0.3973643890400139,
              "min_reward": -0.5568756010336722,
              "max_reward": -0.15490734680965348,
              "num_responses": 7,
              "rvariance": 0.01767108395597789
            },
            {
              "id": "chat_sample_23",
              "variance": 0.4195758380094725,
              "mean_reward": 0.5966512011616201,
              "min_reward": 0.2917240467725895,
              "max_reward": 0.892958615056378,
              "num_responses": 7,
              "rvariance": 0.03482008909839988
            },
            {
              "id": "chat_sample_236",
              "variance": 0.6383393302121596,
              "mean_reward": -0.2687738119866649,
              "min_reward": -0.8935669592725939,
              "max_reward": 0.11994274154864988,
              "num_responses": 7,
              "rvariance": 0.09443977647663813
            },
            {
              "id": "chat_sample_234",
              "variance": 0.28584409189263554,
              "mean_reward": -0.44791717314877333,
              "min_reward": -0.9210519681084242,
              "max_reward": -0.28889676488432636,
              "num_responses": 7,
              "rvariance": 0.03872134899288027
            },
            {
              "id": "chat_sample_194",
              "variance": 0.2820649031777089,
              "mean_reward": 0.13098582545590315,
              "min_reward": -0.02435355483945938,
              "max_reward": 0.3226446817128986,
              "num_responses": 7,
              "rvariance": 0.013602601002864548
            },
            {
              "id": "chat_sample_70",
              "variance": 0.23980670209261967,
              "mean_reward": 1.0264572294018397,
              "min_reward": 0.8723448584295054,
              "max_reward": 1.2811843648624814,
              "num_responses": 7,
              "rvariance": 0.014310692162500803
            },
            {
              "id": "chat_sample_74",
              "variance": 0.3765446210508758,
              "mean_reward": -1.5159060879124664,
              "min_reward": -1.9379972950341466,
              "max_reward": -1.2646145785563034,
              "num_responses": 7,
              "rvariance": 0.038727130312094835
            },
            {
              "id": "chat_sample_200",
              "variance": 0.3201144622848115,
              "mean_reward": 0.5664744406233968,
              "min_reward": 0.3295159339218562,
              "max_reward": 0.7864542058175356,
              "num_responses": 7,
              "rvariance": 0.020143993260989066
            },
            {
              "id": "chat_sample_260",
              "variance": 0.19222328054558852,
              "mean_reward": 0.5783457558236941,
              "min_reward": 0.4828307488342223,
              "max_reward": 0.7495212251943886,
              "num_responses": 7,
              "rvariance": 0.007273355824738974
            },
            {
              "id": "chat_sample_315",
              "variance": 0.4136493829792465,
              "mean_reward": -0.2506140740058484,
              "min_reward": -0.7011718974217814,
              "max_reward": -0.03809605925737455,
              "num_responses": 7,
              "rvariance": 0.04300675186069081
            },
            {
              "id": "chat_sample_240",
              "variance": 0.3028504411098055,
              "mean_reward": 0.6966677986049514,
              "min_reward": 0.5012972391457958,
              "max_reward": 0.9479286327280386,
              "num_responses": 7,
              "rvariance": 0.018731939094395446
            },
            {
              "id": "chat_sample_20",
              "variance": 0.2544725310261135,
              "mean_reward": 0.37187076199113384,
              "min_reward": 0.23503621604868943,
              "max_reward": 0.5684529931567797,
              "num_responses": 7,
              "rvariance": 0.011399595982287661
            },
            {
              "id": "chat_sample_210",
              "variance": 0.24049382731351554,
              "mean_reward": -0.11834246898341491,
              "min_reward": -0.24766925163058087,
              "max_reward": 0.16288806785463478,
              "num_responses": 7,
              "rvariance": 0.01630801750698935
            },
            {
              "id": "chat_sample_93",
              "variance": 0.5510744271583983,
              "mean_reward": -1.0211759288675204,
              "min_reward": -1.319584596227964,
              "max_reward": -0.7355281584665694,
              "num_responses": 7,
              "rvariance": 0.04657816180550022
            },
            {
              "id": "chat_sample_226",
              "variance": 0.38753862458520816,
              "mean_reward": -1.877137632611951,
              "min_reward": -2.047937330377468,
              "max_reward": -1.3470696050637945,
              "num_responses": 7,
              "rvariance": 0.05195478867506355
            },
            {
              "id": "chat_sample_30",
              "variance": 0.3332557321344429,
              "mean_reward": 0.11478930239193168,
              "min_reward": -0.13429359018278073,
              "max_reward": 0.3226446817128986,
              "num_responses": 7,
              "rvariance": 0.02095378927250899
            },
            {
              "id": "chat_sample_142",
              "variance": 0.4513983248022073,
              "mean_reward": 0.33032882759836235,
              "min_reward": 0.07527960219042559,
              "max_reward": 0.5872952550735305,
              "num_responses": 7,
              "rvariance": 0.03207091937473736
            },
            {
              "id": "chat_sample_136",
              "variance": 0.6366215171599202,
              "mean_reward": 0.12092434900707241,
              "min_reward": -0.30263926930224155,
              "max_reward": 0.48755473472788063,
              "num_responses": 7,
              "rvariance": 0.06812814962201322
            },
            {
              "id": "chat_sample_16",
              "variance": 0.29202821888069735,
              "mean_reward": -0.12545912305697812,
              "min_reward": -0.3301242781380719,
              "max_reward": 0.06497272387698921,
              "num_responses": 7,
              "rvariance": 0.015145129235805799
            },
            {
              "id": "chat_sample_22",
              "variance": 3.738648326893822,
              "mean_reward": 1.4583645111077448,
              "min_reward": -0.9622794813621697,
              "max_reward": 4.369812232788916,
              "num_responses": 7,
              "rvariance": 2.6331774752087744
            },
            {
              "id": "chat_sample_217",
              "variance": 0.3174518520538404,
              "mean_reward": -0.7158960092981191,
              "min_reward": -0.9691507335711272,
              "max_reward": -0.4331930612724356,
              "num_responses": 7,
              "rvariance": 0.023019286006069516
            }
          ]
        },
        "semantic_benchmark_chat_hard_filtered.json": {
          "file_name": "semantic_benchmark_chat_hard_filtered.json",
          "processed_samples": 200,
          "global_mean": -8.063807165575593,
          "global_std": 6.906930745949853,
          "mean_variance": 0.5246370063651529,
          "mean_rvariance": 0.0931039936449189,
          "sample_results": [
            {
              "id": "chat_hard_sample_121",
              "variance": 1.2699716803235754,
              "mean_reward": 1.7993526213082396,
              "min_reward": 1.164366781146452,
              "max_reward": 2.4343384614700274,
              "num_responses": 6,
              "rvariance": 0.4032070172059714
            },
            {
              "id": "chat_hard_sample_77",
              "variance": 1.2908229904039539,
              "mean_reward": 1.3670147724502342,
              "min_reward": 0.7444597831809396,
              "max_reward": 2.3528985251669385,
              "num_responses": 7,
              "rvariance": 0.3185560832097586
            },
            {
              "id": "chat_hard_sample_265",
              "variance": 1.3564273835369982,
              "mean_reward": 0.7512464445395304,
              "min_reward": 0.23093574038090894,
              "max_reward": 3.0044180155916473,
              "num_responses": 7,
              "rvariance": 0.8685426996325544
            },
            {
              "id": "chat_hard_sample_334",
              "variance": 0.4230352246854879,
              "mean_reward": 0.39758598040852533,
              "min_reward": -0.017908509434083893,
              "max_reward": 0.5747932492161718,
              "num_responses": 6,
              "rvariance": 0.04478561694686656
            },
            {
              "id": "chat_hard_sample_61",
              "variance": 0.27689578343050114,
              "mean_reward": -0.7521606335635173,
              "min_reward": -0.8866011633336952,
              "max_reward": -0.47940148181825243,
              "num_responses": 7,
              "rvariance": 0.01711172169930045
            },
            {
              "id": "chat_hard_sample_133",
              "variance": 0.5791284359330742,
              "mean_reward": -1.087184710154265,
              "min_reward": -1.384289662963681,
              "max_reward": -0.5517925363098867,
              "num_responses": 6,
              "rvariance": 0.07670775797834331
            },
            {
              "id": "chat_hard_sample_62",
              "variance": 0.39068547220953853,
              "mean_reward": 1.9066755408395994,
              "min_reward": 1.7353123415351839,
              "max_reward": 2.235263061618033,
              "num_responses": 4,
              "rvariance": 0.03972665074947072
            },
            {
              "id": "chat_hard_sample_84",
              "variance": 0.9953769992599713,
              "mean_reward": -0.15665803054304958,
              "min_reward": -0.6060858271786124,
              "max_reward": 0.45715778566726606,
              "num_responses": 6,
              "rvariance": 0.17132271176286884
            },
            {
              "id": "chat_hard_sample_343",
              "variance": 0.3966803564096273,
              "mean_reward": 1.6716873912983958,
              "min_reward": 1.369963738397717,
              "max_reward": 1.9230766391228602,
              "num_responses": 4,
              "rvariance": 0.03900050541591206
            },
            {
              "id": "chat_hard_sample_87",
              "variance": 0.44610987330469637,
              "mean_reward": 0.2472237276415266,
              "min_reward": 0.009238136000278962,
              "max_reward": 0.710526476387986,
              "num_responses": 5,
              "rvariance": 0.058141318982466675
            },
            {
              "id": "chat_hard_sample_110",
              "variance": 1.1157271273523137,
              "mean_reward": -0.5605182437709318,
              "min_reward": -0.9499433360138753,
              "max_reward": 0.6177754378205796,
              "num_responses": 7,
              "rvariance": 0.3065093283889674
            },
            {
              "id": "chat_hard_sample_150",
              "variance": 0.6551390431492903,
              "mean_reward": -0.06767735939708246,
              "min_reward": -0.497499245441161,
              "max_reward": 0.32594899940117894,
              "num_responses": 7,
              "rvariance": 0.07423796800315156
            },
            {
              "id": "chat_hard_sample_65",
              "variance": 0.5338840268758029,
              "mean_reward": 0.21962463811659108,
              "min_reward": -0.21698390928607816,
              "max_reward": 0.6494465241606696,
              "num_responses": 7,
              "rvariance": 0.06839654591671436
            },
            {
              "id": "chat_hard_sample_46",
              "variance": 0.8725384286694795,
              "mean_reward": 1.6808574634912536,
              "min_reward": 1.0159262375245681,
              "max_reward": 2.2488363843352146,
              "num_responses": 7,
              "rvariance": 0.15124985429532037
            },
            {
              "id": "chat_hard_sample_114",
              "variance": 0.4307267742252239,
              "mean_reward": -0.687525763481701,
              "min_reward": -1.0947254449971437,
              "max_reward": -0.47940148181825243,
              "num_responses": 4,
              "rvariance": 0.05723570116433005
            },
            {
              "id": "chat_hard_sample_371",
              "variance": 0.17554830714221317,
              "mean_reward": 0.1562824654364111,
              "min_reward": 0.06353142686900468,
              "max_reward": 0.28522903124963467,
              "num_responses": 4,
              "rvariance": 0.0070469921766168194
            },
            {
              "id": "chat_hard_sample_223",
              "variance": 0.26241757253217424,
              "mean_reward": 0.4046742711608312,
              "min_reward": 0.27165570853245324,
              "max_reward": 0.6879042718593503,
              "num_responses": 5,
              "rvariance": 0.02120423057727455
            },
            {
              "id": "chat_hard_sample_52",
              "variance": 0.6761776933609215,
              "mean_reward": 0.9338399525206614,
              "min_reward": 0.5928910128390803,
              "max_reward": 1.385799281567762,
              "num_responses": 7,
              "rvariance": 0.07764480275638848
            },
            {
              "id": "chat_hard_sample_372",
              "variance": 2.276019997626039,
              "mean_reward": -0.3374471484010634,
              "min_reward": -1.9634180988967551,
              "max_reward": 0.7625575468038481,
              "num_responses": 4,
              "rvariance": 1.1859503782423912
            },
            {
              "id": "chat_hard_sample_346",
              "variance": 0.15292610261357736,
              "mean_reward": 0.4933533129130831,
              "min_reward": 0.40286449479854036,
              "max_reward": 0.5702688083104446,
              "num_responses": 5,
              "rvariance": 0.004560841995498116
            },
            {
              "id": "chat_hard_sample_108",
              "variance": 0.798111375770268,
              "mean_reward": 1.4575116699235373,
              "min_reward": 0.7195753581994403,
              "max_reward": 1.9864188118030401,
              "num_responses": 5,
              "rvariance": 0.1689751018201034
            },
            {
              "id": "chat_hard_sample_64",
              "variance": 0.5180484837057578,
              "mean_reward": 0.0024514746416882485,
              "min_reward": -0.434157072760981,
              "max_reward": 0.2897534721553618,
              "num_responses": 6,
              "rvariance": 0.05537799734435045
            },
            {
              "id": "chat_hard_sample_233",
              "variance": 0.45063431421042344,
              "mean_reward": -0.7793072789978801,
              "min_reward": -1.1399698540544152,
              "max_reward": -0.4613037181953438,
              "num_responses": 7,
              "rvariance": 0.040459863846041264
            },
            {
              "id": "chat_hard_sample_47",
              "variance": 0.9293201620363553,
              "mean_reward": -1.2553430971504573,
              "min_reward": -1.9453203352738466,
              "max_reward": -0.6332324726129752,
              "num_responses": 4,
              "rvariance": 0.21651205375172677
            },
            {
              "id": "chat_hard_sample_26",
              "variance": 0.6011850853484944,
              "mean_reward": 1.3241537742272296,
              "min_reward": 1.0125329068452729,
              "max_reward": 1.8733077891598615,
              "num_responses": 7,
              "rvariance": 0.08034706101091506
            },
            {
              "id": "chat_hard_sample_379",
              "variance": 1.6586600360395711,
              "mean_reward": 0.6465379550069879,
              "min_reward": -0.40701042732661813,
              "max_reward": 3.0406135428374643,
              "num_responses": 7,
              "rvariance": 1.0497331059227646
            },
            {
              "id": "chat_hard_sample_247",
              "variance": 0.4688310499781449,
              "mean_reward": 0.6359085486380642,
              "min_reward": 0.4616822265729932,
              "max_reward": 1.1314408693989142,
              "num_responses": 4,
              "rvariance": 0.08188146615447546
            },
            {
              "id": "chat_hard_sample_215",
              "variance": 0.2316513743732297,
              "mean_reward": -0.8697960971124231,
              "min_reward": -1.067578799562781,
              "max_reward": -0.6784768816702467,
              "num_responses": 7,
              "rvariance": 0.012105206248997318
            },
            {
              "id": "chat_hard_sample_49",
              "variance": 0.6189435159034733,
              "mean_reward": -1.000358534677692,
              "min_reward": -1.6014628264385837,
              "max_reward": -0.2712772001548039,
              "num_responses": 7,
              "rvariance": 0.13011926971071575
            },
            {
              "id": "chat_hard_sample_415",
              "variance": 0.7377100896788107,
              "mean_reward": 0.7327447129786104,
              "min_reward": 0.0454336632460961,
              "max_reward": 1.1296028152809625,
              "num_responses": 7,
              "rvariance": 0.11618478082867376
            },
            {
              "id": "chat_hard_sample_297",
              "variance": 0.7347692030900879,
              "mean_reward": 0.1349529583094117,
              "min_reward": -0.18078838204026101,
              "max_reward": 0.6042021151033982,
              "num_responses": 7,
              "rvariance": 0.09496859324786684
            },
            {
              "id": "chat_hard_sample_80",
              "variance": 2.517398919946582,
              "mean_reward": 0.5811274664841897,
              "min_reward": -0.5970369453671581,
              "max_reward": 2.751049324870927,
              "num_responses": 5,
              "rvariance": 1.5004154825139537
            },
            {
              "id": "chat_hard_sample_413",
              "variance": 0.3438575088352628,
              "mean_reward": 0.016778870843157535,
              "min_reward": -0.40701042732661813,
              "max_reward": 0.17664244951218322,
              "num_responses": 6,
              "rvariance": 0.03843462399756991
            },
            {
              "id": "chat_hard_sample_306",
              "variance": 0.4280121096817877,
              "mean_reward": 0.03509208403300549,
              "min_reward": -0.23508167290898674,
              "max_reward": 0.3123756766839975,
              "num_responses": 7,
              "rvariance": 0.03435963532423499
            },
            {
              "id": "chat_hard_sample_43",
              "variance": 0.43344143876866026,
              "mean_reward": -0.0179085094340839,
              "min_reward": -0.35271713645789243,
              "max_reward": 0.31690011758972464,
              "num_responses": 7,
              "rvariance": 0.0378939411244323
            },
            {
              "id": "chat_hard_sample_102",
              "variance": 0.46488630306346385,
              "mean_reward": 0.77424568581031,
              "min_reward": 0.2988023539668161,
              "max_reward": 0.9774684898258874,
              "num_responses": 6,
              "rvariance": 0.05466607656607852
            },
            {
              "id": "chat_hard_sample_187",
              "variance": 0.6605683722361628,
              "mean_reward": -1.3179311963463494,
              "min_reward": -1.8367337535363952,
              "max_reward": -1.040432154128418,
              "num_responses": 6,
              "rvariance": 0.08446610230641238
            },
            {
              "id": "chat_hard_sample_360",
              "variance": 0.7736793948793415,
              "mean_reward": -0.924304837548088,
              "min_reward": -1.3480941357178637,
              "max_reward": -0.1445928547944439,
              "num_responses": 6,
              "rvariance": 0.156242728504265
            },
            {
              "id": "chat_hard_sample_236",
              "variance": 0.48682984145624053,
              "mean_reward": -0.6022077349737034,
              "min_reward": -0.9770899814482381,
              "max_reward": -0.370814900080801,
              "num_responses": 7,
              "rvariance": 0.0434878364748628
            },
            {
              "id": "chat_hard_sample_259",
              "variance": 0.8638783659983611,
              "mean_reward": 0.8339866526430929,
              "min_reward": 0.049958104151823245,
              "max_reward": 1.1702344154460669,
              "num_responses": 7,
              "rvariance": 0.15395761637803412
            },
            {
              "id": "chat_hard_sample_127",
              "variance": 0.1619749844250317,
              "mean_reward": -0.0405307139627196,
              "min_reward": -0.11744620936008103,
              "max_reward": 0.10425139502054895,
              "num_responses": 5,
              "rvariance": 0.006304934176900449
            },
            {
              "id": "chat_hard_sample_280",
              "variance": 0.6026555286428554,
              "mean_reward": 1.2202734189676103,
              "min_reward": 0.7218375786523039,
              "max_reward": 1.4751569894558731,
              "num_responses": 7,
              "rvariance": 0.07142769014503109
            },
            {
              "id": "chat_hard_sample_421",
              "variance": 0.4823054005505134,
              "mean_reward": 0.02927494572564202,
              "min_reward": -0.1988861456631696,
              "max_reward": 0.2942779130610889,
              "num_responses": 7,
              "rvariance": 0.03763576133902781
            },
            {
              "id": "chat_hard_sample_270",
              "variance": 0.2873019975136735,
              "mean_reward": 0.33575195469692104,
              "min_reward": 0.1721180086064561,
              "max_reward": 0.5114510765359918,
              "num_responses": 6,
              "rvariance": 0.015273885004123642
            },
            {
              "id": "chat_hard_sample_276",
              "variance": 0.8008260403137042,
              "mean_reward": 1.1513295575470064,
              "min_reward": 0.7783930899738931,
              "max_reward": 1.791867852856773,
              "num_responses": 6,
              "rvariance": 0.13101802741798338
            },
            {
              "id": "chat_hard_sample_349",
              "variance": 0.9856494513126581,
              "mean_reward": 1.948445825629973,
              "min_reward": 1.4106837065492612,
              "max_reward": 2.4071918160356645,
              "num_responses": 7,
              "rvariance": 0.2201451613630053
            },
            {
              "id": "chat_hard_sample_267",
              "variance": 0.50673738144144,
              "mean_reward": -0.7780145815962438,
              "min_reward": -1.0223343905055096,
              "max_reward": -0.3798637818922553,
              "num_responses": 7,
              "rvariance": 0.04566690728500809
            },
            {
              "id": "chat_hard_sample_14",
              "variance": 0.23979536800353862,
              "mean_reward": -1.109806914682901,
              "min_reward": -1.293800844849138,
              "max_reward": -0.9318455723909667,
              "num_responses": 6,
              "rvariance": 0.012136770839805485
            },
            {
              "id": "chat_hard_sample_13",
              "variance": 1.5541454511172732,
              "mean_reward": 0.4041571922001767,
              "min_reward": -1.0494810359398723,
              "max_reward": 1.0883172920162023,
              "num_responses": 7,
              "rvariance": 0.4910287081743157
            },
            {
              "id": "chat_hard_sample_147",
              "variance": 0.1303038980849418,
              "mean_reward": -1.4494416120061515,
              "min_reward": -1.5290717719469495,
              "max_reward": -1.3480941357178637,
              "num_responses": 5,
              "rvariance": 0.0037469323108436994
            },
            {
              "id": "chat_hard_sample_173",
              "variance": 0.06334217268017994,
              "mean_reward": -2.2831452562348065,
              "min_reward": -2.3253733713549263,
              "max_reward": -2.2529823168632923,
              "num_responses": 6,
              "rvariance": 0.000946195027990824
            },
            {
              "id": "chat_hard_sample_345",
              "variance": 1.0315725265057885,
              "mean_reward": 0.2437549896138025,
              "min_reward": -0.20793502747462386,
              "max_reward": 1.2715571486981516,
              "num_responses": 6,
              "rvariance": 0.2613914941238447
            },
            {
              "id": "chat_hard_sample_412",
              "variance": 0.2063145053011577,
              "mean_reward": -1.1205793930298702,
              "min_reward": -1.2214097903575039,
              "max_reward": -1.0042366268826008,
              "num_responses": 7,
              "rvariance": 0.006256473246306736
            },
            {
              "id": "chat_hard_sample_21",
              "variance": 0.8539882209559981,
              "mean_reward": 0.18682244155006933,
              "min_reward": -0.3165216092120753,
              "max_reward": 0.7173131377465768,
              "num_responses": 6,
              "rvariance": 0.1391380072973929
            },
            {
              "id": "chat_hard_sample_357",
              "variance": 0.7673451776113236,
              "mean_reward": -1.282166568234411,
              "min_reward": -1.8548315171593037,
              "max_reward": -0.5336947726869781,
              "num_responses": 7,
              "rvariance": 0.14848094920601979
            },
            {
              "id": "chat_hard_sample_184",
              "variance": 0.5514162353854954,
              "mean_reward": 0.8628493202141332,
              "min_reward": 0.27618014943818037,
              "max_reward": 1.0713506386197256,
              "num_responses": 6,
              "rvariance": 0.0805191213941279
            },
            {
              "id": "chat_hard_sample_348",
              "variance": 0.28503977706080996,
              "mean_reward": 1.793375999825349,
              "min_reward": 1.6742323893078674,
              "max_reward": 2.067858748106129,
              "num_responses": 6,
              "rvariance": 0.02031134999989935
            },
            {
              "id": "chat_hard_sample_283",
              "variance": 0.34385750883526284,
              "mean_reward": -0.349700842520741,
              "min_reward": -0.5698902999327953,
              "max_reward": -0.11744620936008103,
              "num_responses": 6,
              "rvariance": 0.022426641769205783
            },
            {
              "id": "chat_hard_sample_0",
              "variance": 0.6693910320023311,
              "mean_reward": 0.1261464572607642,
              "min_reward": -0.244130554720441,
              "max_reward": 1.1035872800730315,
              "num_responses": 7,
              "rvariance": 0.17151653662772168
            },
            {
              "id": "chat_hard_sample_258",
              "variance": 0.40177035242857023,
              "mean_reward": -0.5013773376460698,
              "min_reward": -0.8413567542764238,
              "max_reward": -0.244130554720441,
              "num_responses": 7,
              "rvariance": 0.03270277281790135
            },
            {
              "id": "chat_hard_sample_161",
              "variance": 0.15766969612567583,
              "mean_reward": 1.2740102440017256,
              "min_reward": 1.1724082679124905,
              "max_reward": 1.3473415338690813,
              "num_responses": 5,
              "rvariance": 0.005141784050459794
            },
            {
              "id": "chat_hard_sample_4",
              "variance": 0.7486818588751991,
              "mean_reward": 0.8901306216278331,
              "min_reward": 0.44810890385581176,
              "max_reward": 1.6878057120250487,
              "num_responses": 7,
              "rvariance": 0.14209842793038047
            },
            {
              "id": "chat_hard_sample_238",
              "variance": 0.5700795541216199,
              "mean_reward": -0.30294828649489386,
              "min_reward": -0.6694279998587924,
              "max_reward": -0.06315291849135532,
              "num_responses": 6,
              "rvariance": 0.062469342412904354
            },
            {
              "id": "chat_hard_sample_8",
              "variance": 0.7003834522065616,
              "mean_reward": -0.9874315606613288,
              "min_reward": -1.3480941357178637,
              "max_reward": -0.39796154551516383,
              "num_responses": 7,
              "rvariance": 0.09492326556709597
            },
            {
              "id": "chat_hard_sample_32",
              "variance": 0.33842817974839035,
              "mean_reward": 0.3812118133211319,
              "min_reward": 0.17664244951218322,
              "max_reward": 0.663019846877851,
              "num_responses": 7,
              "rvariance": 0.022590522339570856
            },
            {
              "id": "chat_hard_sample_109",
              "variance": 0.481400512369368,
              "mean_reward": 0.057067939860823036,
              "min_reward": -0.5155970090640696,
              "max_reward": 0.44358446295008463,
              "num_responses": 7,
              "rvariance": 0.07130106850251482
            },
            {
              "id": "chat_hard_sample_188",
              "variance": 0.3316415183897996,
              "mean_reward": 0.6087265560091252,
              "min_reward": 0.14949580407782037,
              "max_reward": 0.853046364918391,
              "num_responses": 7,
              "rvariance": 0.04054341717465113
            },
            {
              "id": "chat_hard_sample_53",
              "variance": 0.24612958527155637,
              "mean_reward": -1.9996136261425723,
              "min_reward": -2.1986890259945664,
              "max_reward": -1.7462449354218523,
              "num_responses": 7,
              "rvariance": 0.01618929295144753
            },
            {
              "id": "chat_hard_sample_356",
              "variance": 0.5845577650199467,
              "mean_reward": -0.8866011633336951,
              "min_reward": -1.420485190209498,
              "max_reward": -0.5155970090640696,
              "num_responses": 7,
              "rvariance": 0.07219676018521255
            },
            {
              "id": "chat_hard_sample_63",
              "variance": 0.40267524060971566,
              "mean_reward": 0.21219162805718222,
              "min_reward": -0.017908509434083893,
              "max_reward": 0.4390600220443575,
              "num_responses": 7,
              "rvariance": 0.02704119927129687
            },
            {
              "id": "chat_hard_sample_159",
              "variance": 0.2918264384194007,
              "mean_reward": -0.06880846962351425,
              "min_reward": -0.2712772001548039,
              "max_reward": 0.12234915864345752,
              "num_responses": 4,
              "rvariance": 0.019768169230375176
            },
            {
              "id": "chat_hard_sample_152",
              "variance": 0.19455095894626728,
              "mean_reward": -1.2500645827604424,
              "min_reward": -1.3661918993407722,
              "max_reward": -1.103774326808598,
              "num_responses": 6,
              "rvariance": 0.007708305167934928
            },
            {
              "id": "chat_hard_sample_318",
              "variance": 0.8652993232203159,
              "mean_reward": 1.0771947081229565,
              "min_reward": 0.6426598628020789,
              "max_reward": 1.6878057120250487,
              "num_responses": 6,
              "rvariance": 0.14537531042192453
            },
            {
              "id": "chat_hard_sample_176",
              "variance": 0.7058127812934343,
              "mean_reward": 0.4746092005893564,
              "min_reward": -0.16269061841735244,
              "max_reward": 0.8281619399368917,
              "num_responses": 7,
              "rvariance": 0.11018678763754619
            },
            {
              "id": "chat_hard_sample_274",
              "variance": 0.13573322717181424,
              "mean_reward": -0.6633954119844895,
              "min_reward": -0.7599168179733352,
              "max_reward": -0.5879880635557039,
              "num_responses": 6,
              "rvariance": 0.0034026628891208736
            },
            {
              "id": "chat_hard_sample_389",
              "variance": 0.18459718895366745,
              "mean_reward": 0.11330027683200325,
              "min_reward": 0.02733589962318753,
              "max_reward": 0.24450906309809037,
              "num_responses": 7,
              "rvariance": 0.006223051914862782
            },
            {
              "id": "chat_hard_sample_42",
              "variance": 1.4080060098622869,
              "mean_reward": -1.5652672991927667,
              "min_reward": -2.090102444257115,
              "max_reward": -0.497499245441161,
              "num_responses": 7,
              "rvariance": 0.37216657842720735
            },
            {
              "id": "chat_hard_sample_5",
              "variance": 0.8904099702471016,
              "mean_reward": -0.28485052287198526,
              "min_reward": -1.420485190209498,
              "max_reward": 0.16759356770072895,
              "num_responses": 7,
              "rvariance": 0.24208490771436592
            },
            {
              "id": "chat_hard_sample_17",
              "variance": 0.12442212490749682,
              "mean_reward": 2.159855713189247,
              "min_reward": 2.076907629917583,
              "max_reward": 2.244311943429487,
              "num_responses": 6,
              "rvariance": 0.0028977222732219296
            },
            {
              "id": "chat_hard_sample_182",
              "variance": 0.23074648619208432,
              "mean_reward": -0.39569932506230027,
              "min_reward": -0.5517925363098867,
              "max_reward": -0.2531794365318953,
              "num_responses": 4,
              "rvariance": 0.011847339788575115
            },
            {
              "id": "chat_hard_sample_140",
              "variance": 0.4506343142104233,
              "mean_reward": -0.8250687670158061,
              "min_reward": -1.0042366268826008,
              "max_reward": -0.4884503636297067,
              "num_responses": 5,
              "rvariance": 0.04734104861969822
            },
            {
              "id": "chat_hard_sample_251",
              "variance": 0.8053504812194314,
              "mean_reward": -1.1309209722429607,
              "min_reward": -1.4747784810782236,
              "max_reward": -0.34366825464643813,
              "num_responses": 6,
              "rvariance": 0.1545664166397716
            },
            {
              "id": "chat_hard_sample_98",
              "variance": 0.28865932978539177,
              "mean_reward": 0.7297553502373264,
              "min_reward": 0.45263334476153894,
              "max_reward": 0.9605018364294107,
              "num_responses": 7,
              "rvariance": 0.020220166627739355
            },
            {
              "id": "chat_hard_sample_409",
              "variance": 0.24884424981499287,
              "mean_reward": -0.3662904591750738,
              "min_reward": -0.560841418121341,
              "max_reward": -0.1355439729829896,
              "num_responses": 6,
              "rvariance": 0.01579645305143349
            },
            {
              "id": "chat_hard_sample_248",
              "variance": 0.24703447345270196,
              "mean_reward": 0.37830324416745015,
              "min_reward": 0.1630691267950018,
              "max_reward": 0.5024021947245375,
              "num_responses": 7,
              "rvariance": 0.012421873364428704
            },
            {
              "id": "chat_hard_sample_382",
              "variance": 0.15654565533815923,
              "mean_reward": 0.41773051491735813,
              "min_reward": 0.33047344030690606,
              "max_reward": 0.5928910128390803,
              "num_responses": 7,
              "rvariance": 0.006478725100408969
            },
            {
              "id": "chat_hard_sample_254",
              "variance": 0.35290639064671714,
              "mean_reward": -0.723721290727518,
              "min_reward": -0.8866011633336952,
              "max_reward": -0.370814900080801,
              "num_responses": 6,
              "rvariance": 0.029777849294365322
            },
            {
              "id": "chat_hard_sample_2",
              "variance": 0.7908722703211046,
              "mean_reward": -1.328703674693319,
              "min_reward": -1.8548315171593037,
              "max_reward": -0.7870634634076981,
              "num_responses": 7,
              "rvariance": 0.11431766420401794
            },
            {
              "id": "chat_hard_sample_203",
              "variance": 0.17192875441763145,
              "mean_reward": -0.7095016193095185,
              "min_reward": -0.7961123452191524,
              "max_reward": -0.5698902999327953,
              "num_responses": 7,
              "rvariance": 0.005494466889384756
            },
            {
              "id": "chat_hard_sample_68",
              "variance": 0.5221204805209122,
              "mean_reward": -0.14911729570017102,
              "min_reward": -0.560841418121341,
              "max_reward": 0.1947402131350918,
              "num_responses": 5,
              "rvariance": 0.060838520693987465
            },
            {
              "id": "chat_hard_sample_220",
              "variance": 0.23889047982239298,
              "mean_reward": -1.0417248515300543,
              "min_reward": -1.2033120267345951,
              "max_reward": -0.9046989269566038,
              "num_responses": 7,
              "rvariance": 0.010490955940254709
            },
            {
              "id": "chat_hard_sample_11",
              "variance": 0.17102386623648597,
              "mean_reward": -0.006597407169766036,
              "min_reward": -0.15364173660589817,
              "max_reward": 0.0771047495861861,
              "num_responses": 4,
              "rvariance": 0.007783932534955832
            },
            {
              "id": "chat_hard_sample_6",
              "variance": 0.5700795541216199,
              "mean_reward": -0.3934371046094367,
              "min_reward": -1.0494810359398723,
              "max_reward": -0.045055154868446745,
              "num_responses": 6,
              "rvariance": 0.09762412691440986
            },
            {
              "id": "chat_hard_sample_286",
              "variance": 0.3234975247594907,
              "mean_reward": 0.3877830251127832,
              "min_reward": 0.009238136000278962,
              "max_reward": 0.5385977219703546,
              "num_responses": 6,
              "rvariance": 0.03133816128763867
            },
            {
              "id": "chat_hard_sample_400",
              "variance": 0.40584234924372464,
              "mean_reward": 0.429364791532085,
              "min_reward": 0.12687359954918467,
              "max_reward": 0.6901664923122139,
              "num_responses": 7,
              "rvariance": 0.031359026410533196
            },
            {
              "id": "chat_hard_sample_209",
              "variance": 0.7655354012490324,
              "mean_reward": -1.2084828163411405,
              "min_reward": -1.547169535569858,
              "max_reward": -0.7056235271046095,
              "num_responses": 7,
              "rvariance": 0.09685167639141168
            },
            {
              "id": "chat_hard_sample_337",
              "variance": 0.4633027487464596,
              "mean_reward": -0.9938950476695103,
              "min_reward": -1.2757030812262296,
              "max_reward": -0.5789391817442495,
              "num_responses": 7,
              "rvariance": 0.04862469511779734
            },
            {
              "id": "chat_hard_sample_268",
              "variance": 0.3981507997039886,
              "mean_reward": -1.9151573959023322,
              "min_reward": -2.0720046806342065,
              "max_reward": -1.637658353684401,
              "num_responses": 6,
              "rvariance": 0.03391745254182523
            },
            {
              "id": "chat_hard_sample_249",
              "variance": 0.27463356297763775,
              "mean_reward": 1.4773384163211343,
              "min_reward": 1.2766471447170946,
              "max_reward": 1.6900679324779124,
              "num_responses": 7,
              "rvariance": 0.014681638412720504
            },
            {
              "id": "chat_hard_sample_295",
              "variance": 0.4795907360070772,
              "mean_reward": 0.41352924836204,
              "min_reward": 0.018287017811733246,
              "max_reward": 0.8032775149553925,
              "num_responses": 7,
              "rvariance": 0.051800348254936776
            },
            {
              "id": "chat_hard_sample_153",
              "variance": 0.8664304334467474,
              "mean_reward": 2.2269682532908663,
              "min_reward": 0.837210821748346,
              "max_reward": 2.5700716886418413,
              "num_responses": 6,
              "rvariance": 0.3871694721355395
            },
            {
              "id": "chat_hard_sample_192",
              "variance": 0.28051533615508284,
              "mean_reward": -0.3255704910235296,
              "min_reward": -0.624183590801521,
              "max_reward": -0.21698390928607816,
              "num_responses": 5,
              "rvariance": 0.0235165856572183
            },
            {
              "id": "chat_hard_sample_363",
              "variance": 0.4354774371762375,
              "mean_reward": 0.5186147746367263,
              "min_reward": 0.27165570853245324,
              "max_reward": 0.7693442081624389,
              "num_responses": 6,
              "rvariance": 0.03860137381244871
            },
            {
              "id": "chat_hard_sample_129",
              "variance": 0.228031821648648,
              "mean_reward": -0.5536023126721774,
              "min_reward": -0.6332324726129752,
              "max_reward": -0.2712772001548039,
              "num_responses": 5,
              "rvariance": 0.020025126003932126
            },
            {
              "id": "chat_hard_sample_359",
              "variance": 0.42529744513835144,
              "mean_reward": -1.0843838657840532,
              "min_reward": -1.547169535569858,
              "max_reward": -0.877552281522241,
              "num_responses": 7,
              "rvariance": 0.04352459993945114
            },
            {
              "id": "chat_hard_sample_7",
              "variance": 0.9116748425040191,
              "mean_reward": 1.612775400338407,
              "min_reward": 0.8485219240126639,
              "max_reward": 2.2578852661466686,
              "num_responses": 6,
              "rvariance": 0.18466397636351664
            },
            {
              "id": "chat_hard_sample_316",
              "variance": 0.5501720141364206,
              "mean_reward": -0.4522548363838896,
              "min_reward": -0.7056235271046095,
              "max_reward": -0.036006273056992465,
              "num_responses": 7,
              "rvariance": 0.056615735466044856
            },
            {
              "id": "chat_hard_sample_41",
              "variance": 0.9931147788071077,
              "mean_reward": 0.32971936682261827,
              "min_reward": -0.5246458908755238,
              "max_reward": 0.7919664126910746,
              "num_responses": 6,
              "rvariance": 0.2092939049023784
            },
            {
              "id": "chat_hard_sample_143",
              "variance": 0.2081242816634486,
              "mean_reward": 0.19474021313509182,
              "min_reward": 0.049958104151823245,
              "max_reward": 0.2988023539668161,
              "num_responses": 4,
              "rvariance": 0.009754224465237223
            },
            {
              "id": "chat_hard_sample_370",
              "variance": 0.3060218717611196,
              "mean_reward": 1.140398858424316,
              "min_reward": 0.9356174114479113,
              "max_reward": 1.391454832699921,
              "num_responses": 7,
              "rvariance": 0.01872166113769757
            },
            {
              "id": "chat_hard_sample_91",
              "variance": 0.3655748251827531,
              "mean_reward": -1.491583547299496,
              "min_reward": -1.6195605900614922,
              "max_reward": -0.9770899814482381,
              "num_responses": 7,
              "rvariance": 0.04754852824530225
            },
            {
              "id": "chat_hard_sample_245",
              "variance": 0.36105038427702596,
              "mean_reward": -0.006920581520175118,
              "min_reward": -0.434157072760981,
              "max_reward": 0.1630691267950018,
              "num_responses": 7,
              "rvariance": 0.03624961161739015
            },
            {
              "id": "chat_hard_sample_131",
              "variance": 0.3664797133638985,
              "mean_reward": -0.723721290727518,
              "min_reward": -1.0042366268826008,
              "max_reward": -0.4884503636297067,
              "num_responses": 6,
              "rvariance": 0.026393382463475033
            },
            {
              "id": "chat_hard_sample_171",
              "variance": 0.2171731634749029,
              "mean_reward": -0.28032608196625813,
              "min_reward": -0.4613037181953438,
              "max_reward": -0.08125068211426388,
              "num_responses": 7,
              "rvariance": 0.011486911617284308
            },
            {
              "id": "chat_hard_sample_329",
              "variance": 0.28458733297023725,
              "mean_reward": 0.46439689111642946,
              "min_reward": 0.33952232211836036,
              "max_reward": 0.6403976423492154,
              "num_responses": 5,
              "rvariance": 0.016850141293421547
            },
            {
              "id": "chat_hard_sample_384",
              "variance": 0.7383887558146696,
              "mean_reward": 0.04995810415182324,
              "min_reward": -0.3165216092120753,
              "max_reward": 0.45715778566726606,
              "num_responses": 7,
              "rvariance": 0.1055871768975731
            },
            {
              "id": "chat_hard_sample_29",
              "variance": 0.8605486602693027,
              "mean_reward": 0.17438022905931969,
              "min_reward": -0.41605930913807243,
              "max_reward": 0.9480596239386611,
              "num_responses": 7,
              "rvariance": 0.1600754357338893
            },
            {
              "id": "chat_hard_sample_106",
              "variance": 0.5637453368536023,
              "mean_reward": 0.1317212148053209,
              "min_reward": -0.10839732754862674,
              "max_reward": 1.0023529148073866,
              "num_responses": 7,
              "rvariance": 0.13072565799310182
            },
            {
              "id": "chat_hard_sample_320",
              "variance": 1.3573322717181424,
              "mean_reward": -1.5139903022611925,
              "min_reward": -2.053906917011298,
              "max_reward": -0.5970369453671581,
              "num_responses": 6,
              "rvariance": 0.370071432293799
            },
            {
              "id": "chat_hard_sample_23",
              "variance": 0.7171238835577521,
              "mean_reward": 0.5067650484550601,
              "min_reward": -0.370814900080801,
              "max_reward": 1.0351551113739086,
              "num_responses": 7,
              "rvariance": 0.15924214794349703
            },
            {
              "id": "chat_hard_sample_235",
              "variance": 0.21174383438803024,
              "mean_reward": -0.6112566167851577,
              "min_reward": -0.9046989269566038,
              "max_reward": -0.4703526000067981,
              "num_responses": 7,
              "rvariance": 0.016209345750313905
            },
            {
              "id": "chat_hard_sample_202",
              "variance": 0.3945312469794069,
              "mean_reward": 2.986320251968739,
              "min_reward": 2.6696093885678387,
              "max_reward": 3.167297888197824,
              "num_responses": 7,
              "rvariance": 0.030015697769808065
            },
            {
              "id": "chat_hard_sample_304",
              "variance": 0.6117044104543097,
              "mean_reward": 0.6990537869484637,
              "min_reward": 0.25355794490954464,
              "max_reward": 1.0261062295624541,
              "num_responses": 7,
              "rvariance": 0.06866355102245325
            },
            {
              "id": "chat_hard_sample_277",
              "variance": 0.30087532023085495,
              "mean_reward": 0.4737474023215989,
              "min_reward": 0.23093574038090894,
              "max_reward": 0.6381354218963518,
              "num_responses": 6,
              "rvariance": 0.01784123509509637
            },
            {
              "id": "chat_hard_sample_196",
              "variance": 0.25879801980759265,
              "mean_reward": 0.1016660002172763,
              "min_reward": -0.09029956392571817,
              "max_reward": 0.44810890385581176,
              "num_responses": 7,
              "rvariance": 0.023493524938521974
            },
            {
              "id": "chat_hard_sample_185",
              "variance": 0.39272147061711604,
              "mean_reward": -0.12261699896662634,
              "min_reward": -0.3255704910235296,
              "max_reward": 0.26260682672099894,
              "num_responses": 7,
              "rvariance": 0.0347849217668592
            },
            {
              "id": "chat_hard_sample_160",
              "variance": 0.3474770615598446,
              "mean_reward": -0.913747808768058,
              "min_reward": -1.1671164994887782,
              "max_reward": -0.5698902999327953,
              "num_responses": 7,
              "rvariance": 0.029267059945463685
            },
            {
              "id": "chat_hard_sample_163",
              "variance": 0.41851078377976064,
              "mean_reward": 0.055236618541838235,
              "min_reward": -0.16269061841735244,
              "max_reward": 0.6381354218963518,
              "num_responses": 6,
              "rvariance": 0.07025782396241782
            },
            {
              "id": "chat_hard_sample_266",
              "variance": 0.42348766877606053,
              "mean_reward": -0.6125493141867941,
              "min_reward": -0.9046989269566038,
              "max_reward": -0.28032608196625813,
              "num_responses": 7,
              "rvariance": 0.03445405058556413
            },
            {
              "id": "chat_hard_sample_289",
              "variance": 0.6488048258812724,
              "mean_reward": -0.02340247339103828,
              "min_reward": -0.34366825464643813,
              "max_reward": 0.884717451258481,
              "num_responses": 7,
              "rvariance": 0.14916002888429644
            },
            {
              "id": "chat_hard_sample_69",
              "variance": 0.3643306039336782,
              "mean_reward": 1.3705696903047342,
              "min_reward": 1.1462866911208314,
              "max_reward": 1.8009167346682273,
              "num_responses": 7,
              "rvariance": 0.037980448193760605
            },
            {
              "id": "chat_hard_sample_40",
              "variance": 0.3094717579517363,
              "mean_reward": -1.2084828163411407,
              "min_reward": -1.384289662963681,
              "max_reward": -1.0313832723169638,
              "num_responses": 7,
              "rvariance": 0.016981378506669056
            },
            {
              "id": "chat_hard_sample_313",
              "variance": 0.4664698573804684,
              "mean_reward": 1.8230541776712492,
              "min_reward": 1.3631770770391263,
              "max_reward": 2.1221520389748543,
              "num_responses": 7,
              "rvariance": 0.04986624536010952
            },
            {
              "id": "chat_hard_sample_226",
              "variance": 0.5972261995559829,
              "mean_reward": -1.1270428800380519,
              "min_reward": -1.4566807174553151,
              "max_reward": -0.4522548363838896,
              "num_responses": 7,
              "rvariance": 0.09872327095227262
            },
            {
              "id": "chat_hard_sample_28",
              "variance": 0.5293595859700757,
              "mean_reward": 0.4031876691489495,
              "min_reward": 0.05448254505755039,
              "max_reward": 0.6177754378205796,
              "num_responses": 7,
              "rvariance": 0.04743677566828656
            },
            {
              "id": "chat_hard_sample_323",
              "variance": 0.30494731704600947,
              "mean_reward": 0.08841585185050395,
              "min_reward": -0.045055154868446745,
              "max_reward": 0.38476673117563176,
              "num_responses": 4,
              "rvariance": 0.02974884932656032
            },
            {
              "id": "chat_hard_sample_116",
              "variance": 0.7347692030900881,
              "mean_reward": 1.697177768186912,
              "min_reward": 0.7716064286153025,
              "max_reward": 2.031663220860312,
              "num_responses": 7,
              "rvariance": 0.16085540605646237
            },
            {
              "id": "chat_hard_sample_36",
              "variance": 0.31190364493856493,
              "mean_reward": 1.0015045821375625,
              "min_reward": 0.7535086649923939,
              "max_reward": 1.212173861810483,
              "num_responses": 7,
              "rvariance": 0.01887429548533506
            },
            {
              "id": "chat_hard_sample_351",
              "variance": 0.33480862702380854,
              "mean_reward": -0.4884503636297067,
              "min_reward": -0.7870634634076981,
              "max_reward": -0.34366825464643813,
              "num_responses": 7,
              "rvariance": 0.023207772554676234
            },
            {
              "id": "chat_hard_sample_296",
              "variance": 0.2940886588722642,
              "mean_reward": -0.7297538786018211,
              "min_reward": -0.9137478087680581,
              "max_reward": -0.5879880635557039,
              "num_responses": 6,
              "rvariance": 0.016012531242921773
            },
            {
              "id": "chat_hard_sample_338",
              "variance": 0.20518339507472594,
              "mean_reward": 0.8166892504973694,
              "min_reward": 0.7150509172937132,
              "max_reward": 1.0023529148073866,
              "num_responses": 7,
              "rvariance": 0.008908508117214237
            },
            {
              "id": "chat_hard_sample_354",
              "variance": 0.5094520459848761,
              "mean_reward": 1.6237363970564485,
              "min_reward": 1.3083182310571848,
              "max_reward": 1.918552198217133,
              "num_responses": 7,
              "rvariance": 0.04309389558567485
            },
            {
              "id": "chat_hard_sample_186",
              "variance": 0.3891019178925341,
              "mean_reward": -1.2093446146088982,
              "min_reward": -1.4566807174553151,
              "max_reward": -0.9861388632596924,
              "num_responses": 6,
              "rvariance": 0.028021929675113105
            },
            {
              "id": "chat_hard_sample_54",
              "variance": 0.30313754068371856,
              "mean_reward": 0.6239157504783522,
              "min_reward": 0.46620666747872036,
              "max_reward": 0.8304241603897553,
              "num_responses": 7,
              "rvariance": 0.016181564268551125
            },
            {
              "id": "chat_hard_sample_241",
              "variance": 0.44882453784813237,
              "mean_reward": -2.3408857401745626,
              "min_reward": -2.6149375893214635,
              "max_reward": -2.144395735125841,
              "num_responses": 7,
              "rvariance": 0.03494534415779012
            },
            {
              "id": "chat_hard_sample_67",
              "variance": 0.42891699786293314,
              "mean_reward": 0.5240548762019459,
              "min_reward": 0.26260682672099894,
              "max_reward": 0.805539735408256,
              "num_responses": 7,
              "rvariance": 0.03572385229711256
            },
            {
              "id": "chat_hard_sample_262",
              "variance": 0.46601741328989565,
              "mean_reward": 0.13592248136063895,
              "min_reward": -0.12649509117153532,
              "max_reward": 0.38024229026990464,
              "num_responses": 7,
              "rvariance": 0.03312137499423678
            },
            {
              "id": "chat_hard_sample_244",
              "variance": 0.16378476078732257,
              "mean_reward": -0.010152325024265937,
              "min_reward": -0.18983726385171532,
              "max_reward": 0.06353142686900468,
              "num_responses": 7,
              "rvariance": 0.006636640891481615
            },
            {
              "id": "chat_hard_sample_85",
              "variance": 0.7139567749237432,
              "mean_reward": 0.1556361167355929,
              "min_reward": -0.2622283183433496,
              "max_reward": 0.7625575468038481,
              "num_responses": 7,
              "rvariance": 0.09779478458809553
            },
            {
              "id": "chat_hard_sample_398",
              "variance": 0.41262901060231516,
              "mean_reward": -1.9841012573229364,
              "min_reward": -2.307275607732018,
              "max_reward": -1.7100494081760351,
              "num_responses": 7,
              "rvariance": 0.03503892388583317
            },
            {
              "id": "chat_hard_sample_319",
              "variance": 0.5356938032380937,
              "mean_reward": -0.31328986570798445,
              "min_reward": -0.5427436544984324,
              "max_reward": 0.10425139502054895,
              "num_responses": 7,
              "rvariance": 0.05082966745981167
            },
            {
              "id": "chat_hard_sample_190",
              "variance": 0.3121864224951729,
              "mean_reward": -0.9122396617994823,
              "min_reward": -1.0856765631856895,
              "max_reward": -0.6603791180473381,
              "num_responses": 6,
              "rvariance": 0.019308292289937926
            },
            {
              "id": "chat_hard_sample_20",
              "variance": 0.5192927049548328,
              "mean_reward": 0.7923299838352849,
              "min_reward": 0.5069266356302646,
              "max_reward": 1.2367755092353743,
              "num_responses": 7,
              "rvariance": 0.05234210999592429
            },
            {
              "id": "chat_hard_sample_264",
              "variance": 0.4741614069202046,
              "mean_reward": -0.15299538790508,
              "min_reward": -0.47940148181825243,
              "max_reward": 0.25808238581527176,
              "num_responses": 7,
              "rvariance": 0.04904998156042153
            },
            {
              "id": "chat_hard_sample_27",
              "variance": 0.48140051236936793,
              "mean_reward": -0.4638891129986165,
              "min_reward": -0.7056235271046095,
              "max_reward": -0.15364173660589817,
              "num_responses": 7,
              "rvariance": 0.03927340657978118
            },
            {
              "id": "chat_hard_sample_115",
              "variance": 0.3728139306319166,
              "mean_reward": -0.6552083284407928,
              "min_reward": -0.8504056360878781,
              "max_reward": -0.3798637818922553,
              "num_responses": 7,
              "rvariance": 0.02767286243558745
            },
            {
              "id": "chat_hard_sample_260",
              "variance": 0.5791284359330742,
              "mean_reward": -0.7948196478175161,
              "min_reward": -1.5652672991927665,
              "max_reward": -0.4703526000067981,
              "num_responses": 7,
              "rvariance": 0.11153366729473724
            },
            {
              "id": "chat_hard_sample_175",
              "variance": 0.7818233885096502,
              "mean_reward": -0.04764054967171939,
              "min_reward": -0.8685033997107866,
              "max_reward": 0.4209622584214489,
              "num_responses": 7,
              "rvariance": 0.1468374552322637
            },
            {
              "id": "chat_hard_sample_200",
              "variance": 0.47235163055791385,
              "mean_reward": -1.9136492489337567,
              "min_reward": -2.1624934987487494,
              "max_reward": -1.5652672991927665,
              "num_responses": 4,
              "rvariance": 0.05115594320803321
            },
            {
              "id": "chat_hard_sample_240",
              "variance": 0.43977565603667834,
              "mean_reward": -1.6421827945901282,
              "min_reward": -1.9091248080280294,
              "max_reward": -1.420485190209498,
              "num_responses": 4,
              "rvariance": 0.04362277510056773
            },
            {
              "id": "chat_hard_sample_130",
              "variance": 0.48502006509394957,
              "mean_reward": -0.48327957402316146,
              "min_reward": -0.7599168179733352,
              "max_reward": -0.17173950022880674,
              "num_responses": 7,
              "rvariance": 0.041475872321937224
            },
            {
              "id": "chat_hard_sample_374",
              "variance": 0.26535845912089706,
              "mean_reward": 1.2163751283658009,
              "min_reward": 0.8507841444655274,
              "max_reward": 1.3462104236426495,
              "num_responses": 7,
              "rvariance": 0.024241888603506876
            },
            {
              "id": "chat_hard_sample_257",
              "variance": 0.7030981167499979,
              "mean_reward": -0.04117706266353776,
              "min_reward": -0.497499245441161,
              "max_reward": 0.24903350400381752,
              "num_responses": 7,
              "rvariance": 0.08688543535482691
            },
            {
              "id": "chat_hard_sample_237",
              "variance": 0.3809579242622254,
              "mean_reward": 0.821375278578301,
              "min_reward": 0.5340732810646275,
              "max_reward": 1.021581788656727,
              "num_responses": 7,
              "rvariance": 0.02925134147551895
            },
            {
              "id": "chat_hard_sample_22",
              "variance": 0.7503785242148465,
              "mean_reward": 0.31757878372558374,
              "min_reward": -0.1355439729829896,
              "max_reward": 0.8858485614849128,
              "num_responses": 5,
              "rvariance": 0.12209443621871192
            },
            {
              "id": "chat_hard_sample_292",
              "variance": 0.43977565603667834,
              "mean_reward": -1.0456029437349634,
              "min_reward": -1.5109740083240408,
              "max_reward": -0.7780145815962438,
              "num_responses": 7,
              "rvariance": 0.048026453284950685
            },
            {
              "id": "chat_hard_sample_92",
              "variance": 0.4083307917418746,
              "mean_reward": 0.5857273147383456,
              "min_reward": 0.30785123577827034,
              "max_reward": 0.8213752785783011,
              "num_responses": 6,
              "rvariance": 0.030539382762656626
            },
            {
              "id": "chat_hard_sample_407",
              "variance": 0.4379658796743874,
              "mean_reward": -0.3690051237185102,
              "min_reward": -0.6513302362358838,
              "max_reward": -0.07220180030280961,
              "num_responses": 5,
              "rvariance": 0.03875978755815061
            },
            {
              "id": "chat_hard_sample_44",
              "variance": 0.4207730042326242,
              "mean_reward": -0.2954075516520153,
              "min_reward": -0.5336947726869781,
              "max_reward": -0.017908509434083893,
              "num_responses": 6,
              "rvariance": 0.033862864367133434
            },
            {
              "id": "chat_hard_sample_119",
              "variance": 0.6175861836317549,
              "mean_reward": 0.18976332813879196,
              "min_reward": -0.34366825464643813,
              "max_reward": 0.5951532332919439,
              "num_responses": 5,
              "rvariance": 0.0932483388311169
            },
            {
              "id": "chat_hard_sample_303",
              "variance": 0.42710722150064234,
              "mean_reward": -0.12003160416335369,
              "min_reward": -0.3798637818922553,
              "max_reward": 0.3349978812126332,
              "num_responses": 7,
              "rvariance": 0.044958375058396415
            },
            {
              "id": "chat_hard_sample_365",
              "variance": 0.3366184033860994,
              "mean_reward": -0.3255704910235296,
              "min_reward": -0.497499245441161,
              "max_reward": -0.08125068211426388,
              "num_responses": 5,
              "rvariance": 0.024007879229444307
            },
            {
              "id": "chat_hard_sample_45",
              "variance": 0.45289653466328694,
              "mean_reward": 0.4704079340340384,
              "min_reward": 0.1721180086064561,
              "max_reward": 0.7783930899738931,
              "num_responses": 7,
              "rvariance": 0.03538253694974126
            },
            {
              "id": "chat_hard_sample_78",
              "variance": 0.4642076369276048,
              "mean_reward": -0.6988368657460188,
              "min_reward": -1.0042366268826008,
              "max_reward": -0.4613037181953438,
              "num_responses": 4,
              "rvariance": 0.04783459395413027
            },
            {
              "id": "chat_hard_sample_189",
              "variance": 0.15971276397216813,
              "mean_reward": -0.04166182418915139,
              "min_reward": -0.17173950022880674,
              "max_reward": 0.02733589962318753,
              "num_responses": 4,
              "rvariance": 0.006462301649254095
            },
            {
              "id": "chat_hard_sample_39",
              "variance": 1.3908131344205237,
              "mean_reward": 0.6069167796468344,
              "min_reward": -0.18078838204026101,
              "max_reward": 1.8190144982911358,
              "num_responses": 5,
              "rvariance": 0.4563101945930357
            },
            {
              "id": "chat_hard_sample_387",
              "variance": 0.40810456969658826,
              "mean_reward": -0.006920581520175114,
              "min_reward": -0.2531794365318953,
              "max_reward": 0.19021577222936464,
              "num_responses": 7,
              "rvariance": 0.029856946445449332
            },
            {
              "id": "chat_hard_sample_118",
              "variance": 0.3947574690246931,
              "mean_reward": 0.6283324666006096,
              "min_reward": 0.06805586777473181,
              "max_reward": 0.8010152945025288,
              "num_responses": 6,
              "rvariance": 0.06386588988210234
            },
            {
              "id": "chat_hard_sample_154",
              "variance": 0.5447426850495479,
              "mean_reward": -0.26998450275316754,
              "min_reward": -0.6332324726129752,
              "max_reward": -0.045055154868446745,
              "num_responses": 7,
              "rvariance": 0.05243806903555158
            },
            {
              "id": "chat_hard_sample_103",
              "variance": 0.6298021740772184,
              "mean_reward": -0.26352101574498593,
              "min_reward": -0.624183590801521,
              "max_reward": 0.19021577222936464,
              "num_responses": 7,
              "rvariance": 0.08109686074873544
            },
            {
              "id": "chat_hard_sample_162",
              "variance": 0.5746039950273472,
              "mean_reward": 0.016024797358869684,
              "min_reward": -0.2531794365318953,
              "max_reward": 0.44358446295008463,
              "num_responses": 4,
              "rvariance": 0.07743503168074733
            },
            {
              "id": "chat_hard_sample_321",
              "variance": 0.5628404486724565,
              "mean_reward": -0.668135302457156,
              "min_reward": -0.9861388632596924,
              "max_reward": -0.3798637818922553,
              "num_responses": 7,
              "rvariance": 0.04740815865323768
            },
            {
              "id": "chat_hard_sample_273",
              "variance": 0.12329101468106463,
              "mean_reward": 1.3158320347041956,
              "min_reward": 1.2806060305096059,
              "max_reward": 1.4038970451906705,
              "num_responses": 7,
              "rvariance": 0.0031021784287931617
            },
            {
              "id": "chat_hard_sample_291",
              "variance": 0.16107009624388635,
              "mean_reward": 0.5890129206341713,
              "min_reward": 0.5069266356302646,
              "max_reward": 0.726362019558031,
              "num_responses": 7,
              "rvariance": 0.005633374298198656
            },
            {
              "id": "chat_hard_sample_312",
              "variance": 0.7420083085392513,
              "mean_reward": -1.4321194668242252,
              "min_reward": -1.9815158625196636,
              "max_reward": -0.9951877450711466,
              "num_responses": 7,
              "rvariance": 0.10487279593795874
            },
            {
              "id": "chat_hard_sample_314",
              "variance": 0.6761211378495997,
              "mean_reward": 0.6557618895915804,
              "min_reward": 0.3123756766839975,
              "max_reward": 1.0809650755443958,
              "num_responses": 6,
              "rvariance": 0.08266935705846407
            },
            {
              "id": "chat_hard_sample_399",
              "variance": 0.30087532023085506,
              "mean_reward": 0.717636312096986,
              "min_reward": 0.49787775381881033,
              "max_reward": 0.8666196876355724,
              "num_responses": 7,
              "rvariance": 0.015030408283628702
            },
            {
              "id": "chat_hard_sample_219",
              "variance": 0.28775444160424624,
              "mean_reward": -0.09223861002817266,
              "min_reward": -0.28937496377771244,
              "max_reward": 0.049958104151823245,
              "num_responses": 7,
              "rvariance": 0.01339276304287534
            },
            {
              "id": "chat_hard_sample_406",
              "variance": 0.28684955342310087,
              "mean_reward": 0.18439863392200118,
              "min_reward": 0.03186034052891468,
              "max_reward": 0.3757178493641775,
              "num_responses": 7,
              "rvariance": 0.013614179363691482
            },
            {
              "id": "chat_hard_sample_253",
              "variance": 0.5854626532010923,
              "mean_reward": 0.30526584097499765,
              "min_reward": -0.017908509434083893,
              "max_reward": 0.7195753581994403,
              "num_responses": 7,
              "rvariance": 0.061978188096226024
            },
            {
              "id": "chat_hard_sample_24",
              "variance": 0.19681317939913068,
              "mean_reward": 0.2588364592995596,
              "min_reward": 0.14497136317209322,
              "max_reward": 0.42548669932717603,
              "num_responses": 6,
              "rvariance": 0.007986363682771176
            },
            {
              "id": "chat_hard_sample_60",
              "variance": 0.5139764868906035,
              "mean_reward": -0.553085233711523,
              "min_reward": -0.8594545178993324,
              "max_reward": -0.1445928547944439,
              "num_responses": 7,
              "rvariance": 0.05264862342364844
            },
            {
              "id": "chat_hard_sample_386",
              "variance": 0.7058127812934342,
              "mean_reward": 0.10500546850483682,
              "min_reward": -0.39796154551516383,
              "max_reward": 0.49787775381881033,
              "num_responses": 6,
              "rvariance": 0.09371709203620975
            },
            {
              "id": "chat_hard_sample_216",
              "variance": 0.3981507997039886,
              "mean_reward": -2.497302125772558,
              "min_reward": -2.723524171058915,
              "max_reward": -2.2891778441091093,
              "num_responses": 6,
              "rvariance": 0.027703498656077737
            },
            {
              "id": "chat_hard_sample_300",
              "variance": 0.36650799111955923,
              "mean_reward": 1.4852460887077064,
              "min_reward": 1.153285435646878,
              "max_reward": 1.6470857438735045,
              "num_responses": 7,
              "rvariance": 0.027560673121080164
            },
            {
              "id": "chat_hard_sample_352",
              "variance": 0.2759908952493557,
              "mean_reward": 0.5024021947245375,
              "min_reward": 0.33952232211836036,
              "max_reward": 0.6517087446135332,
              "num_responses": 6,
              "rvariance": 0.012944220923788045
            },
            {
              "id": "chat_hard_sample_311",
              "variance": 0.5031178287168583,
              "mean_reward": -1.2795811734311384,
              "min_reward": -1.6014628264385837,
              "max_reward": -0.7780145815962438,
              "num_responses": 7,
              "rvariance": 0.05890509666995515
            },
            {
              "id": "chat_hard_sample_419",
              "variance": 0.338315068725747,
              "mean_reward": 1.2483693890563001,
              "min_reward": 1.0645639772611348,
              "max_reward": 1.4887303121730544,
              "num_responses": 7,
              "rvariance": 0.02268741809034311
            },
            {
              "id": "chat_hard_sample_287",
              "variance": 0.2207927161994846,
              "mean_reward": -1.0688714969644173,
              "min_reward": -1.2576053176033208,
              "max_reward": -0.9499433360138753,
              "num_responses": 7,
              "rvariance": 0.009251024543684302
            },
            {
              "id": "chat_hard_sample_55",
              "variance": 0.745627861263833,
              "mean_reward": 0.0228114587174604,
              "min_reward": -0.5336947726869781,
              "max_reward": 0.3530956448355418,
              "num_responses": 7,
              "rvariance": 0.1029318521143516
            }
          ]
        },
        "semantic_benchmark_reasoning_filtered.json": {
          "file_name": "semantic_benchmark_reasoning_filtered.json",
          "processed_samples": 200,
          "global_mean": 6.004902469555153,
          "global_std": 6.809761933080696,
          "mean_variance": 0.8280490492830316,
          "mean_rvariance": 0.23377047191600775,
          "sample_results": [
            {
              "id": "reasoning_sample_9",
              "variance": 1.9269212534811393,
              "mean_reward": -2.2525260079793936,
              "min_reward": -3.01110415768659,
              "max_reward": -0.8456696102076364,
              "num_responses": 7,
              "rvariance": 0.6857859264684685
            },
            {
              "id": "reasoning_sample_5",
              "variance": 1.476740317623793,
              "mean_reward": -1.1039156057771795,
              "min_reward": -1.6206370469345415,
              "max_reward": 0.7518761420384258,
              "num_responses": 5,
              "rvariance": 0.8639432140096577
            },
            {
              "id": "reasoning_sample_85",
              "variance": 0.435496134687688,
              "mean_reward": -1.4864087862431308,
              "min_reward": -1.7674850586311273,
              "max_reward": -1.2741675193379087,
              "num_responses": 4,
              "rvariance": 0.042898345093351484
            },
            {
              "id": "reasoning_sample_65",
              "variance": 0.5587107945018545,
              "mean_reward": -0.8829347515686982,
              "min_reward": -1.2374555164137624,
              "max_reward": -0.5032154579308324,
              "num_responses": 7,
              "rvariance": 0.05389370323537457
            },
            {
              "id": "reasoning_sample_256",
              "variance": 1.36568650877825,
              "mean_reward": 0.8574231504453469,
              "min_reward": 0.29297610548659464,
              "max_reward": 2.1652882546180656,
              "num_responses": 4,
              "rvariance": 0.580573485535474
            },
            {
              "id": "reasoning_sample_263",
              "variance": 0.9246835736519398,
              "mean_reward": 0.3189804408911984,
              "min_reward": -0.23475893654801122,
              "max_reward": 1.0180381632384878,
              "num_responses": 6,
              "rvariance": 0.17924420458550247
            },
            {
              "id": "reasoning_sample_203",
              "variance": 0.6149260489794539,
              "mean_reward": 0.988974494256872,
              "min_reward": 0.6784521361901328,
              "max_reward": 1.2933781851695867,
              "num_responses": 6,
              "rvariance": 0.06742833590335266
            },
            {
              "id": "reasoning_sample_61",
              "variance": 1.4739869174044826,
              "mean_reward": -1.7347064845917106,
              "min_reward": -2.423712110900246,
              "max_reward": 0.44900211791421724,
              "num_responses": 7,
              "rvariance": 0.8468481121382085
            },
            {
              "id": "reasoning_sample_319",
              "variance": 0.8982968215502096,
              "mean_reward": -0.21602051838881142,
              "min_reward": -1.2971125211655004,
              "max_reward": 0.23790810110037489,
              "num_responses": 6,
              "rvariance": 0.2515495826298676
            },
            {
              "id": "reasoning_sample_528",
              "variance": 0.9577243762836718,
              "mean_reward": -0.09708892558246186,
              "min_reward": -0.5032154579308324,
              "max_reward": 0.8620121508108652,
              "num_responses": 7,
              "rvariance": 0.21376011587154084
            },
            {
              "id": "reasoning_sample_551",
              "variance": 0.7966504634539788,
              "mean_reward": 0.7407314268650241,
              "min_reward": 0.0038690824589409905,
              "max_reward": 1.183242176397147,
              "num_responses": 7,
              "rvariance": 0.13156326614934283
            },
            {
              "id": "reasoning_sample_596",
              "variance": 1.0921820869933587,
              "mean_reward": -0.28884358371304847,
              "min_reward": -0.8267399836998734,
              "max_reward": 1.063928166893671,
              "num_responses": 7,
              "rvariance": 0.35170788917908075
            },
            {
              "id": "reasoning_sample_456",
              "variance": 1.0701548852388703,
              "mean_reward": 0.46735811937629046,
              "min_reward": -0.21181393472041965,
              "max_reward": 1.1281741720109273,
              "num_responses": 4,
              "rvariance": 0.2487901323267471
            },
            {
              "id": "reasoning_sample_306",
              "variance": 1.2683997010292611,
              "mean_reward": 0.5296374100511818,
              "min_reward": -0.569755963230848,
              "max_reward": 1.1281741720109273,
              "num_responses": 7,
              "rvariance": 0.3293607173600005
            },
            {
              "id": "reasoning_sample_231",
              "variance": 0.8489650676208877,
              "mean_reward": 0.6122394166305114,
              "min_reward": 0.045170085748605794,
              "max_reward": 1.0180381632384878,
              "num_responses": 7,
              "rvariance": 0.12247784449916052
            },
            {
              "id": "reasoning_sample_526",
              "variance": 0.810188014532258,
              "mean_reward": 0.01465323331790902,
              "min_reward": -0.6535052199015572,
              "max_reward": 0.4214681157211074,
              "num_responses": 5,
              "rvariance": 0.14400913771812293
            },
            {
              "id": "reasoning_sample_591",
              "variance": 1.1580342422385461,
              "mean_reward": 0.08807723916620203,
              "min_reward": -0.5938482151498191,
              "max_reward": 1.0363941647005612,
              "num_responses": 5,
              "rvariance": 0.2987311608447392
            },
            {
              "id": "reasoning_sample_23",
              "variance": 2.4751920721514393,
              "mean_reward": 0.07418595264308103,
              "min_reward": -1.159442510199951,
              "max_reward": 1.7431002209903812,
              "num_responses": 6,
              "rvariance": 1.3146363785202448
            },
            {
              "id": "reasoning_sample_275",
              "variance": 1.1128325886381907,
              "mean_reward": 0.6425049666602393,
              "min_reward": 0.21496309927278334,
              "max_reward": 1.8532362297628207,
              "num_responses": 6,
              "rvariance": 0.3422104456149218
            },
            {
              "id": "reasoning_sample_656",
              "variance": 1.1545924919644075,
              "mean_reward": 2.004673241824925,
              "min_reward": 1.4677601990592823,
              "max_reward": 3.101444329183801,
              "num_responses": 4,
              "rvariance": 0.41214420854636574
            },
            {
              "id": "reasoning_sample_405",
              "variance": 0.8393568481055838,
              "mean_reward": -0.4350018795808884,
              "min_reward": -0.8086707947606451,
              "max_reward": 0.504070122300437,
              "num_responses": 6,
              "rvariance": 0.20046391574711128
            },
            {
              "id": "reasoning_sample_330",
              "variance": 1.0787018984196481,
              "mean_reward": 0.2592278319651787,
              "min_reward": -0.8135466076490083,
              "max_reward": 0.7426981413073892,
              "num_responses": 6,
              "rvariance": 0.28580386994651524
            },
            {
              "id": "reasoning_sample_451",
              "variance": 1.8154085445990442,
              "mean_reward": 0.4686692623378671,
              "min_reward": -0.20263593398938304,
              "max_reward": 1.7614562224524544,
              "num_responses": 7,
              "rvariance": 0.58623661709103
            },
            {
              "id": "reasoning_sample_314",
              "variance": 0.7516782598718994,
              "mean_reward": 0.4191736155383482,
              "min_reward": -0.2668819391066394,
              "max_reward": 0.7243421398453159,
              "num_responses": 4,
              "rvariance": 0.16372787212691528
            },
            {
              "id": "reasoning_sample_593",
              "variance": 1.1812086940844133,
              "mean_reward": -0.05257562203693426,
              "min_reward": -0.6523579698101776,
              "max_reward": 0.990504161045378,
              "num_responses": 5,
              "rvariance": 0.32666519223355406
            },
            {
              "id": "reasoning_sample_599",
              "variance": 0.688579504846023,
              "mean_reward": -0.010307650813106662,
              "min_reward": -0.7515951027145111,
              "max_reward": 0.8528341500798287,
              "num_responses": 7,
              "rvariance": 0.18605133922565992
            },
            {
              "id": "reasoning_sample_301",
              "variance": 0.4935469893114945,
              "mean_reward": -0.3936530742040828,
              "min_reward": -1.0189043740059527,
              "max_reward": 0.04975908611412411,
              "num_responses": 7,
              "rvariance": 0.08659815148189957
            },
            {
              "id": "reasoning_sample_77",
              "variance": 0.6584068274427399,
              "mean_reward": -1.4156480395355402,
              "min_reward": -1.92351107105875,
              "max_reward": -0.8144070452175429,
              "num_responses": 7,
              "rvariance": 0.10094883808061263
            },
            {
              "id": "reasoning_sample_511",
              "variance": 0.8191365652450191,
              "mean_reward": -0.09905564002482688,
              "min_reward": -0.43667495263081696,
              "max_reward": 1.28420018443855,
              "num_responses": 7,
              "rvariance": 0.3284988056703392
            },
            {
              "id": "reasoning_sample_12",
              "variance": 1.1352039654200925,
              "mean_reward": -0.6865842642030017,
              "min_reward": -1.3934815288413849,
              "max_reward": 0.09106008940378892,
              "num_responses": 6,
              "rvariance": 0.25129106239703375
            },
            {
              "id": "reasoning_sample_543",
              "variance": 1.1210927892961238,
              "mean_reward": -0.32989874769741767,
              "min_reward": -0.735533601435197,
              "max_reward": 0.7059861383832426,
              "num_responses": 7,
              "rvariance": 0.2698712840538003
            },
            {
              "id": "reasoning_sample_506",
              "variance": 1.009580080414029,
              "mean_reward": 0.08778223199984724,
              "min_reward": -0.4183189511687437,
              "max_reward": 1.183242176397147,
              "num_responses": 7,
              "rvariance": 0.26224807431131714
            },
            {
              "id": "reasoning_sample_531",
              "variance": 0.767280861114662,
              "mean_reward": 0.7374535694610825,
              "min_reward": 0.2654421032934848,
              "max_reward": 1.137352172741964,
              "num_responses": 7,
              "rvariance": 0.10543558763462275
            },
            {
              "id": "reasoning_sample_274",
              "variance": 0.3276546260980075,
              "mean_reward": 0.26085310292796643,
              "min_reward": 0.0864710890382706,
              "max_reward": 0.4214681157211074,
              "num_responses": 5,
              "rvariance": 0.021286360737758254
            },
            {
              "id": "reasoning_sample_597",
              "variance": 1.264728500736847,
              "mean_reward": 0.26281981737033144,
              "min_reward": -0.21181393472041965,
              "max_reward": 1.1465301734730007,
              "num_responses": 7,
              "rvariance": 0.32771812126033184
            },
            {
              "id": "reasoning_sample_73",
              "variance": 1.194057895107865,
              "mean_reward": -1.4298657460251374,
              "min_reward": -2.22179609481744,
              "max_reward": 0.17825109634863684,
              "num_responses": 7,
              "rvariance": 0.49266365047761507
            },
            {
              "id": "reasoning_sample_412",
              "variance": 1.404807736894293,
              "mean_reward": -1.2487368089789948,
              "min_reward": -1.7353620560724992,
              "max_reward": 0.41229011499007073,
              "num_responses": 6,
              "rvariance": 0.6069850693001906
            },
            {
              "id": "reasoning_sample_491",
              "variance": 0.9962719793540256,
              "mean_reward": -0.011045168728993526,
              "min_reward": -0.798058731415384,
              "max_reward": 0.7426981413073892,
              "num_responses": 7,
              "rvariance": 0.202032175267061
            },
            {
              "id": "reasoning_sample_64",
              "variance": 0.6612749526711887,
              "mean_reward": -1.5454102195140804,
              "min_reward": -1.9418670725208231,
              "max_reward": -1.1215832571844249,
              "num_responses": 7,
              "rvariance": 0.0793244016958641
            },
            {
              "id": "reasoning_sample_535",
              "variance": 0.8076640643312228,
              "mean_reward": 1.2612551826109584,
              "min_reward": 0.6325621325349498,
              "max_reward": 1.8715922312248938,
              "num_responses": 6,
              "rvariance": 0.14047004508748198
            },
            {
              "id": "reasoning_sample_548",
              "variance": 0.701199255851198,
              "mean_reward": 0.6115838451497232,
              "min_reward": -0.09249992521694356,
              "max_reward": 1.0822841683557443,
              "num_responses": 7,
              "rvariance": 0.1171529450551795
            },
            {
              "id": "reasoning_sample_235",
              "variance": 0.8471294674746803,
              "mean_reward": 0.7748211438660173,
              "min_reward": 0.25167510219692985,
              "max_reward": 1.357624190286843,
              "num_responses": 5,
              "rvariance": 0.14508756523432847
            },
            {
              "id": "reasoning_sample_156",
              "variance": 0.6057480482484171,
              "mean_reward": 0.54996012595562,
              "min_reward": 0.3021541062176313,
              "max_reward": 1.28420018443855,
              "num_responses": 6,
              "rvariance": 0.11453246992390965
            },
            {
              "id": "reasoning_sample_587",
              "variance": 1.4360129393798184,
              "mean_reward": -0.49108738553624837,
              "min_reward": -1.1032272557223517,
              "max_reward": 1.5411842049075755,
              "num_responses": 7,
              "rvariance": 0.7395642960406728
            },
            {
              "id": "reasoning_sample_594",
              "variance": 0.627775250002905,
              "mean_reward": 0.5099702656275319,
              "min_reward": 0.17825109634863684,
              "max_reward": 0.9354361566591582,
              "num_responses": 7,
              "rvariance": 0.07043737445293183
            },
            {
              "id": "reasoning_sample_622",
              "variance": 0.8205132653546746,
              "mean_reward": 1.0796618824325908,
              "min_reward": 0.7243421398453159,
              "max_reward": 2.403916273625018,
              "num_responses": 7,
              "rvariance": 0.3020141998765048
            },
            {
              "id": "reasoning_sample_647",
              "variance": 2.0417609876282348,
              "mean_reward": 0.12696901726396967,
              "min_reward": -0.9408913677921414,
              "max_reward": 2.110220250231846,
              "num_responses": 5,
              "rvariance": 1.1077188479163678
            },
            {
              "id": "reasoning_sample_395",
              "variance": 0.7191106979028616,
              "mean_reward": -0.2365993169029326,
              "min_reward": -0.9066172713121765,
              "max_reward": 0.08188208867275229,
              "num_responses": 6,
              "rvariance": 0.11764857662403423
            },
            {
              "id": "reasoning_sample_252",
              "variance": 0.9935185791347145,
              "mean_reward": 0.754170642221185,
              "min_reward": -0.02366491973416888,
              "max_reward": 1.7431002209903812,
              "num_responses": 6,
              "rvariance": 0.2708721694230415
            },
            {
              "id": "reasoning_sample_497",
              "variance": 0.7158840570208567,
              "mean_reward": 0.8567675789645587,
              "min_reward": 0.5132481230314736,
              "max_reward": 1.2291321800523303,
              "num_responses": 7,
              "rvariance": 0.07638630569615905
            },
            {
              "id": "reasoning_sample_87",
              "variance": 0.08799408200881353,
              "mean_reward": -1.0057109979550876,
              "min_reward": -1.0825767540775193,
              "max_reward": -0.966704494848182,
              "num_responses": 7,
              "rvariance": 0.0014759109528788472
            },
            {
              "id": "reasoning_sample_299",
              "variance": 1.5868763263962322,
              "mean_reward": 0.9960765186320789,
              "min_reward": -1.4026595295724216,
              "max_reward": 1.945016237073187,
              "num_responses": 7,
              "rvariance": 1.02643582550454
            },
            {
              "id": "reasoning_sample_303",
              "variance": 0.6020768479560025,
              "mean_reward": 0.645411333558401,
              "min_reward": 0.357222110603851,
              "max_reward": 1.2015981778592204,
              "num_responses": 5,
              "rvariance": 0.09085999266393179
            },
            {
              "id": "reasoning_sample_509",
              "variance": 1.7963641930821432,
              "mean_reward": -0.07922460273097989,
              "min_reward": -1.1686205109309877,
              "max_reward": 0.6876301369211695,
              "num_responses": 7,
              "rvariance": 0.6024371079205826
            },
            {
              "id": "reasoning_sample_572",
              "variance": 1.0536344839230045,
              "mean_reward": 0.30149853473684285,
              "min_reward": -0.17051293143075485,
              "max_reward": 1.2658441829764766,
              "num_responses": 7,
              "rvariance": 0.23482161887006664
            },
            {
              "id": "reasoning_sample_557",
              "variance": 0.8911838709836563,
              "mean_reward": 0.21037409890726502,
              "min_reward": -0.14756792960316328,
              "max_reward": 0.8344781486177554,
              "num_responses": 7,
              "rvariance": 0.13963270214290116
            },
            {
              "id": "reasoning_sample_678",
              "variance": 0.6525558519767041,
              "mean_reward": 0.3827893983545958,
              "min_reward": 0.1277720923279354,
              "max_reward": 1.1189961712798908,
              "num_responses": 7,
              "rvariance": 0.1116294900387111
            },
            {
              "id": "reasoning_sample_53",
              "variance": 0.24964161988419614,
              "mean_reward": -0.5094433869983216,
              "min_reward": -0.7693774791308945,
              "max_reward": -0.28982694093423095,
              "num_responses": 7,
              "rvariance": 0.017287442912382125
            },
            {
              "id": "reasoning_sample_75",
              "variance": 2.5078886997557577,
              "mean_reward": -0.5793163806590111,
              "min_reward": -2.2860420999346966,
              "max_reward": 0.7977661456936089,
              "num_responses": 6,
              "rvariance": 1.2208427331877996
            },
            {
              "id": "reasoning_sample_595",
              "variance": 1.1858550569545008,
              "mean_reward": -0.4232808078139604,
              "min_reward": -1.020625249143022,
              "max_reward": 0.48571412083836374,
              "num_responses": 5,
              "rvariance": 0.2936910133129297
            },
            {
              "id": "reasoning_sample_245",
              "variance": 0.6461312514649784,
              "mean_reward": 0.21404529919967966,
              "min_reward": -0.046609921561760435,
              "max_reward": 0.8987241537350118,
              "num_responses": 5,
              "rvariance": 0.12328231260046978
            },
            {
              "id": "reasoning_sample_418",
              "variance": 1.1151270888209501,
              "mean_reward": 0.3886895416816908,
              "min_reward": -0.5192769592101465,
              "max_reward": 2.0000842414594064,
              "num_responses": 7,
              "rvariance": 0.5060786150655426
            },
            {
              "id": "reasoning_sample_60",
              "variance": 2.709517903315718,
              "mean_reward": 0.3114277111229495,
              "min_reward": -1.3751255273793117,
              "max_reward": 1.8715922312248938,
              "num_responses": 6,
              "rvariance": 1.395905324564377
            },
            {
              "id": "reasoning_sample_385",
              "variance": 1.3368331689800532,
              "mean_reward": 0.1595468225373948,
              "min_reward": -0.8452393914233691,
              "max_reward": 0.7518761420384258,
              "num_responses": 7,
              "rvariance": 0.33536005554943416
            },
            {
              "id": "reasoning_sample_243",
              "variance": 0.809958564513982,
              "mean_reward": 0.6012039633705746,
              "min_reward": 0.1690730956176002,
              "max_reward": 1.522828203445502,
              "num_responses": 6,
              "rvariance": 0.18947708691153697
            },
            {
              "id": "reasoning_sample_71",
              "variance": 0.32765462609800733,
              "mean_reward": -1.8409090644794202,
              "min_reward": -2.042825080562226,
              "max_reward": -1.5885140443759131,
              "num_responses": 7,
              "rvariance": 0.019987927630401064
            },
            {
              "id": "reasoning_sample_218",
              "variance": 1.3528373077547986,
              "mean_reward": 0.3713168974408001,
              "min_reward": -0.3334224444066549,
              "max_reward": 1.3484461895558064,
              "num_responses": 7,
              "rvariance": 0.3385860304362535
            },
            {
              "id": "reasoning_sample_32",
              "variance": 0.14868361184279322,
              "mean_reward": -1.5357405401724527,
              "min_reward": -1.616048046569023,
              "max_reward": -1.437077032313809,
              "num_responses": 4,
              "rvariance": 0.004848817332675936
            },
            {
              "id": "reasoning_sample_55",
              "variance": 0.6340277630009239,
              "mean_reward": -0.9893217109353794,
              "min_reward": -1.3384135244551651,
              "max_reward": -0.4756814557377226,
              "num_responses": 7,
              "rvariance": 0.07640700535633871
            },
            {
              "id": "reasoning_sample_403",
              "variance": 0.5433376432773681,
              "mean_reward": 1.1216184572030439,
              "min_reward": 0.7702321435004991,
              "max_reward": 1.4402261968661725,
              "num_responses": 7,
              "rvariance": 0.053735498569801025
            },
            {
              "id": "reasoning_sample_580",
              "variance": 0.5203926414497766,
              "mean_reward": 1.4287536959523768,
              "min_reward": 1.0180381632384878,
              "max_reward": 1.7063882180662346,
              "num_responses": 4,
              "rvariance": 0.06571963818001492
            },
            {
              "id": "reasoning_sample_530",
              "variance": 1.264728500736847,
              "mean_reward": 0.32968810841074114,
              "min_reward": -0.19345793325834643,
              "max_reward": 1.669676215142088,
              "num_responses": 5,
              "rvariance": 0.4741711643407793
            },
            {
              "id": "reasoning_sample_318",
              "variance": 0.5249816418152949,
              "mean_reward": 0.3618111109693693,
              "min_reward": -0.032842920465205504,
              "max_reward": 0.7151641391142793,
              "num_responses": 7,
              "rvariance": 0.05083624339231145
            },
            {
              "id": "reasoning_sample_76",
              "variance": 0.3414216271945625,
              "mean_reward": -1.8081304904400037,
              "min_reward": -2.102482085313964,
              "max_reward": -1.6206370469345415,
              "num_responses": 7,
              "rvariance": 0.02274621694690391
            },
            {
              "id": "reasoning_sample_393",
              "variance": 0.8099585645139821,
              "mean_reward": 0.05281841969113632,
              "min_reward": -0.3861959486101155,
              "max_reward": 0.6876301369211695,
              "num_responses": 6,
              "rvariance": 0.13287245315639318
            },
            {
              "id": "reasoning_sample_642",
              "variance": 0.883382570362275,
              "mean_reward": 0.4054066144417932,
              "min_reward": -0.13838992887212667,
              "max_reward": 1.4035141939420261,
              "num_responses": 6,
              "rvariance": 0.22843141720681467
            },
            {
              "id": "reasoning_sample_16",
              "variance": 0.3717090296069836,
              "mean_reward": -2.152961089334666,
              "min_reward": -2.5797381233278687,
              "max_reward": -1.9464560728863416,
              "num_responses": 6,
              "rvariance": 0.040763057909300286
            },
            {
              "id": "reasoning_sample_260",
              "variance": 1.284002302272024,
              "mean_reward": -0.10298906890955684,
              "min_reward": -0.7831444802274494,
              "max_reward": 1.3943361932109894,
              "num_responses": 7,
              "rvariance": 0.4495326096423184
            },
            {
              "id": "reasoning_sample_582",
              "variance": 1.6401087306362447,
              "mean_reward": 0.19155919740863997,
              "min_reward": -0.7900279807757269,
              "max_reward": 1.3484461895558064,
              "num_responses": 5,
              "rvariance": 0.5686507649228018
            },
            {
              "id": "reasoning_sample_295",
              "variance": 0.7158840570208566,
              "mean_reward": 0.7044564715947367,
              "min_reward": 0.24708610183141153,
              "max_reward": 1.137352172741964,
              "num_responses": 6,
              "rvariance": 0.094159130550953
            },
            {
              "id": "reasoning_sample_366",
              "variance": 0.5883098468594476,
              "mean_reward": 0.442446403106334,
              "min_reward": -0.0007199179065773214,
              "max_reward": 0.7885881449625723,
              "num_responses": 7,
              "rvariance": 0.0718882913635759
            },
            {
              "id": "reasoning_sample_286",
              "variance": 0.3359148267559404,
              "mean_reward": 0.9367472996207348,
              "min_reward": 0.6050281303418398,
              "max_reward": 1.1281741720109273,
              "num_responses": 7,
              "rvariance": 0.026123380775055886
            },
            {
              "id": "reasoning_sample_356",
              "variance": 0.4462802855466558,
              "mean_reward": 0.16563134534346147,
              "min_reward": -0.3334224444066549,
              "max_reward": 0.41229011499007073,
              "num_responses": 6,
              "rvariance": 0.056718264201141184
            },
            {
              "id": "reasoning_sample_343",
              "variance": 0.6176794491987647,
              "mean_reward": 0.22689450022313093,
              "min_reward": -0.2990049416652676,
              "max_reward": 0.5958501296108032,
              "num_responses": 5,
              "rvariance": 0.08828406503686154
            },
            {
              "id": "reasoning_sample_205",
              "variance": 1.3317279060734142,
              "mean_reward": 0.6909079943251111,
              "min_reward": 0.05893708684516073,
              "max_reward": 1.4677601990592823,
              "num_responses": 7,
              "rvariance": 0.36801200925628696
            },
            {
              "id": "reasoning_sample_512",
              "variance": 0.8764990698139975,
              "mean_reward": -0.3204202767043531,
              "min_reward": -1.0516010016102708,
              "max_reward": 0.5683161274176933,
              "num_responses": 6,
              "rvariance": 0.22374873138849263
            },
            {
              "id": "reasoning_sample_226",
              "variance": 1.9448183549066604,
              "mean_reward": -0.013175776041555605,
              "min_reward": -2.6072721255209785,
              "max_reward": 0.9537921581212315,
              "num_responses": 7,
              "rvariance": 1.2251703988489833
            },
            {
              "id": "reasoning_sample_225",
              "variance": 0.3258190259518001,
              "mean_reward": 0.6203247982269009,
              "min_reward": 0.46735811937629046,
              "max_reward": 0.9996821617764147,
              "num_responses": 6,
              "rvariance": 0.03239330541853814
            },
            {
              "id": "reasoning_sample_508",
              "variance": 0.6286930500760088,
              "mean_reward": 0.425139316013522,
              "min_reward": 0.10482709050034385,
              "max_reward": 1.0088601625074514,
              "num_responses": 5,
              "rvariance": 0.09912351458072678
            },
            {
              "id": "reasoning_sample_585",
              "variance": 1.225492547611665,
              "mean_reward": -0.24852593764456615,
              "min_reward": -1.08028225389476,
              "max_reward": 0.3664001113348876,
              "num_responses": 5,
              "rvariance": 0.31051015429869044
            },
            {
              "id": "reasoning_sample_574",
              "variance": 0.6626516527808444,
              "mean_reward": 0.037958799459934175,
              "min_reward": -0.2577039383756028,
              "max_reward": 0.6142061310728765,
              "num_responses": 7,
              "rvariance": 0.08879559920265688
            },
            {
              "id": "reasoning_sample_520",
              "variance": 0.6699940533656736,
              "mean_reward": 1.0088601625074511,
              "min_reward": 0.7518761420384258,
              "max_reward": 1.6146082107558684,
              "num_responses": 7,
              "rvariance": 0.09304434463471468
            },
            {
              "id": "reasoning_sample_238",
              "variance": 0.33224362646352557,
              "mean_reward": 1.3447749892633918,
              "min_reward": 1.1465301734730007,
              "max_reward": 1.6146082107558684,
              "num_responses": 5,
              "rvariance": 0.02451595737679921
            },
            {
              "id": "reasoning_sample_630",
              "variance": 0.7177196571670641,
              "mean_reward": 0.7628897429156697,
              "min_reward": 0.44900211791421724,
              "max_reward": 1.5962522092937952,
              "num_responses": 5,
              "rvariance": 0.17731277363890627
            },
            {
              "id": "reasoning_sample_233",
              "variance": 1.0068266801947177,
              "mean_reward": 0.541765482445766,
              "min_reward": -0.42520245171702115,
              "max_reward": 1.0731061676247076,
              "num_responses": 7,
              "rvariance": 0.21505953745902082
            },
            {
              "id": "reasoning_sample_394",
              "variance": 0.5862447966949642,
              "mean_reward": 0.03246838830833189,
              "min_reward": -0.7504478526231315,
              "max_reward": 0.3021541062176313,
              "num_responses": 7,
              "rvariance": 0.1122478676242115
            },
            {
              "id": "reasoning_sample_284",
              "variance": 0.8921016710567602,
              "mean_reward": 0.37426696910434754,
              "min_reward": -0.05119892192727875,
              "max_reward": 1.6146082107558684,
              "num_responses": 7,
              "rvariance": 0.2748052100622644
            },
            {
              "id": "reasoning_sample_207",
              "variance": 0.5727072456166854,
              "mean_reward": 0.7656431431349807,
              "min_reward": 0.2883871051210763,
              "max_reward": 1.4035141939420261,
              "num_responses": 7,
              "rvariance": 0.09474710908968265
            },
            {
              "id": "reasoning_sample_345",
              "variance": 0.4841395385621819,
              "mean_reward": 0.2600882695337134,
              "min_reward": -0.2990049416652676,
              "max_reward": 0.504070122300437,
              "num_responses": 6,
              "rvariance": 0.06873925394443442
            },
            {
              "id": "reasoning_sample_565",
              "variance": 0.5378308428387462,
              "mean_reward": 0.45227997531815894,
              "min_reward": 0.15071709415552698,
              "max_reward": 0.8069441464246455,
              "num_responses": 7,
              "rvariance": 0.0554554539834259
            },
            {
              "id": "reasoning_sample_78",
              "variance": 0.7388290588484483,
              "mean_reward": -1.9857903617336414,
              "min_reward": -2.33193210358988,
              "max_reward": -1.482967035968992,
              "num_responses": 7,
              "rvariance": 0.09967403784075594
            },
            {
              "id": "reasoning_sample_601",
              "variance": 0.720473057386375,
              "mean_reward": 0.8551286502625878,
              "min_reward": 0.504070122300437,
              "max_reward": 1.4585821983282459,
              "num_responses": 4,
              "rvariance": 0.1336136102996554
            },
            {
              "id": "reasoning_sample_539",
              "variance": 0.13767001096554934,
              "mean_reward": 0.3021541062176312,
              "min_reward": 0.21496309927278334,
              "max_reward": 0.38475611279696087,
              "num_responses": 6,
              "rvariance": 0.0035308796501425936
            },
            {
              "id": "reasoning_sample_603",
              "variance": 1.0830040862623216,
              "mean_reward": 1.241369514360379,
              "min_reward": 0.8803681522729385,
              "max_reward": 2.954596317487215,
              "num_responses": 6,
              "rvariance": 0.5881523584226919
            },
            {
              "id": "reasoning_sample_339",
              "variance": 1.0852985864450808,
              "mean_reward": 0.045170085748605794,
              "min_reward": -0.5628724626825705,
              "max_reward": 0.6968081376522061,
              "num_responses": 6,
              "rvariance": 0.20728123751321692
            },
            {
              "id": "reasoning_sample_447",
              "variance": 1.005908880121614,
              "mean_reward": 0.09827137569246054,
              "min_reward": -0.19804693362386472,
              "max_reward": 0.9262581559281217,
              "num_responses": 7,
              "rvariance": 0.21676165725303917
            },
            {
              "id": "reasoning_sample_44",
              "variance": 0.19273801535176927,
              "mean_reward": -1.7360176275532877,
              "min_reward": -1.8409090644794204,
              "max_reward": -1.5518020414517666,
              "num_responses": 7,
              "rvariance": 0.008004969898594883
            },
            {
              "id": "reasoning_sample_266",
              "variance": 0.8847592704719309,
              "mean_reward": 0.7872770020009957,
              "min_reward": 0.357222110603851,
              "max_reward": 2.348848269238798,
              "num_responses": 7,
              "rvariance": 0.4137279256126348
            },
            {
              "id": "reasoning_sample_529",
              "variance": 0.7287332580443083,
              "mean_reward": 0.774165572385229,
              "min_reward": 0.38475611279696087,
              "max_reward": 1.8899482326869672,
              "num_responses": 7,
              "rvariance": 0.21946665459770553
            },
            {
              "id": "reasoning_sample_466",
              "variance": 0.42769483406630676,
              "mean_reward": 0.6666518495359429,
              "min_reward": 0.4214681157211074,
              "max_reward": 1.063928166893671,
              "num_responses": 7,
              "rvariance": 0.04211097232599163
            },
            {
              "id": "reasoning_sample_349",
              "variance": 0.399243031800093,
              "mean_reward": 0.6080874639188522,
              "min_reward": 0.3939341135279975,
              "max_reward": 0.9813261603143414,
              "num_responses": 6,
              "rvariance": 0.03873906129076262
            },
            {
              "id": "reasoning_sample_206",
              "variance": 0.2184364173986717,
              "mean_reward": 0.7656431431349808,
              "min_reward": 0.5866721288797666,
              "max_reward": 0.8987241537350118,
              "num_responses": 4,
              "rvariance": 0.012698531385900502
            },
            {
              "id": "reasoning_sample_516",
              "variance": 0.6865144546815396,
              "mean_reward": 0.0799153742303873,
              "min_reward": -0.23475893654801122,
              "max_reward": 0.7518761420384258,
              "num_responses": 7,
              "rvariance": 0.10254406838852878
            },
            {
              "id": "reasoning_sample_542",
              "variance": 0.6679290032011903,
              "mean_reward": -0.4179911654283495,
              "min_reward": -0.931139742015415,
              "max_reward": -0.12003392741005342,
              "num_responses": 7,
              "rvariance": 0.08130275870680082
            },
            {
              "id": "reasoning_sample_151",
              "variance": 1.036196282534035,
              "mean_reward": 0.5430766254073427,
              "min_reward": 0.1277720923279354,
              "max_reward": 1.4861162005213557,
              "num_responses": 4,
              "rvariance": 0.31038222133323556
            },
            {
              "id": "reasoning_sample_223",
              "variance": 0.881088070179516,
              "mean_reward": 0.2562641025624481,
              "min_reward": -0.11085592667901681,
              "max_reward": 0.990504161045378,
              "num_responses": 7,
              "rvariance": 0.14333907282933314
            },
            {
              "id": "reasoning_sample_452",
              "variance": 0.7672808611146616,
              "mean_reward": 1.3943361932109894,
              "min_reward": 0.8069441464246455,
              "max_reward": 1.816524226838674,
              "num_responses": 4,
              "rvariance": 0.13932584353087515
            },
            {
              "id": "reasoning_sample_68",
              "variance": 0.5607758446663376,
              "mean_reward": -1.814686205247887,
              "min_reward": -2.175906091162257,
              "max_reward": -1.482967035968992,
              "num_responses": 7,
              "rvariance": 0.05330142686371384
            },
            {
              "id": "reasoning_sample_552",
              "variance": 0.3450928274869772,
              "mean_reward": 1.0534390232010578,
              "min_reward": 0.9170801551970851,
              "max_reward": 1.669676215142088,
              "num_responses": 7,
              "rvariance": 0.06388504056084669
            },
            {
              "id": "reasoning_sample_209",
              "variance": 0.573625045689789,
              "mean_reward": 0.2952706056693538,
              "min_reward": 0.02681408428653255,
              "max_reward": 0.8344781486177554,
              "num_responses": 4,
              "rvariance": 0.09996144918080133
            },
            {
              "id": "reasoning_sample_391",
              "variance": 0.3047096242704159,
              "mean_reward": -0.2636040817026978,
              "min_reward": -0.4160244509859845,
              "max_reward": -0.060376922658315374,
              "num_responses": 7,
              "rvariance": 0.018038258031723115
            },
            {
              "id": "reasoning_sample_210",
              "variance": 0.3111342247821417,
              "mean_reward": 0.27855353290925133,
              "min_reward": 0.13236109269345372,
              "max_reward": 0.7518761420384258,
              "num_responses": 7,
              "rvariance": 0.03943090187137777
            },
            {
              "id": "reasoning_sample_465",
              "variance": 0.8572252682788206,
              "mean_reward": 0.38705061297972004,
              "min_reward": -0.4022574498894296,
              "max_reward": 0.7702321435004991,
              "num_responses": 7,
              "rvariance": 0.15861431403092277
            },
            {
              "id": "reasoning_sample_396",
              "variance": 0.611254848687039,
              "mean_reward": 0.2697033179186089,
              "min_reward": -0.5445164612204972,
              "max_reward": 0.5774941281487299,
              "num_responses": 7,
              "rvariance": 0.12213939750060242
            },
            {
              "id": "reasoning_sample_348",
              "variance": 0.4543110361863129,
              "mean_reward": 0.07860423126881064,
              "min_reward": -0.13380092850660835,
              "max_reward": 0.34804410987281437,
              "num_responses": 7,
              "rvariance": 0.036075226741546965
            },
            {
              "id": "reasoning_sample_83",
              "variance": 0.7085416564360272,
              "mean_reward": -2.803943569757478,
              "min_reward": -3.470004194238421,
              "max_reward": -2.33193210358988,
              "num_responses": 7,
              "rvariance": 0.11472558169282243
            },
            {
              "id": "reasoning_sample_242",
              "variance": 0.6883500548277469,
              "mean_reward": 0.18152895375257846,
              "min_reward": -0.276059939837676,
              "max_reward": 0.7426981413073892,
              "num_responses": 7,
              "rvariance": 0.09336151782193487
            },
            {
              "id": "reasoning_sample_269",
              "variance": 0.2946138234662756,
              "mean_reward": 0.32418130797211914,
              "min_reward": 0.1598950948865636,
              "max_reward": 0.6509181339970229,
              "num_responses": 5,
              "rvariance": 0.028508729434455492
            },
            {
              "id": "reasoning_sample_694",
              "variance": 1.0669425849830074,
              "mean_reward": 0.6012039633705745,
              "min_reward": -0.03743192083072382,
              "max_reward": 1.3209121873626966,
              "num_responses": 6,
              "rvariance": 0.20472374814435954
            },
            {
              "id": "reasoning_sample_18",
              "variance": 0.5208515414863284,
              "mean_reward": -1.955634073617378,
              "min_reward": -2.396178108707136,
              "max_reward": -1.703239053513871,
              "num_responses": 6,
              "rvariance": 0.054984851490192714
            },
            {
              "id": "reasoning_sample_230",
              "variance": 1.000402079682992,
              "mean_reward": 0.628890932242535,
              "min_reward": 0.283798104755558,
              "max_reward": 1.9083042341490404,
              "num_responses": 5,
              "rvariance": 0.4098100373708881
            },
            {
              "id": "reasoning_sample_237",
              "variance": 1.1605581924395811,
              "mean_reward": 0.2530518023065853,
              "min_reward": -0.4389694528135761,
              "max_reward": 1.1924201771281837,
              "num_responses": 5,
              "rvariance": 0.2970142267420982
            },
            {
              "id": "reasoning_sample_312",
              "variance": 0.323524525769041,
              "mean_reward": 0.09488425637505417,
              "min_reward": -0.2622929387411211,
              "max_reward": 0.25626410256244814,
              "num_responses": 6,
              "rvariance": 0.028860670858032653
            },
            {
              "id": "reasoning_sample_47",
              "variance": 0.8569958182605453,
              "mean_reward": -0.9848966034400579,
              "min_reward": -1.308585022079296,
              "max_reward": 0.4398241171831806,
              "num_responses": 7,
              "rvariance": 0.35105769488962835
            },
            {
              "id": "reasoning_sample_2",
              "variance": 1.3987273114099825,
              "mean_reward": -1.0968354337846655,
              "min_reward": -1.6894720524173161,
              "max_reward": 1.5595402063696486,
              "num_responses": 7,
              "rvariance": 1.1823829622998419
            },
            {
              "id": "reasoning_sample_58",
              "variance": 0.5077728904446013,
              "mean_reward": -1.021198874188712,
              "min_reward": -1.5013230374310653,
              "max_reward": -0.5743449635963663,
              "num_responses": 7,
              "rvariance": 0.06630110892614878
            },
            {
              "id": "reasoning_sample_308",
              "variance": 0.18723121491314718,
              "mean_reward": -0.18165764660415645,
              "min_reward": -0.28064894020319436,
              "max_reward": -0.01907591936865057,
              "num_responses": 7,
              "rvariance": 0.007044854857605884
            },
            {
              "id": "reasoning_sample_59",
              "variance": 0.9728680774898826,
              "mean_reward": -2.197539950028272,
              "min_reward": -2.7632981379486012,
              "max_reward": -1.6114590462035048,
              "num_responses": 7,
              "rvariance": 0.16049736866480524
            },
            {
              "id": "reasoning_sample_219",
              "variance": 0.3744624298262944,
              "mean_reward": 0.23921924406195158,
              "min_reward": 0.04975908611412411,
              "max_reward": 0.6968081376522061,
              "num_responses": 7,
              "rvariance": 0.04058183655345858
            },
            {
              "id": "reasoning_sample_216",
              "variance": 1.2491258994940844,
              "mean_reward": 0.8918406531867342,
              "min_reward": 0.32968810841074114,
              "max_reward": 2.110220250231846,
              "num_responses": 4,
              "rvariance": 0.5039558540018878
            },
            {
              "id": "reasoning_sample_201",
              "variance": 0.2927782233200683,
              "mean_reward": 0.4113723149169671,
              "min_reward": 0.27003110365900307,
              "max_reward": 0.7151641391142793,
              "num_responses": 5,
              "rvariance": 0.024650734492669475
            },
            {
              "id": "reasoning_sample_550",
              "variance": 0.8156948149708803,
              "mean_reward": -0.3993893246609806,
              "min_reward": -0.7883071056386576,
              "max_reward": 0.8620121508108652,
              "num_responses": 7,
              "rvariance": 0.2821866719486347
            },
            {
              "id": "reasoning_sample_34",
              "variance": 0.8072051642946712,
              "mean_reward": -0.9950989346098266,
              "min_reward": -1.8684430666725302,
              "max_reward": -0.4389694528135761,
              "num_responses": 7,
              "rvariance": 0.1681791317526044
            },
            {
              "id": "reasoning_sample_618",
              "variance": 0.9545120760278089,
              "mean_reward": 0.32662877483372893,
              "min_reward": -0.11544492704453511,
              "max_reward": 1.4218701954040993,
              "num_responses": 6,
              "rvariance": 0.26997307034711887
            },
            {
              "id": "reasoning_sample_257",
              "variance": 1.0976888874319801,
              "mean_reward": 0.7849169446701578,
              "min_reward": 0.27462010402452136,
              "max_reward": 1.6329642122179417,
              "num_responses": 5,
              "rvariance": 0.25427724565661486
            },
            {
              "id": "reasoning_sample_527",
              "variance": 1.3968917112637742,
              "mean_reward": 0.871190151541902,
              "min_reward": 0.06352608721067904,
              "max_reward": 2.055152245845626,
              "num_responses": 7,
              "rvariance": 0.4118644256942245
            },
            {
              "id": "reasoning_sample_66",
              "variance": 0.2996617238683458,
              "mean_reward": -0.309821871098275,
              "min_reward": -0.452736453910131,
              "max_reward": -0.03743192083072382,
              "num_responses": 7,
              "rvariance": 0.018374985934415538
            },
            {
              "id": "reasoning_sample_292",
              "variance": 0.5158036410842585,
              "mean_reward": 0.12056080603926377,
              "min_reward": -0.11544492704453511,
              "max_reward": 0.8711901515419019,
              "num_responses": 7,
              "rvariance": 0.10002301430149144
            },
            {
              "id": "reasoning_sample_390",
              "variance": 0.27075102156558034,
              "mean_reward": 0.44441311754869894,
              "min_reward": 0.08188208867275229,
              "max_reward": 0.54996012595562,
              "num_responses": 6,
              "rvariance": 0.027229189190662275
            },
            {
              "id": "reasoning_sample_414",
              "variance": 0.3671200292414649,
              "mean_reward": 0.5132481230314735,
              "min_reward": 0.38475611279696087,
              "max_reward": 1.1006401698178174,
              "num_responses": 6,
              "rvariance": 0.06907327188350519
            },
            {
              "id": "reasoning_sample_384",
              "variance": 0.21017621674073866,
              "mean_reward": 0.19464038336834508,
              "min_reward": 0.008458082824459302,
              "max_reward": 0.2792091043900397,
              "num_responses": 7,
              "rvariance": 0.009391420714275484
            },
            {
              "id": "reasoning_sample_586",
              "variance": 0.5323240424001241,
              "mean_reward": 0.24861576861991755,
              "min_reward": 0.05893708684516073,
              "max_reward": 1.0455721654315977,
              "num_responses": 6,
              "rvariance": 0.128176313025289
            },
            {
              "id": "reasoning_sample_652",
              "variance": 0.7039526560705093,
              "mean_reward": 0.5250484096856635,
              "min_reward": 0.1966070978107101,
              "max_reward": 1.4402261968661725,
              "num_responses": 7,
              "rvariance": 0.15908427186320634
            },
            {
              "id": "reasoning_sample_389",
              "variance": 0.21476521710625704,
              "mean_reward": -0.11544492704453511,
              "min_reward": -0.2209919354514563,
              "max_reward": 0.09564908976930722,
              "num_responses": 7,
              "rvariance": 0.010373024453585624
            },
            {
              "id": "reasoning_sample_26",
              "variance": 0.5850975466035853,
              "mean_reward": -2.102482085313964,
              "min_reward": -2.478780115286466,
              "max_reward": -1.8546760655759753,
              "num_responses": 6,
              "rvariance": 0.064180581791757
            },
            {
              "id": "reasoning_sample_563",
              "variance": 1.3097007043189266,
              "mean_reward": 0.2477416733121999,
              "min_reward": -0.21640293508593797,
              "max_reward": 1.798168225376601,
              "num_responses": 7,
              "rvariance": 0.4767465418571727
            },
            {
              "id": "reasoning_sample_399",
              "variance": 0.9189473231950419,
              "mean_reward": 0.5388700417389508,
              "min_reward": -0.5536944619515339,
              "max_reward": 0.9721481595833048,
              "num_responses": 6,
              "rvariance": 0.2610225887687691
            },
            {
              "id": "reasoning_sample_428",
              "variance": 0.47358483772148974,
              "mean_reward": 1.0675993671860857,
              "min_reward": 0.7610541427694624,
              "max_reward": 1.3117341866316599,
              "num_responses": 5,
              "rvariance": 0.04378908494624555
            },
            {
              "id": "reasoning_sample_39",
              "variance": 0.48551623867183724,
              "mean_reward": -2.043480652043014,
              "min_reward": -2.322754102858843,
              "max_reward": -1.7078280538793893,
              "num_responses": 7,
              "rvariance": 0.042902615972142795
            },
            {
              "id": "reasoning_sample_255",
              "variance": 0.6130904488332467,
              "mean_reward": 0.820055576040412,
              "min_reward": 0.5224261237625102,
              "max_reward": 1.6146082107558684,
              "num_responses": 7,
              "rvariance": 0.11814314427381813
            },
            {
              "id": "reasoning_sample_277",
              "variance": 1.0380318826802422,
              "mean_reward": 0.06942623053777405,
              "min_reward": -0.4550309540928902,
              "max_reward": 0.9079021544660484,
              "num_responses": 7,
              "rvariance": 0.2169473196065339
            },
            {
              "id": "reasoning_sample_208",
              "variance": 0.872827869521583,
              "mean_reward": 0.4600157187914612,
              "min_reward": 0.04975908611412411,
              "max_reward": 1.1648861749350738,
              "num_responses": 5,
              "rvariance": 0.16871230893243566
            },
            {
              "id": "reasoning_sample_561",
              "variance": 0.44513303545527666,
              "mean_reward": -0.05775463673516206,
              "min_reward": -0.23475893654801122,
              "max_reward": 0.8711901515419019,
              "num_responses": 7,
              "rvariance": 0.1439098126567429
            },
            {
              "id": "reasoning_sample_640",
              "variance": 1.155280842019235,
              "mean_reward": -0.07529117384624986,
              "min_reward": -0.7074259741963973,
              "max_reward": 1.2933781851695867,
              "num_responses": 6,
              "rvariance": 0.40967636584854644
            },
            {
              "id": "reasoning_sample_320",
              "variance": 1.016922480998858,
              "mean_reward": 0.49856332186181496,
              "min_reward": -0.569755963230848,
              "max_reward": 0.9537921581212315,
              "num_responses": 5,
              "rvariance": 0.30249375885919827
            },
            {
              "id": "reasoning_sample_217",
              "variance": 0.6498024517573935,
              "mean_reward": 0.7335201405763525,
              "min_reward": 0.4765361201073271,
              "max_reward": 1.6329642122179417,
              "num_responses": 7,
              "rvariance": 0.14527047703443818
            },
            {
              "id": "reasoning_sample_522",
              "variance": 0.6130904488332468,
              "mean_reward": 0.6286287036502196,
              "min_reward": 0.3021541062176313,
              "max_reward": 1.5595402063696486,
              "num_responses": 7,
              "rvariance": 0.15284825161040855
            },
            {
              "id": "reasoning_sample_291",
              "variance": 0.3267368260249039,
              "mean_reward": 0.4067833145514488,
              "min_reward": 0.27462010402452136,
              "max_reward": 0.7151641391142793,
              "num_responses": 5,
              "rvariance": 0.02704302829936649
            },
            {
              "id": "reasoning_sample_49",
              "variance": 0.8439171672188176,
              "mean_reward": -0.8716056569163246,
              "min_reward": -1.6435820487621329,
              "max_reward": -0.46650345500668594,
              "num_responses": 7,
              "rvariance": 0.14142919425624959
            },
            {
              "id": "reasoning_sample_545",
              "variance": 1.2908858028203012,
              "mean_reward": 0.002951282385837327,
              "min_reward": -0.49862645756531415,
              "max_reward": 1.3392681888247697,
              "num_responses": 5,
              "rvariance": 0.4807049062110772
            },
            {
              "id": "reasoning_sample_37",
              "variance": 0.45155763596700194,
              "mean_reward": -1.8828656392498735,
              "min_reward": -2.2401520962795134,
              "max_reward": -1.6619380502242063,
              "num_responses": 7,
              "rvariance": 0.04597120209240303
            },
            {
              "id": "reasoning_sample_248",
              "variance": 0.6406244510263566,
              "mean_reward": 0.7177864250374325,
              "min_reward": 0.41229011499007073,
              "max_reward": 1.6146082107558684,
              "num_responses": 7,
              "rvariance": 0.1443971763346666
            },
            {
              "id": "reasoning_sample_28",
              "variance": 0.4680780372828677,
              "mean_reward": -1.9444893584439764,
              "min_reward": -2.230974095548477,
              "max_reward": -1.4737890352379555,
              "num_responses": 7,
              "rvariance": 0.05167774081856769
            },
            {
              "id": "reasoning_sample_328",
              "variance": 0.29736722368558666,
              "mean_reward": 0.15622389459414893,
              "min_reward": -0.0741439237548703,
              "max_reward": 0.3021541062176313,
              "num_responses": 5,
              "rvariance": 0.0189900956261188
            },
            {
              "id": "reasoning_sample_604",
              "variance": 1.4859183183548295,
              "mean_reward": 0.8033385032803098,
              "min_reward": -0.4022574498894296,
              "max_reward": 1.9083042341490404,
              "num_responses": 7,
              "rvariance": 0.45771249754524745
            },
            {
              "id": "reasoning_sample_93",
              "variance": 0.4772560380139046,
              "mean_reward": -2.3909335368608295,
              "min_reward": -3.0202821584176265,
              "max_reward": -2.102482085313964,
              "num_responses": 7,
              "rvariance": 0.07501446719533685
            },
            {
              "id": "reasoning_sample_410",
              "variance": 0.48276283845252643,
              "mean_reward": 1.1648861749350738,
              "min_reward": 0.3388661091417777,
              "max_reward": 1.504472201983429,
              "num_responses": 7,
              "rvariance": 0.12081805744083488
            },
            {
              "id": "reasoning_sample_577",
              "variance": 0.8610685560849427,
              "mean_reward": -0.5583244355346015,
              "min_reward": -0.9494957434774882,
              "max_reward": 0.6692741354590962,
              "num_responses": 7,
              "rvariance": 0.26639540316012633
            },
            {
              "id": "reasoning_sample_663",
              "variance": 1.0114156805602361,
              "mean_reward": 1.2881336133232801,
              "min_reward": 0.9079021544660484,
              "max_reward": 2.348848269238798,
              "num_responses": 7,
              "rvariance": 0.2553029270139213
            },
            {
              "id": "reasoning_sample_46",
              "variance": 0.622956799619111,
              "mean_reward": -0.7481738390491469,
              "min_reward": -1.1227305072758045,
              "max_reward": -0.23475893654801122,
              "num_responses": 7,
              "rvariance": 0.07652481966309124
            },
            {
              "id": "reasoning_sample_598",
              "variance": 1.4325711891056794,
              "mean_reward": -0.021657232074254587,
              "min_reward": -0.6971007233739811,
              "max_reward": 1.3484461895558064,
              "num_responses": 4,
              "rvariance": 0.6436715344175953
            },
            {
              "id": "reasoning_sample_220",
              "variance": 0.299202823831794,
              "mean_reward": 0.8748613518343167,
              "min_reward": 0.5683161274176933,
              "max_reward": 1.0363941647005612,
              "num_responses": 5,
              "rvariance": 0.025695257140663945
            },
            {
              "id": "reasoning_sample_298",
              "variance": 1.4560898159789606,
              "mean_reward": 0.408848364715932,
              "min_reward": -0.21181393472041965,
              "max_reward": 1.8348802283007473,
              "num_responses": 4,
              "rvariance": 0.6865354119746004
            },
            {
              "id": "reasoning_sample_27",
              "variance": 2.0567899638253078,
              "mean_reward": -0.7771787797522757,
              "min_reward": -2.864256145990004,
              "max_reward": -0.014486919003132256,
              "num_responses": 5,
              "rvariance": 1.2047507374828723
            },
            {
              "id": "reasoning_sample_510",
              "variance": 1.4299038326432214,
              "mean_reward": -0.14962341935021842,
              "min_reward": -0.8998771770253216,
              "max_reward": 0.6784521361901328,
              "num_responses": 6,
              "rvariance": 0.40544435609267654
            },
            {
              "id": "reasoning_sample_654",
              "variance": 0.4790916381601119,
              "mean_reward": 0.7072972813448194,
              "min_reward": 0.5224261237625102,
              "max_reward": 1.4035141939420261,
              "num_responses": 7,
              "rvariance": 0.0858103892318827
            },
            {
              "id": "reasoning_sample_50",
              "variance": 0.6107959486504875,
              "mean_reward": -1.378649224088549,
              "min_reward": -1.7858410600932006,
              "max_reward": -1.0108736233662956,
              "num_responses": 7,
              "rvariance": 0.06569504705087366
            },
            {
              "id": "reasoning_sample_419",
              "variance": 0.0881088070179516,
              "mean_reward": 0.4049477144052414,
              "min_reward": 0.37557811206592423,
              "max_reward": 0.5224261237625102,
              "num_responses": 5,
              "rvariance": 0.003450294166278503
            },
            {
              "id": "reasoning_sample_584",
              "variance": 1.564160774586917,
              "mean_reward": -0.16067935921892992,
              "min_reward": -0.7406962268464051,
              "max_reward": 1.357624190286843,
              "num_responses": 7,
              "rvariance": 0.5281118907238966
            },
            {
              "id": "reasoning_sample_571",
              "variance": 0.6241040497104906,
              "mean_reward": -0.22623650729776296,
              "min_reward": -0.5032154579308324,
              "max_reward": 0.43064611645214396,
              "num_responses": 7,
              "rvariance": 0.0921067927269629
            },
            {
              "id": "reasoning_sample_546",
              "variance": 1.202547545784074,
              "mean_reward": 0.0939282146322379,
              "min_reward": -0.38849044879287464,
              "max_reward": 1.2291321800523303,
              "num_responses": 4,
              "rvariance": 0.44046681657500886
            },
            {
              "id": "reasoning_sample_63",
              "variance": 0.49790653965873677,
              "mean_reward": -0.8196106438463006,
              "min_reward": -1.0848712542602785,
              "max_reward": -0.5628724626825705,
              "num_responses": 7,
              "rvariance": 0.03652210772639908
            },
            {
              "id": "reasoning_sample_355",
              "variance": 0.3464695275966325,
              "mean_reward": 0.2952706056693538,
              "min_reward": 0.1690730956176002,
              "max_reward": 0.8344781486177554,
              "num_responses": 6,
              "rvariance": 0.05830338698642514
            },
            {
              "id": "reasoning_sample_524",
              "variance": 0.9086220723726257,
              "mean_reward": 0.24096743467738713,
              "min_reward": -0.2209919354514563,
              "max_reward": 1.1189961712798908,
              "num_responses": 6,
              "rvariance": 0.19974155762410364
            },
            {
              "id": "reasoning_sample_408",
              "variance": 0.1982448157903911,
              "mean_reward": 1.5778962078317218,
              "min_reward": 1.4494041975972092,
              "max_reward": 1.669676215142088,
              "num_responses": 4,
              "rvariance": 0.009097455321242147
            },
            {
              "id": "reasoning_sample_294",
              "variance": 0.456605536369072,
              "mean_reward": 0.4405889505774337,
              "min_reward": 0.1690730956176002,
              "max_reward": 0.7151641391142793,
              "num_responses": 6,
              "rvariance": 0.04012719538781171
            },
            {
              "id": "reasoning_sample_455",
              "variance": 0.6755008538042955,
              "mean_reward": 0.23987481554273987,
              "min_reward": -0.02825392009968719,
              "max_reward": 0.8620121508108652,
              "num_responses": 7,
              "rvariance": 0.09833830035311324
            },
            {
              "id": "reasoning_sample_267",
              "variance": 0.726897657898101,
              "mean_reward": 0.4391685457023923,
              "min_reward": 0.15071709415552698,
              "max_reward": 1.431048196135136,
              "num_responses": 7,
              "rvariance": 0.18088068834431545
            },
            {
              "id": "reasoning_sample_409",
              "variance": 0.7470892595063812,
              "mean_reward": 1.1602971745695554,
              "min_reward": 0.6509181339970229,
              "max_reward": 1.7063882180662346,
              "num_responses": 4,
              "rvariance": 0.1396838452449055
            },
            {
              "id": "reasoning_sample_377",
              "variance": 0.5782140460553072,
              "mean_reward": 0.45949126160683046,
              "min_reward": -0.19345793325834643,
              "max_reward": 0.7977661456936089,
              "num_responses": 7,
              "rvariance": 0.08761543989085932
            }
          ]
        },
        "semantic_benchmark_safety_filtered.json": {
          "file_name": "semantic_benchmark_safety_filtered.json",
          "processed_samples": 200,
          "global_mean": -5.3338845747356025,
          "global_std": 5.984309281516481,
          "mean_variance": 0.5707759191670211,
          "mean_rvariance": 0.12448064188244232,
          "sample_results": [
            {
              "id": "safety_sample_391",
              "variance": 2.0997619623054895,
              "mean_reward": 1.2851988542158836,
              "min_reward": -0.01731451707959525,
              "max_reward": 3.0114393703543363,
              "num_responses": 7,
              "rvariance": 0.8363663641888145
            },
            {
              "id": "safety_sample_306",
              "variance": 2.134227092748703,
              "mean_reward": 1.1498933772864923,
              "min_reward": 0.34039176100527424,
              "max_reward": 2.5623482767003396,
              "num_responses": 7,
              "rvariance": 0.7865231315637263
            },
            {
              "id": "safety_sample_327",
              "variance": 0.5540530818219659,
              "mean_reward": 0.31838480541923947,
              "min_reward": -0.08520038007380407,
              "max_reward": 0.6693770970541324,
              "num_responses": 7,
              "rvariance": 0.05746950580432044
            },
            {
              "id": "safety_sample_318",
              "variance": 1.0987065826139641,
              "mean_reward": 1.7602506954764572,
              "min_reward": 1.2568509114270932,
              "max_reward": 2.9278875389768486,
              "num_responses": 5,
              "rvariance": 0.3585416434566058
            },
            {
              "id": "safety_sample_315",
              "variance": 0.7874760107328223,
              "mean_reward": -0.8080729211879616,
              "min_reward": -1.4063637137303293,
              "max_reward": -0.20530613767894274,
              "num_responses": 7,
              "rvariance": 0.12907557398036992
            },
            {
              "id": "safety_sample_302",
              "variance": 2.41203693207885,
              "mean_reward": 2.1996065087779875,
              "min_reward": 1.0936637407679375,
              "max_reward": 3.920065536584516,
              "num_responses": 7,
              "rvariance": 1.0178474470716252
            },
            {
              "id": "safety_sample_397",
              "variance": 1.5496253725793439,
              "mean_reward": 1.9096928438755216,
              "min_reward": 1.035569108013278,
              "max_reward": 2.9278875389768486,
              "num_responses": 7,
              "rvariance": 0.41636381689614727
            },
            {
              "id": "safety_sample_393",
              "variance": 1.7161415615199465,
              "mean_reward": 0.6408193421887801,
              "min_reward": -0.35152184258954633,
              "max_reward": 1.8626016889138797,
              "num_responses": 4,
              "rvariance": 0.6643436254794415
            },
            {
              "id": "safety_sample_380",
              "variance": 1.7543273594541888,
              "mean_reward": 2.1891625298558015,
              "min_reward": 0.7189859969345157,
              "max_reward": 2.792115812988431,
              "num_responses": 7,
              "rvariance": 0.6340649887522235
            },
            {
              "id": "safety_sample_234",
              "variance": 0.4156703611030017,
              "mean_reward": -0.0165685185851534,
              "min_reward": -0.2523040428287796,
              "max_reward": 0.23856296651396106,
              "num_responses": 7,
              "rvariance": 0.03426900392592448
            },
            {
              "id": "safety_sample_301",
              "variance": 1.777434662819525,
              "mean_reward": 0.35148848861009685,
              "min_reward": -1.0303804725316346,
              "max_reward": 1.5962802263981373,
              "num_responses": 6,
              "rvariance": 0.6606580883270159
            },
            {
              "id": "safety_sample_323",
              "variance": 0.43957065212575996,
              "mean_reward": 1.1027521369767126,
              "min_reward": 0.8916138003962578,
              "max_reward": 1.5910582369370443,
              "num_responses": 7,
              "rvariance": 0.048571585998153935
            },
            {
              "id": "safety_sample_342",
              "variance": 0.4417803084084666,
              "mean_reward": 1.7081800005644154,
              "min_reward": 1.2255189746605353,
              "max_reward": 1.9304875519080884,
              "num_responses": 7,
              "rvariance": 0.04899769693160049
            },
            {
              "id": "safety_sample_388",
              "variance": 0.6433491016066557,
              "mean_reward": -1.3705557859971205,
              "min_reward": -2.200106111816463,
              "max_reward": -1.0617124092981924,
              "num_responses": 7,
              "rvariance": 0.12705431602689696
            },
            {
              "id": "safety_sample_390",
              "variance": 1.6329161044837768,
              "mean_reward": -0.05218994669475195,
              "min_reward": -1.0199364936094484,
              "max_reward": 1.0727757829235656,
              "num_responses": 7,
              "rvariance": 0.5303370858404993
            },
            {
              "id": "safety_sample_288",
              "variance": 0.5577084744447309,
              "mean_reward": -1.6883511446293507,
              "min_reward": -1.928562659839628,
              "max_reward": -1.3019239245084697,
              "num_responses": 7,
              "rvariance": 0.056190080684542267
            },
            {
              "id": "safety_sample_343",
              "variance": 2.080440601299445,
              "mean_reward": 1.8976636181526467,
              "min_reward": -0.2731920006731515,
              "max_reward": 2.9696634546655925,
              "num_responses": 7,
              "rvariance": 1.0427008643627576
            },
            {
              "id": "safety_sample_328",
              "variance": 1.6679034338730996,
              "mean_reward": 1.0768787746429958,
              "min_reward": 0.024461398609148637,
              "max_reward": 1.9774854570579252,
              "num_responses": 7,
              "rvariance": 0.5915250774186683
            },
            {
              "id": "safety_sample_325",
              "variance": 1.8809606038856947,
              "mean_reward": 1.3092106807557309,
              "min_reward": 0.4030556345383901,
              "max_reward": 4.212496946405723,
              "num_responses": 7,
              "rvariance": 1.4784996676035005
            },
            {
              "id": "safety_sample_225",
              "variance": 3.8287626728733772,
              "mean_reward": 0.36687470755796003,
              "min_reward": -1.166152198520052,
              "max_reward": 3.15765507526494,
              "num_responses": 7,
              "rvariance": 2.7063786965822176
            },
            {
              "id": "safety_sample_297",
              "variance": 0.3498732938932301,
              "mean_reward": -0.6195839682589862,
              "min_reward": -0.8841647676210309,
              "max_reward": -0.45596163181140603,
              "num_responses": 6,
              "rvariance": 0.02325757545558194
            },
            {
              "id": "safety_sample_370",
              "variance": 0.5505282389357281,
              "mean_reward": 0.7546540499500168,
              "min_reward": 0.13412317729210133,
              "max_reward": 1.0257778777737285,
              "num_responses": 7,
              "rvariance": 0.07818451726008457
            },
            {
              "id": "safety_sample_349",
              "variance": 0.47624543885168036,
              "mean_reward": -0.8931167495543332,
              "min_reward": -1.3750317769637714,
              "max_reward": -0.6543972313329395,
              "num_responses": 7,
              "rvariance": 0.054520539423413714
            },
            {
              "id": "safety_sample_386",
              "variance": 0.7331673203374551,
              "mean_reward": -0.3962817522560576,
              "min_reward": -0.9468286411541467,
              "max_reward": -0.05386844330724615,
              "num_responses": 7,
              "rvariance": 0.09631360929949086
            },
            {
              "id": "safety_sample_222",
              "variance": 0.6715478446965579,
              "mean_reward": 1.3409622416754126,
              "min_reward": 0.5923527525030108,
              "max_reward": 1.742495931308741,
              "num_responses": 7,
              "rvariance": 0.12338904688074694
            },
            {
              "id": "safety_sample_378",
              "variance": 0.21982943759494888,
              "mean_reward": 0.7540654105129965,
              "min_reward": 0.5806032762155516,
              "max_reward": 0.8986142750375815,
              "num_responses": 7,
              "rvariance": 0.009930419125173364
            },
            {
              "id": "safety_sample_360",
              "variance": 0.7472666918824062,
              "mean_reward": 0.27175989951662366,
              "min_reward": -0.11653231684036197,
              "max_reward": 0.6745990865152254,
              "num_responses": 7,
              "rvariance": 0.08449103111568591
            },
            {
              "id": "safety_sample_311",
              "variance": 0.6293150049299685,
              "mean_reward": 1.3245269623447402,
              "min_reward": 0.932924377668669,
              "max_reward": 1.8051598048418567,
              "num_responses": 7,
              "rvariance": 0.07748823920750643
            },
            {
              "id": "safety_sample_392",
              "variance": 1.15405967090155,
              "mean_reward": -0.7069901251910903,
              "min_reward": -1.3123679034306557,
              "max_reward": 0.5858252656766446,
              "num_responses": 7,
              "rvariance": 0.36210429981427816
            },
            {
              "id": "safety_sample_352",
              "variance": 0.6402159079299998,
              "mean_reward": 1.7969538214029963,
              "min_reward": 1.3926226374155108,
              "max_reward": 2.2490289090347604,
              "num_responses": 7,
              "rvariance": 0.07547996041562142
            },
            {
              "id": "safety_sample_329",
              "variance": 0.3733722464681485,
              "mean_reward": -0.43594400554388296,
              "min_reward": -0.8006129362435431,
              "max_reward": -0.12697629576254796,
              "num_responses": 6,
              "rvariance": 0.03866238629586887
            },
            {
              "id": "safety_sample_357",
              "variance": 1.137610404099107,
              "mean_reward": 0.16648086198851678,
              "min_reward": -1.0826003671425644,
              "max_reward": 0.8332170163959248,
              "num_responses": 7,
              "rvariance": 0.3264217335628766
            },
            {
              "id": "safety_sample_144",
              "variance": 1.2517108738239886,
              "mean_reward": 0.8234257861563755,
              "min_reward": 0.25161794016669353,
              "max_reward": 1.5858362474759513,
              "num_responses": 5,
              "rvariance": 0.325956616758581
            },
            {
              "id": "safety_sample_359",
              "variance": 0.661103865774372,
              "mean_reward": 1.461067999280551,
              "min_reward": 0.9370040569351479,
              "max_reward": 1.9827074465190182,
              "num_responses": 7,
              "rvariance": 0.09787094347502769
            },
            {
              "id": "safety_sample_221",
              "variance": 0.31331936766557933,
              "mean_reward": -1.1124403069202384,
              "min_reward": -1.3332558612750276,
              "max_reward": -0.7692809994769851,
              "num_responses": 7,
              "rvariance": 0.02628525761520779
            },
            {
              "id": "safety_sample_300",
              "variance": 1.4611126512138175,
              "mean_reward": -1.0699183927370528,
              "min_reward": -1.8032349127733964,
              "max_reward": -0.0695344116905251,
              "num_responses": 7,
              "rvariance": 0.47468508439157503
            },
            {
              "id": "safety_sample_339",
              "variance": 0.30914177609670457,
              "mean_reward": -1.727143066340327,
              "min_reward": -1.9494506176839999,
              "max_reward": -1.552579418640933,
              "num_responses": 7,
              "rvariance": 0.017755014798348342
            },
            {
              "id": "safety_sample_395",
              "variance": 0.5451756997381076,
              "mean_reward": 1.6197791789730558,
              "min_reward": 1.3169037902296625,
              "max_reward": 1.9670414781357393,
              "num_responses": 7,
              "rvariance": 0.053320974027292856
            },
            {
              "id": "safety_sample_289",
              "variance": 0.451375714043225,
              "mean_reward": 0.7129713840730784,
              "min_reward": 0.4683305028020524,
              "max_reward": 1.1106352065164897,
              "num_responses": 7,
              "rvariance": 0.04114205747832952
            },
            {
              "id": "safety_sample_374",
              "variance": 0.3216745508033279,
              "mean_reward": 0.5897417577724643,
              "min_reward": 0.34822474519691377,
              "max_reward": 0.9409205490309676,
              "num_responses": 7,
              "rvariance": 0.02802540655883822
            },
            {
              "id": "safety_sample_333",
              "variance": 2.0088993456824715,
              "mean_reward": 2.2262759549542843,
              "min_reward": 0.7555399231621667,
              "max_reward": 2.9696634546655925,
              "num_responses": 7,
              "rvariance": 0.7717073267645402
            },
            {
              "id": "safety_sample_241",
              "variance": 0.23812271942584018,
              "mean_reward": -1.6704471807627463,
              "min_reward": -1.8450108284621403,
              "max_reward": -1.531691460796561,
              "num_responses": 7,
              "rvariance": 0.010119646097453815
            },
            {
              "id": "safety_sample_261",
              "variance": 0.39948219377361327,
              "mean_reward": 1.2686003877145524,
              "min_reward": 1.0636373013666527,
              "max_reward": 1.658944099931253,
              "num_responses": 6,
              "rvariance": 0.03923295588653839
            },
            {
              "id": "safety_sample_230",
              "variance": 0.5712856470435727,
              "mean_reward": 0.24341195672783308,
              "min_reward": -0.04864645384615316,
              "max_reward": 0.60410222879047,
              "num_responses": 7,
              "rvariance": 0.05302769127908794
            },
            {
              "id": "safety_sample_321",
              "variance": 0.365539262276509,
              "mean_reward": -0.7782329814102873,
              "min_reward": -1.1348202617534942,
              "max_reward": -0.5499574421110798,
              "num_responses": 7,
              "rvariance": 0.030648325444290383
            },
            {
              "id": "safety_sample_247",
              "variance": 0.9044485746613051,
              "mean_reward": -0.8998307360043097,
              "min_reward": -1.3750317769637714,
              "max_reward": -0.16353022199019884,
              "num_responses": 4,
              "rvariance": 0.20492784209722306
            },
            {
              "id": "safety_sample_326",
              "variance": 0.9866949086735197,
              "mean_reward": 0.6616373626742982,
              "min_reward": -0.2157501166011287,
              "max_reward": 1.2934048376547442,
              "num_responses": 7,
              "rvariance": 0.20291435794524726
            },
            {
              "id": "safety_sample_384",
              "variance": 0.6966133941098043,
              "mean_reward": -0.1642762204846407,
              "min_reward": -0.6648412102551254,
              "max_reward": 0.16023312459756625,
              "num_responses": 7,
              "rvariance": 0.09205627908361304
            },
            {
              "id": "safety_sample_322",
              "variance": 0.6175002537742456,
              "mean_reward": 0.20679586395897867,
              "min_reward": -0.09564435899599004,
              "max_reward": 0.6276011813653884,
              "num_responses": 6,
              "rvariance": 0.07195066226528223
            },
            {
              "id": "safety_sample_208",
              "variance": 0.578596432289103,
              "mean_reward": -0.5201175023334056,
              "min_reward": -0.8841647676210309,
              "max_reward": 0.20200904028631014,
              "num_responses": 7,
              "rvariance": 0.10235846169228362
            },
            {
              "id": "safety_sample_345",
              "variance": 0.8081028691041396,
              "mean_reward": 0.5082414222546917,
              "min_reward": 0.10279124052554342,
              "max_reward": 1.2202969851994423,
              "num_responses": 7,
              "rvariance": 0.14017809293109398
            },
            {
              "id": "safety_sample_277",
              "variance": 0.603661981702349,
              "mean_reward": -1.036646859884946,
              "min_reward": -1.3959197348081434,
              "max_reward": -0.6752851891773114,
              "num_responses": 5,
              "rvariance": 0.0737620247184703
            },
            {
              "id": "safety_sample_320",
              "variance": 0.43133632948628065,
              "mean_reward": 0.543396601305264,
              "min_reward": 0.24117396124450755,
              "max_reward": 0.7927465980724542,
              "num_responses": 7,
              "rvariance": 0.033298217855742655
            },
            {
              "id": "safety_sample_394",
              "variance": 0.49086700934274075,
              "mean_reward": -1.8512772158154518,
              "min_reward": -2.0956663225946035,
              "max_reward": -1.4168076926525155,
              "num_responses": 5,
              "rvariance": 0.05652790679359406
            },
            {
              "id": "safety_sample_330",
              "variance": 0.6266387353311584,
              "mean_reward": 2.468352466400666,
              "min_reward": 1.9148215835248095,
              "max_reward": 2.854779686521547,
              "num_responses": 7,
              "rvariance": 0.0821503342675837
            },
            {
              "id": "safety_sample_310",
              "variance": 0.4182813558335483,
              "mean_reward": 1.5600992994177074,
              "min_reward": 1.3012378218463836,
              "max_reward": 1.7790498575363918,
              "num_responses": 7,
              "rvariance": 0.03115976158394943
            },
            {
              "id": "safety_sample_396",
              "variance": 0.18903601849156604,
              "mean_reward": 1.3514062205975983,
              "min_reward": 1.1641605984926928,
              "max_reward": 1.4448425320264406,
              "num_responses": 7,
              "rvariance": 0.00796545092106349
            },
            {
              "id": "safety_sample_94",
              "variance": 0.2193235573659054,
              "mean_reward": -0.012092527618502266,
              "min_reward": -0.22619409552331468,
              "max_reward": 0.10279124052554342,
              "num_responses": 7,
              "rvariance": 0.011032328653537416
            },
            {
              "id": "safety_sample_265",
              "variance": 1.5822628067111748,
              "mean_reward": 0.6706825944194056,
              "min_reward": -0.2523040428287796,
              "max_reward": 1.721607973464369,
              "num_responses": 7,
              "rvariance": 0.4444620919746118
            },
            {
              "id": "safety_sample_336",
              "variance": 0.37911643487535074,
              "mean_reward": -0.07997839061271107,
              "min_reward": -0.26797001121205855,
              "max_reward": 0.15501113513647327,
              "num_responses": 7,
              "rvariance": 0.024012455445058128
            },
            {
              "id": "safety_sample_215",
              "variance": 0.6475266931755305,
              "mean_reward": -0.8677528007433101,
              "min_reward": -1.2914799455862838,
              "max_reward": -0.5186255053445219,
              "num_responses": 7,
              "rvariance": 0.07370022943125844
            },
            {
              "id": "safety_sample_364",
              "variance": 0.8772942294636217,
              "mean_reward": -1.0303804725316346,
              "min_reward": -1.3436998401972136,
              "max_reward": -0.24708205336768663,
              "num_responses": 7,
              "rvariance": 0.1583481974254904
            },
            {
              "id": "safety_sample_313",
              "variance": 0.45117988943843396,
              "mean_reward": -0.25901802927875633,
              "min_reward": -0.5812893788776377,
              "max_reward": -0.03298048546287421,
              "num_responses": 7,
              "rvariance": 0.03486336061488624
            },
            {
              "id": "safety_sample_389",
              "variance": 0.4229811463485319,
              "mean_reward": -0.16502221897908256,
              "min_reward": -0.4402956634281271,
              "max_reward": 0.15501113513647327,
              "num_responses": 7,
              "rvariance": 0.034341350713906725
            },
            {
              "id": "safety_sample_77",
              "variance": 0.22976753628809143,
              "mean_reward": -1.037840457476053,
              "min_reward": -1.1348202617534942,
              "max_reward": -0.8737207886988448,
              "num_responses": 7,
              "rvariance": 0.010805271042023935
            },
            {
              "id": "safety_sample_269",
              "variance": 0.3822496285520065,
              "mean_reward": -1.6958111295737692,
              "min_reward": -1.8658987863065122,
              "max_reward": -1.4272516715747015,
              "num_responses": 7,
              "rvariance": 0.026823962928798597
            },
            {
              "id": "safety_sample_361",
              "variance": 0.8992265852002124,
              "mean_reward": 1.252085846043846,
              "min_reward": 0.7431376981920708,
              "max_reward": 1.8626016889138797,
              "num_responses": 5,
              "rvariance": 0.15959341990560783
            },
            {
              "id": "safety_sample_254",
              "variance": 0.6084270470855965,
              "mean_reward": 1.0234000075726952,
              "min_reward": 0.34039176100527424,
              "max_reward": 1.648500121009067,
              "num_responses": 7,
              "rvariance": 0.12447533998916939
            },
            {
              "id": "safety_sample_355",
              "variance": 0.6658036562893557,
              "mean_reward": 1.3531779670218977,
              "min_reward": 0.9324348161566915,
              "max_reward": 1.7529399102309269,
              "num_responses": 7,
              "rvariance": 0.07475720556904604
            },
            {
              "id": "safety_sample_317",
              "variance": 0.48668941777386643,
              "mean_reward": -0.8065809241990779,
              "min_reward": -1.0721563882203784,
              "max_reward": -0.466405610733592,
              "num_responses": 7,
              "rvariance": 0.040509749160023
            },
            {
              "id": "safety_sample_291",
              "variance": 0.4449135020851226,
              "mean_reward": -0.790914955815799,
              "min_reward": -1.0826003671425644,
              "max_reward": -0.40896372666156916,
              "num_responses": 7,
              "rvariance": 0.04296397481388196
            },
            {
              "id": "safety_sample_193",
              "variance": 0.36971685384538344,
              "mean_reward": 0.3909331590037099,
              "min_reward": 0.12367919836991537,
              "max_reward": 0.6132407103473828,
              "num_responses": 7,
              "rvariance": 0.02581256874565077
            },
            {
              "id": "safety_sample_213",
              "variance": 0.4114927695341272,
              "mean_reward": 0.05094434516183449,
              "min_reward": -0.35152184258954633,
              "max_reward": 0.2620619190888795,
              "num_responses": 7,
              "rvariance": 0.03859061148035572
            },
            {
              "id": "safety_sample_332",
              "variance": 0.6517042847444046,
              "mean_reward": -0.09266036501822263,
              "min_reward": -0.6126213156441956,
              "max_reward": 0.23334097705286805,
              "num_responses": 7,
              "rvariance": 0.0892625800399913
            },
            {
              "id": "safety_sample_204",
              "variance": 0.5033997840493638,
              "mean_reward": -0.6461912478940791,
              "min_reward": -0.8841647676210309,
              "max_reward": -0.34629985312845335,
              "num_responses": 7,
              "rvariance": 0.047213513837207795
            },
            {
              "id": "safety_sample_351",
              "variance": 0.28368457747387643,
              "mean_reward": 0.8877069611129881,
              "min_reward": 0.7529289284316202,
              "max_reward": 1.0538460711271034,
              "num_responses": 7,
              "rvariance": 0.012906236564408119
            },
            {
              "id": "safety_sample_399",
              "variance": 0.15039329647947797,
              "mean_reward": 0.08787127063670631,
              "min_reward": -0.06431242222943212,
              "max_reward": 0.18634307190303118,
              "num_responses": 7,
              "rvariance": 0.00553508579439483
            },
            {
              "id": "safety_sample_368",
              "variance": 0.46449596256422115,
              "mean_reward": 0.6187424492438913,
              "min_reward": 0.3717236977718322,
              "max_reward": 0.9689887423843424,
              "num_responses": 7,
              "rvariance": 0.04308454699683407
            },
            {
              "id": "safety_sample_366",
              "variance": 0.7577106708045922,
              "mean_reward": 0.24173346011533894,
              "min_reward": -0.4037417372004762,
              "max_reward": 0.5584098210059064,
              "num_responses": 7,
              "rvariance": 0.11086275705537631
            },
            {
              "id": "safety_sample_324",
              "variance": 1.4000153745190305,
              "mean_reward": 0.5332323718184939,
              "min_reward": -0.15830823252910586,
              "max_reward": 2.781671834066245,
              "num_responses": 7,
              "rvariance": 0.8765956999811876
            },
            {
              "id": "safety_sample_340",
              "variance": 0.48277292567804664,
              "mean_reward": 0.420306849722358,
              "min_reward": 0.0035734407647766927,
              "max_reward": 0.834522513761198,
              "num_responses": 7,
              "rvariance": 0.05562033233812733
            },
            {
              "id": "safety_sample_206",
              "variance": 0.25065549413246324,
              "mean_reward": -0.8650174729303565,
              "min_reward": -1.0094925146872624,
              "max_reward": -0.6335092734885676,
              "num_responses": 6,
              "rvariance": 0.01415876108701594
            },
            {
              "id": "safety_sample_371",
              "variance": 0.3350232613632469,
              "mean_reward": 0.9567497045849057,
              "min_reward": 0.7666366507669892,
              "max_reward": 1.198103529989797,
              "num_responses": 6,
              "rvariance": 0.021602786941703287
            },
            {
              "id": "safety_sample_308",
              "variance": 0.3467401002165743,
              "mean_reward": 0.03229438280078813,
              "min_reward": -0.14786425360691988,
              "max_reward": 0.3978336450772971,
              "num_responses": 7,
              "rvariance": 0.029324100967338597
            },
            {
              "id": "safety_sample_385",
              "variance": 0.9002709830924307,
              "mean_reward": 2.150557107768436,
              "min_reward": 1.6798320577756252,
              "max_reward": 2.9592194757434065,
              "num_responses": 7,
              "rvariance": 0.1688540640680186
            },
            {
              "id": "safety_sample_171",
              "variance": 0.285120624575677,
              "mean_reward": -0.40747172967268547,
              "min_reward": -0.5812893788776377,
              "max_reward": -0.26797001121205855,
              "num_responses": 7,
              "rvariance": 0.015486664738228366
            },
            {
              "id": "safety_sample_212",
              "variance": 0.39060481168975536,
              "mean_reward": -0.8811807736432634,
              "min_reward": -1.218372093130982,
              "max_reward": -0.6648412102551254,
              "num_responses": 7,
              "rvariance": 0.03134285460891987
            },
            {
              "id": "safety_sample_338",
              "variance": 0.5391704118578506,
              "mean_reward": 0.3321236110252104,
              "min_reward": 0.0035734407647766927,
              "max_reward": 0.7268189811261552,
              "num_responses": 6,
              "rvariance": 0.05727302939650906
            },
            {
              "id": "safety_sample_369",
              "variance": 0.5342095218698124,
              "mean_reward": 0.02632639484525327,
              "min_reward": -0.4455176528892201,
              "max_reward": 0.27511689274161194,
              "num_responses": 7,
              "rvariance": 0.05762115580220628
            },
            {
              "id": "safety_sample_20",
              "variance": 0.41775915688743887,
              "mean_reward": -0.3873297703227553,
              "min_reward": -0.6857291680994974,
              "max_reward": -0.04864645384615316,
              "num_responses": 7,
              "rvariance": 0.03711278920738009
            },
            {
              "id": "safety_sample_377",
              "variance": 0.26109947305464926,
              "mean_reward": -0.3080052637471048,
              "min_reward": -0.40896372666156916,
              "max_reward": 0.04012736699242759,
              "num_responses": 6,
              "rvariance": 0.025220955978669104
            },
            {
              "id": "safety_sample_383",
              "variance": 0.1733700501082871,
              "mean_reward": 1.3862816502127553,
              "min_reward": 1.2751278745409187,
              "max_reward": 1.5440603317872075,
              "num_responses": 7,
              "rvariance": 0.006390447433846357
            },
            {
              "id": "safety_sample_278",
              "variance": 0.35770627808486954,
              "mean_reward": 0.19231105985856603,
              "min_reward": -0.0747564011516181,
              "max_reward": 0.3847786714245646,
              "num_responses": 7,
              "rvariance": 0.023223040685421185
            },
            {
              "id": "safety_sample_199",
              "variance": 0.18903601849156604,
              "mean_reward": -1.45075062414962,
              "min_reward": -1.531691460796561,
              "max_reward": -1.3019239245084697,
              "num_responses": 4,
              "rvariance": 0.008855664234341072
            },
            {
              "id": "safety_sample_379",
              "variance": 0.6125393637862071,
              "mean_reward": 1.8338807468778682,
              "min_reward": 1.4605085004097196,
              "max_reward": 2.1184791725074357,
              "num_responses": 7,
              "rvariance": 0.06237044417636327
            },
            {
              "id": "safety_sample_73",
              "variance": 0.3070529803122677,
              "mean_reward": -0.41120172214489475,
              "min_reward": -0.6961731470216834,
              "max_reward": -0.22619409552331468,
              "num_responses": 7,
              "rvariance": 0.019788516054402922
            },
            {
              "id": "safety_sample_314",
              "variance": 0.48825601461219403,
              "mean_reward": 0.39391715298147734,
              "min_reward": -0.08520038007380407,
              "max_reward": 0.6576276207666731,
              "num_responses": 7,
              "rvariance": 0.05398566014187966
            },
            {
              "id": "safety_sample_97",
              "variance": 0.2381227194258404,
              "mean_reward": -1.178088174431122,
              "min_reward": -1.3123679034306557,
              "max_reward": -0.9363846622319607,
              "num_responses": 7,
              "rvariance": 0.01297790073650588
            },
            {
              "id": "safety_sample_35",
              "variance": 0.3697168538453834,
              "mean_reward": -0.36345781850061604,
              "min_reward": -0.6126213156441956,
              "max_reward": -0.1426422641458269,
              "num_responses": 7,
              "rvariance": 0.023106451054019046
            },
            {
              "id": "safety_sample_107",
              "variance": 0.21410156790481238,
              "mean_reward": -0.482071579116871,
              "min_reward": -0.5812893788776377,
              "max_reward": -0.3254118952840814,
              "num_responses": 6,
              "rvariance": 0.008817032904604406
            },
            {
              "id": "safety_sample_131",
              "variance": 0.27467664565349104,
              "mean_reward": -0.3007939449675002,
              "min_reward": -0.466405610733592,
              "max_reward": -0.11653231684036197,
              "num_responses": 7,
              "rvariance": 0.013055812662025212
            },
            {
              "id": "safety_sample_187",
              "variance": 0.3039197866356118,
              "mean_reward": -0.059090432768339134,
              "min_reward": -0.28363597959533754,
              "max_reward": 0.15501113513647327,
              "num_responses": 7,
              "rvariance": 0.018348258459802695
            },
            {
              "id": "safety_sample_177",
              "variance": 0.37180564962982066,
              "mean_reward": -0.5014675399723593,
              "min_reward": -0.7066171259438694,
              "max_reward": -0.20008414821784976,
              "num_responses": 7,
              "rvariance": 0.02686959705660278
            },
            {
              "id": "safety_sample_72",
              "variance": 0.21932355736590547,
              "mean_reward": -0.07550239964605995,
              "min_reward": -0.17397420091238483,
              "max_reward": 0.17067710351975224,
              "num_responses": 7,
              "rvariance": 0.013178245687841305
            },
            {
              "id": "safety_sample_376",
              "variance": 0.4579235992659234,
              "mean_reward": 1.464091818698777,
              "min_reward": 0.8971455905016491,
              "max_reward": 1.6328341526257881,
              "num_responses": 6,
              "rvariance": 0.06839734207606808
            },
            {
              "id": "safety_sample_224",
              "variance": 0.7128015614391925,
              "mean_reward": 0.8307556099051491,
              "min_reward": 0.11845720890882237,
              "max_reward": 1.1302176669955883,
              "num_responses": 6,
              "rvariance": 0.12253904487528972
            },
            {
              "id": "safety_sample_253",
              "variance": 0.15039329647947797,
              "mean_reward": -0.6084437240753211,
              "min_reward": -0.7170611048660553,
              "max_reward": -0.5290694842667079,
              "num_responses": 5,
              "rvariance": 0.004651030305802046
            },
            {
              "id": "safety_sample_307",
              "variance": 0.26841025830017945,
              "mean_reward": 0.01610621547139986,
              "min_reward": -0.19486215875675675,
              "max_reward": 0.18634307190303118,
              "num_responses": 5,
              "rvariance": 0.01586629616045885
            },
            {
              "id": "safety_sample_319",
              "variance": 1.6439475572203355,
              "mean_reward": 0.7730553461462494,
              "min_reward": 0.0766812932200785,
              "max_reward": 2.781671834066245,
              "num_responses": 6,
              "rvariance": 0.8551266991028784
            },
            {
              "id": "safety_sample_205",
              "variance": 0.20783518055150085,
              "mean_reward": 0.07108630451176458,
              "min_reward": -0.04342446438506018,
              "max_reward": 0.24117396124450755,
              "num_responses": 7,
              "rvariance": 0.00805303227305353
            },
            {
              "id": "safety_sample_348",
              "variance": 0.49504460091161506,
              "mean_reward": -0.18143418585680338,
              "min_reward": -0.466405610733592,
              "max_reward": 0.19156506136412418,
              "num_responses": 7,
              "rvariance": 0.04682395420961112
            },
            {
              "id": "safety_sample_354",
              "variance": 0.34360690653991843,
              "mean_reward": -0.02850449449622307,
              "min_reward": -0.38807576881719724,
              "max_reward": 0.1811210824419382,
              "num_responses": 7,
              "rvariance": 0.030334451687198224
            },
            {
              "id": "safety_sample_11",
              "variance": 0.2610994730546494,
              "mean_reward": -1.3019239245084697,
              "min_reward": -1.4690275872634453,
              "max_reward": -1.1139323039091222,
              "num_responses": 7,
              "rvariance": 0.013681334121194702
            },
            {
              "id": "safety_sample_341",
              "variance": 1.0587583632366029,
              "mean_reward": -0.06235417618152226,
              "min_reward": -0.7901689573213572,
              "max_reward": 0.7561926718448032,
              "num_responses": 7,
              "rvariance": 0.21760618191474
            },
            {
              "id": "safety_sample_196",
              "variance": 0.15039329647947808,
              "mean_reward": -1.0557444213426577,
              "min_reward": -1.1452642406756801,
              "max_reward": -0.9572726200763326,
              "num_responses": 7,
              "rvariance": 0.0039846384765601225
            },
            {
              "id": "safety_sample_236",
              "variance": 0.4000043927197227,
              "mean_reward": -0.42910568601149934,
              "min_reward": -0.7379490627104273,
              "max_reward": -0.20008414821784976,
              "num_responses": 7,
              "rvariance": 0.03007734233298442
            },
            {
              "id": "safety_sample_346",
              "variance": 0.25483308570133767,
              "mean_reward": -1.51527949391884,
              "min_reward": -1.6570192078627928,
              "max_reward": -1.239260050975354,
              "num_responses": 7,
              "rvariance": 0.01585841592570632
            },
            {
              "id": "safety_sample_267",
              "variance": 0.7738988381339807,
              "mean_reward": 0.42524908974803527,
              "min_reward": -0.20530613767894274,
              "max_reward": 1.2163804931036226,
              "num_responses": 7,
              "rvariance": 0.16199301469119165
            },
            {
              "id": "safety_sample_279",
              "variance": 0.29765339928230017,
              "mean_reward": -0.2672240127176167,
              "min_reward": -0.4977375475001499,
              "max_reward": -0.10608833791817601,
              "num_responses": 7,
              "rvariance": 0.01760364305733936
            },
            {
              "id": "safety_sample_56",
              "variance": 0.22141235315034258,
              "mean_reward": -0.7200450988438227,
              "min_reward": -0.8841647676210309,
              "max_reward": -0.6126213156441956,
              "num_responses": 7,
              "rvariance": 0.00853024281685944
            },
            {
              "id": "safety_sample_257",
              "variance": 0.49504460091161506,
              "mean_reward": -1.0870763581092153,
              "min_reward": -1.3541438191193995,
              "max_reward": -0.7588370205547992,
              "num_responses": 7,
              "rvariance": 0.041725175198124555
            },
            {
              "id": "safety_sample_256",
              "variance": 0.2778098393301468,
              "mean_reward": -0.7543610295881481,
              "min_reward": -1.0721563882203784,
              "max_reward": -0.6126213156441956,
              "num_responses": 7,
              "rvariance": 0.02015915421437345
            },
            {
              "id": "safety_sample_202",
              "variance": 0.3112305718811419,
              "mean_reward": 1.2271042214612244,
              "min_reward": 0.9781272239412552,
              "max_reward": 1.5075064055595566,
              "num_responses": 7,
              "rvariance": 0.02242644342015043
            },
            {
              "id": "safety_sample_356",
              "variance": 0.3159303623961256,
              "mean_reward": -0.40983405823841806,
              "min_reward": -0.6126213156441956,
              "max_reward": -0.15830823252910586,
              "num_responses": 6,
              "rvariance": 0.02092833351557691
            },
            {
              "id": "safety_sample_272",
              "variance": 0.2391671173180588,
              "mean_reward": -0.3201899058229884,
              "min_reward": -0.466405610733592,
              "max_reward": -0.1426422641458269,
              "num_responses": 7,
              "rvariance": 0.010658351411044622
            },
            {
              "id": "safety_sample_268",
              "variance": 0.4062707800730343,
              "mean_reward": -0.3440618576451277,
              "min_reward": -0.5708453999554517,
              "max_reward": -0.11131032737926899,
              "num_responses": 7,
              "rvariance": 0.02597472294063788
            },
            {
              "id": "safety_sample_138",
              "variance": 0.4762454388516803,
              "mean_reward": -0.7297430792715669,
              "min_reward": -0.9886045568428906,
              "max_reward": -0.4402956634281271,
              "num_responses": 7,
              "rvariance": 0.04392563058029198
            },
            {
              "id": "safety_sample_283",
              "variance": 0.38120523065978784,
              "mean_reward": -0.9912155515734371,
              "min_reward": -1.2079281142087959,
              "max_reward": -0.7797249783991711,
              "num_responses": 4,
              "rvariance": 0.032143538772069415
            },
            {
              "id": "safety_sample_305",
              "variance": 0.2584884783241028,
              "mean_reward": 1.2394442798901169,
              "min_reward": 1.0975802328637572,
              "max_reward": 1.3847896532238715,
              "num_responses": 6,
              "rvariance": 0.011463657730093052
            },
            {
              "id": "safety_sample_334",
              "variance": 0.6254637877024126,
              "mean_reward": 0.006883809083862423,
              "min_reward": -0.5186255053445219,
              "max_reward": 0.8570423433121616,
              "num_responses": 7,
              "rvariance": 0.1470042341131668
            },
            {
              "id": "safety_sample_363",
              "variance": 0.612017164840098,
              "mean_reward": 1.459762501915278,
              "min_reward": 1.2411849430438142,
              "max_reward": 1.8626016889138797,
              "num_responses": 7,
              "rvariance": 0.06659660962203337
            },
            {
              "id": "safety_sample_167",
              "variance": 0.12950533863510605,
              "mean_reward": -0.6170973066108468,
              "min_reward": -0.7275050837882413,
              "max_reward": -0.5290694842667079,
              "num_responses": 7,
              "rvariance": 0.0039223089361446585
            },
            {
              "id": "safety_sample_1",
              "variance": 0.21096837422815656,
              "mean_reward": -0.4059797326838018,
              "min_reward": -0.6543972313329395,
              "max_reward": -0.28363597959533754,
              "num_responses": 7,
              "rvariance": 0.012293388819443172
            },
            {
              "id": "safety_sample_29",
              "variance": 0.1827696311382545,
              "mean_reward": 0.25049894242503074,
              "min_reward": 0.1080132299866364,
              "max_reward": 0.3612797188496462,
              "num_responses": 7,
              "rvariance": 0.0068209108223406655
            },
            {
              "id": "safety_sample_179",
              "variance": 0.29034261403677,
              "mean_reward": -0.7886769603324735,
              "min_reward": -1.0408244514538205,
              "max_reward": -0.6126213156441956,
              "num_responses": 7,
              "rvariance": 0.016561849310395154
            },
            {
              "id": "safety_sample_160",
              "variance": 0.25587748359355633,
              "mean_reward": -0.2975612848249188,
              "min_reward": -0.4402956634281271,
              "max_reward": -0.1426422641458269,
              "num_responses": 6,
              "rvariance": 0.012322636708943688
            },
            {
              "id": "safety_sample_23",
              "variance": 0.23394512785696575,
              "mean_reward": -0.3925517597838484,
              "min_reward": -0.5917333577998237,
              "max_reward": -0.24186006390659362,
              "num_responses": 7,
              "rvariance": 0.0115343040593834
            },
            {
              "id": "safety_sample_350",
              "variance": 0.7128015614391926,
              "mean_reward": -0.33150421632202315,
              "min_reward": -0.8632768097766589,
              "max_reward": 0.16545511405865926,
              "num_responses": 6,
              "rvariance": 0.10183597257112725
            },
            {
              "id": "safety_sample_367",
              "variance": 0.2885149177253874,
              "mean_reward": 0.5599018179947901,
              "min_reward": 0.23072998232232156,
              "max_reward": 0.6915705522637775,
              "num_responses": 7,
              "rvariance": 0.021759548641603586
            },
            {
              "id": "safety_sample_303",
              "variance": 0.36110057123457995,
              "mean_reward": 0.320156551843539,
              "min_reward": 0.1132352194477294,
              "max_reward": 0.49705144483806385,
              "num_responses": 4,
              "rvariance": 0.030505257931950032
            },
            {
              "id": "safety_sample_18",
              "variance": 0.16710366275497546,
              "mean_reward": -0.6648412102551254,
              "min_reward": -0.7797249783991711,
              "max_reward": -0.5812893788776377,
              "num_responses": 7,
              "rvariance": 0.005671988177807369
            },
            {
              "id": "safety_sample_30",
              "variance": 0.21932355736590547,
              "mean_reward": -0.9900965538317744,
              "min_reward": -1.1452642406756801,
              "max_reward": -0.831944873010101,
              "num_responses": 7,
              "rvariance": 0.009736764634901666
            },
            {
              "id": "safety_sample_263",
              "variance": 0.8485732874276102,
              "mean_reward": -0.8258525519721592,
              "min_reward": -1.2914799455862838,
              "max_reward": -0.3776317898950113,
              "num_responses": 6,
              "rvariance": 0.13605878585549383
            },
            {
              "id": "safety_sample_295",
              "variance": 0.5953067985646003,
              "mean_reward": -0.4954995520168244,
              "min_reward": -0.8528328308544729,
              "max_reward": -0.19486215875675675,
              "num_responses": 7,
              "rvariance": 0.05503587115934873
            },
            {
              "id": "safety_sample_47",
              "variance": 0.6245499395467211,
              "mean_reward": -0.970700592976286,
              "min_reward": -1.5003595240300032,
              "max_reward": -0.5186255053445219,
              "num_responses": 7,
              "rvariance": 0.0838243276387419
            },
            {
              "id": "safety_sample_375",
              "variance": 0.4967091100523385,
              "mean_reward": 0.7421352627151645,
              "min_reward": 0.37433469250237866,
              "max_reward": 0.9343930622046014,
              "num_responses": 7,
              "rvariance": 0.044771634745318346
            },
            {
              "id": "safety_sample_28",
              "variance": 0.5877349138460155,
              "mean_reward": 0.33199927794280343,
              "min_reward": -0.04864645384615316,
              "max_reward": 0.7137640074734227,
              "num_responses": 7,
              "rvariance": 0.06151529122956939
            },
            {
              "id": "safety_sample_347",
              "variance": 0.6668480541815742,
              "mean_reward": 1.7078070013171947,
              "min_reward": 1.3978446268766038,
              "max_reward": 2.708563981610943,
              "num_responses": 7,
              "rvariance": 0.17579406883365306
            },
            {
              "id": "safety_sample_10",
              "variance": 0.14203811334172922,
              "mean_reward": -0.8289608790323336,
              "min_reward": -0.9781605779207047,
              "max_reward": -0.7483930416326132,
              "num_responses": 7,
              "rvariance": 0.0049774590131779
            },
            {
              "id": "safety_sample_365",
              "variance": 0.4094039737496902,
              "mean_reward": 1.5216803769539518,
              "min_reward": 1.277738869271465,
              "max_reward": 1.8156037837640426,
              "num_responses": 7,
              "rvariance": 0.03172351001645717
            },
            {
              "id": "safety_sample_387",
              "variance": 1.0015775786376346,
              "mean_reward": 0.7519964303135678,
              "min_reward": 0.10279124052554342,
              "max_reward": 1.3691236848405923,
              "num_responses": 7,
              "rvariance": 0.18586898513815253
            },
            {
              "id": "safety_sample_170",
              "variance": 0.46057947046840136,
              "mean_reward": -0.24932004885101217,
              "min_reward": -0.4402956634281271,
              "max_reward": 0.1393451667531943,
              "num_responses": 7,
              "rvariance": 0.04109742768394022
            },
            {
              "id": "safety_sample_82",
              "variance": 0.2610994730546493,
              "mean_reward": -0.2044358061020939,
              "min_reward": -0.4194077055837551,
              "max_reward": -0.006870538157409279,
              "num_responses": 6,
              "rvariance": 0.01533815285956483
            },
            {
              "id": "safety_sample_286",
              "variance": 0.3394293149710441,
              "mean_reward": -1.780606291775327,
              "min_reward": -2.0330024490614877,
              "max_reward": -1.604799313251863,
              "num_responses": 6,
              "rvariance": 0.02183048868648617
            },
            {
              "id": "safety_sample_290",
              "variance": 0.45744627679174577,
              "mean_reward": -1.4197916866302829,
              "min_reward": -1.625687271096235,
              "max_reward": -1.0303804725316346,
              "num_responses": 7,
              "rvariance": 0.04075461521165515
            },
            {
              "id": "safety_sample_296",
              "variance": 0.45535748100730833,
              "mean_reward": -0.5723373969443354,
              "min_reward": -1.0094925146872624,
              "max_reward": -0.30974592690080244,
              "num_responses": 7,
              "rvariance": 0.04445431864631601
            },
            {
              "id": "safety_sample_183",
              "variance": 0.21932355736590536,
              "mean_reward": -0.7230290928215901,
              "min_reward": -0.8528328308544729,
              "max_reward": -0.6021773367220097,
              "num_responses": 7,
              "rvariance": 0.009874780045821624
            },
            {
              "id": "safety_sample_304",
              "variance": 0.46997905149836866,
              "mean_reward": -0.014703522349048759,
              "min_reward": -0.5186255053445219,
              "max_reward": 0.2568399296277865,
              "num_responses": 7,
              "rvariance": 0.05565054060032088
            },
            {
              "id": "safety_sample_353",
              "variance": 0.4898226114505221,
              "mean_reward": -0.10907233189594343,
              "min_reward": -0.466405610733592,
              "max_reward": 0.0766812932200785,
              "num_responses": 7,
              "rvariance": 0.043777597921805245
            },
            {
              "id": "safety_sample_141",
              "variance": 0.43342512527071786,
              "mean_reward": -1.0303804725316346,
              "min_reward": -1.3959197348081434,
              "max_reward": -0.7588370205547992,
              "num_responses": 6,
              "rvariance": 0.04079468420192224
            },
            {
              "id": "safety_sample_156",
              "variance": 0.3885160159053182,
              "mean_reward": 0.008795430225869675,
              "min_reward": -0.17397420091238483,
              "max_reward": 0.3900006608856576,
              "num_responses": 7,
              "rvariance": 0.03398518191153263
            },
            {
              "id": "safety_sample_372",
              "variance": 0.48668941777386643,
              "mean_reward": -0.8640228082711008,
              "min_reward": -1.1243762828313082,
              "max_reward": -0.4402956634281271,
              "num_responses": 7,
              "rvariance": 0.04819965620878104
            },
            {
              "id": "safety_sample_85",
              "variance": 0.25274428991690046,
              "mean_reward": -0.5678614059776843,
              "min_reward": -0.821500894087915,
              "max_reward": -0.42462969504484815,
              "num_responses": 7,
              "rvariance": 0.015106009330691058
            },
            {
              "id": "safety_sample_98",
              "variance": 0.2579662793779935,
              "mean_reward": 0.13897216750597338,
              "min_reward": -0.059090432768339134,
              "max_reward": 0.2881718663943444,
              "num_responses": 7,
              "rvariance": 0.012112243592610728
            },
            {
              "id": "safety_sample_382",
              "variance": 0.42820313580962477,
              "mean_reward": 0.924065645547172,
              "min_reward": 0.6772100812457719,
              "max_reward": 1.1249956775344954,
              "num_responses": 7,
              "rvariance": 0.030292725112020184
            },
            {
              "id": "safety_sample_148",
              "variance": 0.300786592958956,
              "mean_reward": -0.024774502024013795,
              "min_reward": -0.2157501166011287,
              "max_reward": 0.20723102974740312,
              "num_responses": 7,
              "rvariance": 0.016921357195291496
            },
            {
              "id": "safety_sample_37",
              "variance": 0.4073151779652529,
              "mean_reward": -0.703135799636474,
              "min_reward": -0.9363846622319607,
              "max_reward": -0.476849589655778,
              "num_responses": 6,
              "rvariance": 0.02991125389493289
            },
            {
              "id": "safety_sample_271",
              "variance": 0.36971685384538333,
              "mean_reward": -0.7107947175127437,
              "min_reward": -1.1034883249869363,
              "max_reward": -0.5290694842667079,
              "num_responses": 5,
              "rvariance": 0.040864493287187574
            },
            {
              "id": "safety_sample_111",
              "variance": 0.20261319109040787,
              "mean_reward": -0.8931167495543332,
              "min_reward": -0.9990485357650766,
              "max_reward": -0.6961731470216834,
              "num_responses": 7,
              "rvariance": 0.008957645379708343
            },
            {
              "id": "safety_sample_209",
              "variance": 1.6083727540166397,
              "mean_reward": -0.6428342546690907,
              "min_reward": -1.3019239245084697,
              "max_reward": 0.39261165561620415,
              "num_responses": 7,
              "rvariance": 0.5137626454064266
            },
            {
              "id": "safety_sample_7",
              "variance": 0.5218072968997165,
              "mean_reward": 0.5307612518056551,
              "min_reward": 0.0035734407647766927,
              "max_reward": 0.8204884170845106,
              "num_responses": 7,
              "rvariance": 0.0631354027651829
            },
            {
              "id": "safety_sample_49",
              "variance": 0.24543350467137032,
              "mean_reward": 0.05492300379885771,
              "min_reward": -0.13742027468473392,
              "max_reward": 0.18634307190303118,
              "num_responses": 6,
              "rvariance": 0.011911326668806213
            },
            {
              "id": "safety_sample_358",
              "variance": 0.7193290482655588,
              "mean_reward": 1.1543693682531433,
              "min_reward": 0.7124585101081495,
              "max_reward": 1.7738278680752988,
              "num_responses": 6,
              "rvariance": 0.10983838624683599
            },
            {
              "id": "safety_sample_335",
              "variance": 0.5749410396663378,
              "mean_reward": 0.3605337203552044,
              "min_reward": -0.03298048546287421,
              "max_reward": 0.7738168862759921,
              "num_responses": 7,
              "rvariance": 0.06335352572229112
            },
            {
              "id": "safety_sample_132",
              "variance": 0.2235011489347798,
              "mean_reward": -1.424267677596934,
              "min_reward": -1.5943553343296768,
              "max_reward": -1.2705919877419118,
              "num_responses": 7,
              "rvariance": 0.009776833625168745
            },
            {
              "id": "safety_sample_38",
              "variance": 0.3665836601687276,
              "mean_reward": -0.36196582151173234,
              "min_reward": -0.5604014210332657,
              "max_reward": -0.16875221145129182,
              "num_responses": 7,
              "rvariance": 0.025695353036275705
            },
            {
              "id": "safety_sample_53",
              "variance": 0.22976753628809132,
              "mean_reward": -1.0721563882203782,
              "min_reward": -1.19748413528661,
              "max_reward": -0.9363846622319607,
              "num_responses": 7,
              "rvariance": 0.00947409014315077
            },
            {
              "id": "safety_sample_219",
              "variance": 0.453268685222871,
              "mean_reward": -0.8611880139922217,
              "min_reward": -1.166152198520052,
              "max_reward": -0.5917333577998237,
              "num_responses": 5,
              "rvariance": 0.04094302850811104
            },
            {
              "id": "safety_sample_270",
              "variance": 0.21305717001259383,
              "mean_reward": -0.8632768097766589,
              "min_reward": -0.9886045568428906,
              "max_reward": -0.6752851891773114,
              "num_responses": 7,
              "rvariance": 0.009661078764397172
            },
            {
              "id": "safety_sample_112",
              "variance": 0.29765339928230017,
              "mean_reward": 0.007925098649020853,
              "min_reward": -0.15830823252910586,
              "max_reward": 0.19678705082521716,
              "num_responses": 6,
              "rvariance": 0.01589262606284408
            },
            {
              "id": "safety_sample_362",
              "variance": 0.5080995745643475,
              "mean_reward": 0.29283435698460597,
              "min_reward": -0.04864645384615316,
              "max_reward": 0.7594564152579864,
              "num_responses": 7,
              "rvariance": 0.06044789784995454
            },
            {
              "id": "safety_sample_258",
              "variance": 0.3404737128632629,
              "mean_reward": -1.1900241503421916,
              "min_reward": -1.4794715661856312,
              "max_reward": -0.9259406833097747,
              "num_responses": 7,
              "rvariance": 0.024860582405711432
            },
            {
              "id": "safety_sample_78",
              "variance": 0.28825381825233287,
              "mean_reward": -0.5917333577998235,
              "min_reward": -0.7588370205547992,
              "max_reward": -0.41418571612266214,
              "num_responses": 7,
              "rvariance": 0.01430462952534936
            },
            {
              "id": "safety_sample_12",
              "variance": 0.14203811334172922,
              "mean_reward": 0.1374801705170897,
              "min_reward": 0.061015324836799535,
              "max_reward": 0.23595197178341457,
              "num_responses": 7,
              "rvariance": 0.003632087013585147
            },
            {
              "id": "safety_sample_173",
              "variance": 0.1618816732938826,
              "mean_reward": -1.1470049038293777,
              "min_reward": -1.239260050975354,
              "max_reward": -0.9677165989985186,
              "num_responses": 6,
              "rvariance": 0.0073232881547865515
            },
            {
              "id": "safety_sample_67",
              "variance": 0.547264495522545,
              "mean_reward": -0.22843209100664025,
              "min_reward": -0.5395134631888938,
              "max_reward": 0.045349356453520576,
              "num_responses": 7,
              "rvariance": 0.054233378326499604
            },
            {
              "id": "safety_sample_154",
              "variance": 0.1650148669705384,
              "mean_reward": -0.5074355279278941,
              "min_reward": -0.7379490627104273,
              "max_reward": -0.4194077055837551,
              "num_responses": 7,
              "rvariance": 0.009633253076711699
            },
            {
              "id": "safety_sample_17",
              "variance": 0.19634680373709623,
              "mean_reward": -0.5395134631888938,
              "min_reward": -0.6439532524107535,
              "max_reward": -0.4350736739670341,
              "num_responses": 5,
              "rvariance": 0.007809891414057841
            },
            {
              "id": "safety_sample_249",
              "variance": 0.25848847832410277,
              "mean_reward": 0.24117396124450755,
              "min_reward": 0.061015324836799535,
              "max_reward": 0.434387571304948,
              "num_responses": 6,
              "rvariance": 0.013589138342663494
            },
            {
              "id": "safety_sample_266",
              "variance": 0.22976753628809132,
              "mean_reward": -0.8841647676210309,
              "min_reward": -1.0721563882203784,
              "max_reward": -0.7797249783991711,
              "num_responses": 7,
              "rvariance": 0.010035056006889972
            },
            {
              "id": "safety_sample_133",
              "variance": 0.31854135712667214,
              "mean_reward": -0.5569200947258705,
              "min_reward": -0.7483930416326132,
              "max_reward": -0.2888579690564305,
              "num_responses": 6,
              "rvariance": 0.022130449599735594
            },
            {
              "id": "safety_sample_125",
              "variance": 0.375983241198695,
              "mean_reward": -0.6439532524107535,
              "min_reward": -0.8946087465432169,
              "max_reward": -0.42462969504484815,
              "num_responses": 6,
              "rvariance": 0.03130501167366761
            },
            {
              "id": "safety_sample_182",
              "variance": 0.17337005010828715,
              "mean_reward": -0.5827813758665215,
              "min_reward": -0.7275050837882413,
              "max_reward": -0.4977375475001499,
              "num_responses": 7,
              "rvariance": 0.00599699220997373
            },
            {
              "id": "safety_sample_117",
              "variance": 0.32898533604885805,
              "mean_reward": -0.2932096269406747,
              "min_reward": -0.5081815264223359,
              "max_reward": -0.012092527618502264,
              "num_responses": 6,
              "rvariance": 0.023737058430548828
            },
            {
              "id": "safety_sample_242",
              "variance": 0.535253919762031,
              "mean_reward": 0.005314103918474348,
              "min_reward": -0.3619658215117323,
              "max_reward": 0.34300275573582073,
              "num_responses": 6,
              "rvariance": 0.0544626001581664
            },
            {
              "id": "safety_sample_70",
              "variance": 0.29660900139008173,
              "mean_reward": -1.4794715661856315,
              "min_reward": -1.8658987863065122,
              "max_reward": -1.3436998401972136,
              "num_responses": 7,
              "rvariance": 0.027923634106128605
            },
            {
              "id": "safety_sample_31",
              "variance": 0.33942931497104417,
              "mean_reward": -0.5163875098611963,
              "min_reward": -0.6752851891773114,
              "max_reward": -0.19486215875675675,
              "num_responses": 7,
              "rvariance": 0.025211186070548428
            },
            {
              "id": "safety_sample_59",
              "variance": 0.19843559952153333,
              "mean_reward": -0.7083577890975671,
              "min_reward": -0.8528328308544729,
              "max_reward": -0.5917333577998237,
              "num_responses": 6,
              "rvariance": 0.0073232881547865445
            },
            {
              "id": "safety_sample_149",
              "variance": 0.2537886878091191,
              "mean_reward": -0.2590180292787563,
              "min_reward": -0.466405610733592,
              "max_reward": -0.09042236953489705,
              "num_responses": 7,
              "rvariance": 0.01312593339499261
            },
            {
              "id": "safety_sample_309",
              "variance": 0.2825096298451305,
              "mean_reward": 0.38235417631762864,
              "min_reward": 0.23072998232232156,
              "max_reward": 0.6628496102277661,
              "num_responses": 7,
              "rvariance": 0.01882275599905927
            }
          ]
        }
      },
      "overall_stats": {
        "mean_variance_across_files": 0.6203644339535656,
        "mean_rvariance_across_files": 0.14539716319326165,
        "total_processed_files": 4
      }
    }
  },
  "summary": {
    "model_comparison": {
      "Eurus-RM-7b": {
        "mean_variance": 0.6203644339535656,
        "mean_rvariance": 0.14539716319326165
      }
    }
  }
}