{
  "models": {
    "URM-LLaMa-3.1-8B": {
      "model_name": "URM-LLaMa-3.1-8B",
      "model_path": "LxzGordon/URM-LLaMa-3.1-8B",
      "files": {
        "semantic_benchmark_chat_filtered.json": {
          "file_name": "semantic_benchmark_chat_filtered.json",
          "processed_samples": 200,
          "global_mean": 10.293150443358119,
          "global_std": 2.699379266496462,
          "mean_variance": 0.643921397469274,
          "mean_rvariance": 0.12564304646048485,
          "sample_results": [
            {
              "id": "chat_sample_306",
              "rewards": [
                -0.020067278830433927,
                0.9069360778709152,
                1.0825673240717455,
                0.7865158409736499,
                0.7757022202872732,
                -0.12251050726567653,
                1.205340851853484
              ],
              "variance": 1.192721305388972,
              "mean_reward": 0.6592120755658509,
              "min_reward": -0.12251050726567653,
              "max_reward": 1.205340851853484,
              "num_responses": 7,
              "rvariance": 0.2344486183381435
            },
            {
              "id": "chat_sample_202",
              "rewards": [
                0.20270150372816037,
                -0.6910749119142159,
                -0.6897083709832532,
                -0.5995477594057789,
                0.8346899417294087,
                -1.3723782367793096,
                -0.3691951692918474
              ],
              "variance": 1.4190931207889133,
              "mean_reward": -0.3835018575595481,
              "min_reward": -1.3723782367793096,
              "max_reward": 0.8346899417294087,
              "num_responses": 7,
              "rvariance": 0.4343923228115087
            },
            {
              "id": "chat_sample_298",
              "rewards": [
                0.41971230177464774,
                -0.39946044731455865,
                -1.432677032005003,
                -2.345950326607076,
                -0.6691579695168013,
                -0.009611898191626035,
                -1.2133281347131406
              ],
              "variance": 1.9601041316407157,
              "mean_reward": -0.8072105009390798,
              "min_reward": -2.345950326607076,
              "max_reward": 0.41971230177464774,
              "num_responses": 7,
              "rvariance": 0.7500974096613078
            },
            {
              "id": "chat_sample_268",
              "rewards": [
                0.8429548999866322,
                -1.0124904263092616,
                -0.660223872551397,
                0.431344151208726,
                -0.2599559787707729,
                -0.09548493460411511,
                0.4924258457888697
              ],
              "variance": 1.4337679615225176,
              "mean_reward": -0.03734718789304552,
              "min_reward": -1.0124904263092616,
              "max_reward": 0.8429548999866322,
              "num_responses": 7,
              "rvariance": 0.3810110250827714
            },
            {
              "id": "chat_sample_303",
              "rewards": [
                0.2004785783047847,
                0.1675183741648596,
                0.2962869466874216,
                -0.6084422874507417,
                0.2962869466874216,
                -2.8710850147195814,
                0.2962869466874216
              ],
              "variance": 1.8097863250456991,
              "mean_reward": -0.31752421566263056,
              "min_reward": -2.8710850147195814,
              "max_reward": 0.2962869466874216,
              "num_responses": 7,
              "rvariance": 1.1770273880792086
            },
            {
              "id": "chat_sample_65",
              "rewards": [
                0.5956696382751882,
                -1.0407285037472096,
                0.4911497481046306,
                0.5329437137331261,
                -1.2882759095565788,
                -0.9527342905639088,
                0.44842732602148927
              ],
              "variance": 1.6977815496209083,
              "mean_reward": -0.17336403967618044,
              "min_reward": -1.2882759095565788,
              "max_reward": 0.5956696382751882,
              "num_responses": 7,
              "rvariance": 0.6458934422941022
            },
            {
              "id": "chat_sample_212",
              "rewards": [
                0.6852897101359167,
                0.9715309273159743,
                0.5357389753271737,
                1.0027871948193863,
                0.7597647776976515,
                -0.528080636385465,
                1.1859531407189345
              ],
              "variance": 0.9658424425370873,
              "mean_reward": 0.6589977270899389,
              "min_reward": -0.528080636385465,
              "max_reward": 1.1859531407189345,
              "num_responses": 7,
              "rvariance": 0.27553474787090787
            },
            {
              "id": "chat_sample_262",
              "rewards": [
                0.6369965493249007,
                -1.0530040547263277,
                -1.0617268819200887,
                0.6912201020870902,
                0.8049549578994004,
                -0.7648596431318191,
                0.6431957979587171
              ],
              "variance": 1.7932072300158466,
              "mean_reward": -0.01474616750116101,
              "min_reward": -1.0617268819200887,
              "max_reward": 0.8049549578994004,
              "num_responses": 7,
              "rvariance": 0.680681827243066
            },
            {
              "id": "chat_sample_178",
              "rewards": [
                0.9626127285775332,
                0.9217048241317818,
                0.03108049695529203,
                1.2010702347972595,
                0.29357364928571705,
                1.3130591119950874,
                -0.06860633221847935
              ],
              "variance": 1.254660020390607,
              "mean_reward": 0.6649278162177418,
              "min_reward": -0.06860633221847935,
              "max_reward": 1.3130591119950874,
              "num_responses": 7,
              "rvariance": 0.2771160423946119
            },
            {
              "id": "chat_sample_290",
              "rewards": [
                0.22504805154751148,
                -1.2675870168685814,
                0.10340329788015395,
                0.2424831071170583,
                -0.23941264318297129,
                -0.034390521442400866,
                0.298242781897817
              ],
              "variance": 0.9154693696865771,
              "mean_reward": -0.09603042043591611,
              "min_reward": -1.2675870168685814,
              "max_reward": 0.298242781897817,
              "num_responses": 7,
              "rvariance": 0.25854439388287853
            },
            {
              "id": "chat_sample_292",
              "rewards": [
                0.7459566376392894,
                -1.1480344698695697,
                -0.6312679018425812,
                -1.1522096975640155,
                -0.8789530922856307,
                -0.2554521877190894,
                -0.5471118739421084
              ],
              "variance": 1.2948159033716105,
              "mean_reward": -0.5524389407976722,
              "min_reward": -1.1522096975640155,
              "max_reward": 0.7459566376392894,
              "num_responses": 7,
              "rvariance": 0.371620725484846
            },
            {
              "id": "chat_sample_116",
              "rewards": [
                0.43952573209787626,
                0.41789566437366277,
                0.42055738086122035,
                -0.2632303069373091,
                -0.4411618499327356,
                -0.3660105777841697,
                0.6949042512153422
              ],
              "variance": 0.9377482263884588,
              "mean_reward": 0.12892575627055528,
              "min_reward": -0.4411618499327356,
              "max_reward": 0.6949042512153422,
              "num_responses": 7,
              "rvariance": 0.18701497791417523
            },
            {
              "id": "chat_sample_106",
              "rewards": [
                1.0627839237327807,
                0.7607610665873399,
                -0.007530290341255821,
                0.9561954975873559,
                0.6339299579906825,
                1.1101592269071263
              ],
              "variance": 0.7732717414952401,
              "mean_reward": 0.7527165637440049,
              "min_reward": -0.007530290341255821,
              "max_reward": 1.1101592269071263,
              "num_responses": 6,
              "rvariance": 0.14291015876275132
            },
            {
              "id": "chat_sample_251",
              "rewards": [
                -0.24891624996758752,
                -2.1721254722831875,
                0.14583813870222917,
                0.13833841510283015,
                0.09463383588730102,
                0.2108011204249675,
                -0.002312845545894769
              ],
              "variance": 1.1900232702851519,
              "mean_reward": -0.2619632939541917,
              "min_reward": -2.1721254722831875,
              "max_reward": 0.2108011204249675,
              "num_responses": 7,
              "rvariance": 0.6276456142141507
            },
            {
              "id": "chat_sample_280",
              "rewards": [
                0.5174058465811774,
                -0.36503124700324197,
                0.5551143211740854,
                0.642324221827206,
                0.5885175559053826,
                0.6148810557374135,
                -0.24428668627592912
              ],
              "variance": 0.9184428327401848,
              "mean_reward": 0.32984643827801335,
              "min_reward": -0.36503124700324197,
              "max_reward": 0.642324221827206,
              "num_responses": 7,
              "rvariance": 0.16345797691086492
            },
            {
              "id": "chat_sample_58",
              "rewards": [
                -1.048315844241872,
                -0.15061009348207932,
                -1.2206158819530315,
                -1.9502003556354357,
                -2.11510524475122,
                -0.8904217199228877,
                -1.7430528175968634
              ],
              "variance": 1.4216652419351852,
              "mean_reward": -1.3026174225119127,
              "min_reward": -2.11510524475122,
              "max_reward": -0.15061009348207932,
              "num_responses": 7,
              "rvariance": 0.4059861689342355
            },
            {
              "id": "chat_sample_90",
              "rewards": [
                0.8762740507619912,
                0.5309193394998231,
                -0.8534134739042215,
                -1.1574582322254376,
                0.6670230006492328,
                0.2742357525956519
              ],
              "variance": 1.7770843787704416,
              "mean_reward": 0.05626340622950665,
              "min_reward": -1.1574582322254376,
              "max_reward": 0.8762740507619912,
              "num_responses": 6,
              "rvariance": 0.6031478633324991
            },
            {
              "id": "chat_sample_180",
              "rewards": [
                0.6447718421916603,
                -0.12336689175808953,
                0.5161707309931097,
                0.8611039625937891,
                0.4698969983003416
              ],
              "variance": 0.6606324501676546,
              "mean_reward": 0.47371532846416214,
              "min_reward": -0.12336689175808953,
              "max_reward": 0.8611039625937891,
              "num_responses": 5,
              "rvariance": 0.10753090065921841
            },
            {
              "id": "chat_sample_291",
              "rewards": [
                -1.7758003387894152,
                -2.0436889960571882,
                -2.2988604849302012,
                -2.6469186013639634,
                -3.5700085211748593,
                -2.8663409837937888
              ],
              "variance": 1.3084300850610222,
              "mean_reward": -2.5336029876849024,
              "min_reward": -3.5700085211748593,
              "max_reward": -1.7758003387894152,
              "num_responses": 6,
              "rvariance": 0.34451267477862996
            },
            {
              "id": "chat_sample_129",
              "rewards": [
                -0.6468919727140633,
                -0.7699385967056348,
                -0.8074605321021757,
                -0.6378787379077759,
                -0.8361246820227353,
                -2.053934520100083,
                -1.8458443938495643
              ],
              "variance": 1.2857937655582234,
              "mean_reward": -1.0854390622002903,
              "min_reward": -2.053934520100083,
              "max_reward": -0.6378787379077759,
              "num_responses": 7,
              "rvariance": 0.3068291115767149
            },
            {
              "id": "chat_sample_31",
              "rewards": [
                0.3135997625563188,
                -1.1673956839591806,
                -1.5762472071241556,
                -3.7544641665750484,
                -1.702093332236965,
                -1.5697847545106165
              ],
              "variance": 2.3013807887045763,
              "mean_reward": -1.5760642303082744,
              "min_reward": -3.7544641665750484,
              "max_reward": 0.3135997625563188,
              "num_responses": 6,
              "rvariance": 1.4165315114768144
            },
            {
              "id": "chat_sample_294",
              "rewards": [
                0.5872372186939533,
                -0.7248837280800386,
                0.551366579137981,
                0.49481057983333665,
                0.5029342205175547,
                0.21757588487484852,
                0.13454827779482412
              ],
              "variance": 0.774939359515491,
              "mean_reward": 0.25194129039606566,
              "min_reward": -0.7248837280800386,
              "max_reward": 0.5872372186939533,
              "num_responses": 7,
              "rvariance": 0.18474443185987593
            },
            {
              "id": "chat_sample_128",
              "rewards": [
                -0.690533665609605,
                -2.8341417747844977,
                -2.414294331263969,
                -3.0129862293015397,
                -2.8663098939277276,
                -2.837543288766739,
                -3.142954588018918
              ],
              "variance": 1.3401835077862683,
              "mean_reward": -2.5426805388104277,
              "min_reward": -3.142954588018918,
              "max_reward": -0.690533665609605,
              "num_responses": 7,
              "rvariance": 0.6150110125340279
            },
            {
              "id": "chat_sample_173",
              "rewards": [
                0.9350699335987718,
                0.0220178009984528,
                0.018579544447230308,
                0.9844639583035002,
                0.21210618821167276,
                -0.01798355121646863,
                0.2747466156220666
              ],
              "variance": 0.9508732372989124,
              "mean_reward": 0.3470000699950323,
              "min_reward": -0.01798355121646863,
              "max_reward": 0.9844639583035002,
              "num_responses": 7,
              "rvariance": 0.16032712212908584
            },
            {
              "id": "chat_sample_174",
              "rewards": [
                0.12271222446775301,
                -0.6373459706575455,
                -0.7674881499897204,
                0.2126212907652776,
                -1.1057246950996042,
                0.10246282943180271,
                -0.358208434578539
              ],
              "variance": 1.0614586190204367,
              "mean_reward": -0.3472815579515109,
              "min_reward": -1.1057246950996042,
              "max_reward": 0.2126212907652776,
              "num_responses": 7,
              "rvariance": 0.22467452884678002
            },
            {
              "id": "chat_sample_297",
              "rewards": [
                0.6132898198653722,
                0.4074639544283333,
                -0.20589635439326975,
                -0.2037433811685318,
                0.29329808001835644,
                0.6433441814103729,
                0.6952716769051563
              ],
              "variance": 0.8687197500667132,
              "mean_reward": 0.3204325681522557,
              "min_reward": -0.20589635439326975,
              "max_reward": 0.6952716769051563,
              "num_responses": 7,
              "rvariance": 0.12723356292947077
            },
            {
              "id": "chat_sample_264",
              "rewards": [
                -3.3040241182033347,
                -3.6883400843431042,
                -2.914197649951184,
                -2.6383229599859073,
                -3.348413381060075
              ],
              "variance": 0.8036965670578748,
              "mean_reward": -3.178659638708721,
              "min_reward": -3.6883400843431042,
              "max_reward": -2.6383229599859073,
              "num_responses": 5,
              "rvariance": 0.1332421224588203
            },
            {
              "id": "chat_sample_275",
              "rewards": [
                1.0386200319245795,
                0.46633014275768414,
                0.7620032480540577,
                1.0549722415909721,
                0.6402694643157069,
                0.7439499281026121,
                0.8393286910633124
              ],
              "variance": 0.47446718009863875,
              "mean_reward": 0.7922105354012751,
              "min_reward": 0.46633014275768414,
              "max_reward": 1.0549722415909721,
              "num_responses": 7,
              "rvariance": 0.03778673723249498
            },
            {
              "id": "chat_sample_172",
              "rewards": [
                0.1767725554331212,
                -0.8047331029431707,
                -0.7712528501345854,
                -1.183312282206784,
                -0.8552809856314885,
                -0.961147632272788,
                -0.9203768058728519
              ],
              "variance": 0.6579708043388839,
              "mean_reward": -0.7599044433755068,
              "min_reward": -1.183312282206784,
              "max_reward": 0.1767725554331212,
              "num_responses": 7,
              "rvariance": 0.16201761116446392
            },
            {
              "id": "chat_sample_145",
              "rewards": [
                0.39320819095747644,
                0.4193915108839254,
                0.9275401800151092,
                0.9331533140148854,
                0.7851125574737058,
                1.0108832785768682,
                1.0585143665583536
              ],
              "variance": 0.6210175308561167,
              "mean_reward": 0.7896861997829036,
              "min_reward": 0.39320819095747644,
              "max_reward": 1.0585143665583536,
              "num_responses": 7,
              "rvariance": 0.06501673570909791
            },
            {
              "id": "chat_sample_270",
              "rewards": [
                0.45984719909605937,
                -0.04278831821824947,
                0.4481913256745702,
                0.4242941707854168,
                0.14813949537862284,
                0.5059743148068343,
                0.42651886267845507
              ],
              "variance": 0.40652967544049545,
              "mean_reward": 0.33859672145738706,
              "min_reward": -0.04278831821824947,
              "max_reward": 0.5059743148068343,
              "num_responses": 7,
              "rvariance": 0.0359329676498303
            },
            {
              "id": "chat_sample_278",
              "rewards": [
                0.3090436840026232,
                -0.9458535379342736,
                -0.05663532060918806,
                0.14800665685999773,
                0.10211377502647925,
                0.34565624081687407,
                0.2273225578850341
              ],
              "variance": 0.7360113142675457,
              "mean_reward": 0.01852200800679237,
              "min_reward": -0.9458535379342736,
              "max_reward": 0.34565624081687407,
              "num_responses": 7,
              "rvariance": 0.1706342850835792
            },
            {
              "id": "chat_sample_165",
              "rewards": [
                0.5573386597731911,
                0.45831319684108524,
                0.8654053162221423,
                0.9658298231270022,
                1.067683757282812,
                0.9766328449954034,
                1.1673218318938965
              ],
              "variance": 0.5898105125268971,
              "mean_reward": 0.8655036328765047,
              "min_reward": 0.45831319684108524,
              "max_reward": 1.1673218318938965,
              "num_responses": 7,
              "rvariance": 0.05930796938743478
            },
            {
              "id": "chat_sample_127",
              "rewards": [
                0.07285114518424164,
                1.062491749650592,
                1.2548705414282977,
                0.552455431037988,
                0.5761197652256148,
                0.6358462242806364,
                0.5040901982647392
              ],
              "variance": 0.807848689329134,
              "mean_reward": 0.6655321507245872,
              "min_reward": 0.07285114518424164,
              "max_reward": 1.2548705414282977,
              "num_responses": 7,
              "rvariance": 0.12912758767480445
            },
            {
              "id": "chat_sample_256",
              "rewards": [
                0.3085730964845151,
                -0.912128099136524,
                0.33784561855686307,
                0.47706603877890785,
                0.10422152662785548,
                0.16351060779442517,
                0.39418893491413426
              ],
              "variance": 0.72965810013794,
              "mean_reward": 0.124753960574311,
              "min_reward": -0.912128099136524,
              "max_reward": 0.47706603877890785,
              "num_responses": 7,
              "rvariance": 0.19328065708179487
            },
            {
              "id": "chat_sample_114",
              "rewards": [
                -0.08775698312431232,
                0.0337605847273403,
                -0.2063337322817216,
                -0.5749288250125002,
                0.18236943791200186,
                -0.5368437390875327,
                -0.34624731519935814
              ],
              "variance": 0.6452818994587247,
              "mean_reward": -0.2194257960094404,
              "min_reward": -0.5749288250125002,
              "max_reward": 0.18236943791200186,
              "num_responses": 7,
              "rvariance": 0.06946729767996031
            },
            {
              "id": "chat_sample_119",
              "rewards": [
                -0.8086744500542925,
                -0.149045001361044,
                -0.9965596963043576,
                -0.2185824329219686,
                -0.11341106873985589,
                0.2676673118023588,
                -0.3674152744598438
              ],
              "variance": 0.9228488320313486,
              "mean_reward": -0.34086008743414337,
              "min_reward": -0.9965596963043576,
              "max_reward": 0.2676673118023588,
              "num_responses": 7,
              "rvariance": 0.16046870523842616
            },
            {
              "id": "chat_sample_179",
              "rewards": [
                -0.12021268352860798,
                -0.934134071604932,
                -1.0462497813245324,
                -0.39542583060525316,
                -0.3362300190368671,
                -0.517077650151261,
                -0.7278612893432634
              ],
              "variance": 0.7291572706592088,
              "mean_reward": -0.5824559036563881,
              "min_reward": -1.0462497813245324,
              "max_reward": -0.12021268352860798,
              "num_responses": 7,
              "rvariance": 0.09621079514692933
            },
            {
              "id": "chat_sample_191",
              "rewards": [
                -0.23131514624975927,
                0.4322888591842674,
                0.6682051221474233,
                0.9148643470104532,
                0.586477636739049,
                1.0892929806650071,
                0.8593685827972822
              ],
              "variance": 0.8177885434616181,
              "mean_reward": 0.6170260546133891,
              "min_reward": -0.23131514624975927,
              "max_reward": 1.0892929806650071,
              "num_responses": 7,
              "rvariance": 0.16111953229600418
            },
            {
              "id": "chat_sample_156",
              "rewards": [
                0.8554134572227923,
                1.53189220014548,
                1.993967454243631,
                1.9188373797310159,
                2.129721354399852,
                2.117641528259347
              ],
              "variance": 0.9300286126454633,
              "mean_reward": 1.7579122290003528,
              "min_reward": 0.8554134572227923,
              "max_reward": 2.129721354399852,
              "num_responses": 6,
              "rvariance": 0.20247587574693526
            },
            {
              "id": "chat_sample_166",
              "rewards": [
                0.10993287634087057,
                -0.8483726760751172,
                -0.05862648521283479,
                -1.049952301737275,
                -0.31055473578537274,
                -1.5972074295523233,
                -1.0113669516038681
              ],
              "variance": 1.2776516122719417,
              "mean_reward": -0.6808782433751316,
              "min_reward": -1.5972074295523233,
              "max_reward": 0.10993287634087057,
              "num_responses": 7,
              "rvariance": 0.3232672838749107
            },
            {
              "id": "chat_sample_245",
              "rewards": [
                -0.27596019391363963,
                -2.0121652850468634,
                -1.0414562892481876,
                -1.5153534649161091,
                -1.5248655507551057,
                -1.0626532186111395,
                -1.2471390706425585
              ],
              "variance": 0.9845275933574407,
              "mean_reward": -1.239941867590515,
              "min_reward": -2.0121652850468634,
              "max_reward": -0.27596019391363963,
              "num_responses": 7,
              "rvariance": 0.2505003309172765
            },
            {
              "id": "chat_sample_161",
              "rewards": [
                0.5587143863463991,
                1.130721993661216,
                1.0764998540747568,
                1.3270908871127307,
                0.8923489246913606,
                1.2973827536215934,
                1.1958079216724693
              ],
              "variance": 0.5503708976646724,
              "mean_reward": 1.068366674454361,
              "min_reward": 0.5587143863463991,
              "max_reward": 1.3270908871127307,
              "num_responses": 7,
              "rvariance": 0.06147284166782428
            },
            {
              "id": "chat_sample_296",
              "rewards": [
                -2.596201137588039,
                -2.680413692517714,
                -3.061074126337765,
                -3.996323363423982
              ],
              "variance": 1.0942836882311755,
              "mean_reward": -3.0835030799668752,
              "min_reward": -3.996323363423982,
              "max_reward": -2.596201137588039,
              "num_responses": 4,
              "rvariance": 0.308422041292984
            },
            {
              "id": "chat_sample_130",
              "rewards": [
                0.18811117090321314,
                -0.3148875325737197,
                -0.2512239659347664,
                0.5991884458430238,
                0.11770180991684494,
                0.24672616724654683,
                0.23067885024391346
              ],
              "variance": 0.6644004712754855,
              "mean_reward": 0.11661356366357942,
              "min_reward": -0.3148875325737197,
              "max_reward": 0.5991884458430238,
              "num_responses": 7,
              "rvariance": 0.08420420464002887
            },
            {
              "id": "chat_sample_18",
              "rewards": [
                0.5646815208665541,
                0.03042478341654676,
                0.4177840234909885,
                -0.4486827711680854,
                -0.19585291447977274,
                0.16820164463034093,
                0.23025207117343702
              ],
              "variance": 0.7735278795963125,
              "mean_reward": 0.10954405113285845,
              "min_reward": -0.4486827711680854,
              "max_reward": 0.5646815208665541,
              "num_responses": 7,
              "rvariance": 0.10447392665107737
            },
            {
              "id": "chat_sample_44",
              "rewards": [
                0.510521561012217,
                -0.12217487802978859,
                0.7374655712652572,
                0.5016015958041133,
                0.5678442081504159,
                0.5149334956414471,
                0.6484708296650779
              ],
              "variance": 0.43197772003459706,
              "mean_reward": 0.47980891192982,
              "min_reward": -0.12217487802978859,
              "max_reward": 0.7374655712652572,
              "num_responses": 7,
              "rvariance": 0.06680291680197616
            },
            {
              "id": "chat_sample_215",
              "rewards": [
                -0.3903624219644681,
                -0.726319514621774,
                -0.4190520090481686,
                -0.34686911252058206,
                -0.23368716171265566,
                -0.028337889790577633
              ],
              "variance": 0.4416732360833547,
              "mean_reward": -0.357438018276371,
              "min_reward": -0.726319514621774,
              "max_reward": -0.028337889790577633,
              "num_responses": 6,
              "rvariance": 0.044114454900260204
            },
            {
              "id": "chat_sample_300",
              "rewards": [
                0.9470833404799648,
                0.9347434900051292,
                0.46954794389501814,
                0.9347434900051292,
                0.4163164404953269,
                0.4365538235375717
              ],
              "variance": 0.5144782832260977,
              "mean_reward": 0.6898314214030234,
              "min_reward": 0.4163164404953269,
              "max_reward": 0.9470833404799648,
              "num_responses": 6,
              "rvariance": 0.06227119823119088
            },
            {
              "id": "chat_sample_169",
              "rewards": [
                -1.0313012084520163,
                -1.2962603524313865,
                -1.6084336975518758,
                -1.8979368776108316,
                -2.1335387089740503,
                -1.3601005660365963
              ],
              "variance": 0.8519570128507397,
              "mean_reward": -1.5545952351761263,
              "min_reward": -2.1335387089740503,
              "max_reward": -1.0313012084520163,
              "num_responses": 6,
              "rvariance": 0.1390598892809201
            },
            {
              "id": "chat_sample_82",
              "rewards": [
                -0.49661486558007245,
                -0.848755646697962,
                -1.753760450103486,
                -2.2392583853394243,
                -2.0502786344864323,
                -0.8692770780619478,
                -1.6557510605212893
              ],
              "variance": 1.4179712005768232,
              "mean_reward": -1.416242302970088,
              "min_reward": -2.2392583853394243,
              "max_reward": -0.49661486558007245,
              "num_responses": 7,
              "rvariance": 0.3882238817165163
            },
            {
              "id": "chat_sample_77",
              "rewards": [
                0.6252544721838782,
                -0.37254368918421144,
                0.0015649086573746585,
                -0.3830866867182827,
                -0.10000568376455932,
                -0.19993840551536018
              ],
              "variance": 0.6912248783718735,
              "mean_reward": -0.07145918072352679,
              "min_reward": -0.3830866867182827,
              "max_reward": 0.6252544721838782,
              "num_responses": 6,
              "rvariance": 0.1159713049239993
            },
            {
              "id": "chat_sample_277",
              "rewards": [
                -0.732080325485341,
                -1.589285166409638,
                -1.3114463388265516,
                -1.7705376723706925,
                -0.8888990230737539
              ],
              "variance": 0.9032288654655645,
              "mean_reward": -1.2584497052331955,
              "min_reward": -1.7705376723706925,
              "max_reward": -0.732080325485341,
              "num_responses": 5,
              "rvariance": 0.15762545245034434
            },
            {
              "id": "chat_sample_73",
              "rewards": [
                -3.013984637954823,
                -3.6769173849170738,
                -2.216732364202356,
                -2.6480392497178964,
                -3.341617418974243,
                -2.93099377344378
              ],
              "variance": 1.0768815949855322,
              "mean_reward": -2.971380804868362,
              "min_reward": -3.6769173849170738,
              "max_reward": -2.216732364202356,
              "num_responses": 6,
              "rvariance": 0.21872454089985402
            },
            {
              "id": "chat_sample_6",
              "rewards": [
                -0.2889430393456499,
                0.007402737598229616,
                0.37942336829866025,
                0.4217826042191775,
                0.24056260129991433,
                0.12728384795447917,
                0.4272607799367336
              ],
              "variance": 0.5351094476855222,
              "mean_reward": 0.18782469999450638,
              "min_reward": -0.2889430393456499,
              "max_reward": 0.4272607799367336,
              "num_responses": 7,
              "rvariance": 0.05929743283050061
            },
            {
              "id": "chat_sample_80",
              "rewards": [
                0.4456801124022634,
                -0.5969517555896688,
                -0.5969517555896688,
                -0.8008659475578767
              ],
              "variance": 0.8725822419720982,
              "mean_reward": -0.3872723365837377,
              "min_reward": -0.8008659475578767,
              "max_reward": 0.4456801124022634,
              "num_responses": 4,
              "rvariance": 0.2382000937049335
            },
            {
              "id": "chat_sample_224",
              "rewards": [
                -1.6640972763829909,
                -2.7644510136568625,
                -2.973575584541781,
                -2.609131695518037,
                -2.375983137222193,
                -2.637039089835153,
                -2.3575708706353136
              ],
              "variance": 0.7679194090764456,
              "mean_reward": -2.483121238256047,
              "min_reward": -2.973575584541781,
              "max_reward": -1.6640972763829909,
              "num_responses": 7,
              "rvariance": 0.15104328090240318
            },
            {
              "id": "chat_sample_267",
              "rewards": [
                1.042437372865389,
                0.22096397368765408,
                0.3918960572921209,
                1.1058914362023617,
                0.4140723174360004,
                0.44151053741073776,
                0.5540770501882254
              ],
              "variance": 0.7442957743498441,
              "mean_reward": 0.5958355350117842,
              "min_reward": 0.22096397368765408,
              "max_reward": 1.1058914362023617,
              "num_responses": 7,
              "rvariance": 0.1000468664540763
            },
            {
              "id": "chat_sample_308",
              "rewards": [
                0.1553240807902197,
                -0.39522515965158544,
                -0.04039439853153722,
                -0.49381960398602476,
                0.22392316366638812,
                -0.058025885527561646,
                -0.04043891356703394
              ],
              "variance": 0.6174266513260482,
              "mean_reward": -0.09266524525816215,
              "min_reward": -0.49381960398602476,
              "max_reward": 0.22392316366638812,
              "num_responses": 7,
              "rvariance": 0.060121994886486174
            },
            {
              "id": "chat_sample_252",
              "rewards": [
                0.7464678539596367,
                1.3285598832841223,
                1.175558526636519,
                1.8911843570453102,
                1.3807721336885117,
                1.3459165076006512,
                1.6461856136650943
              ],
              "variance": 0.7402628534514146,
              "mean_reward": 1.3592349822685492,
              "min_reward": 0.7464678539596367,
              "max_reward": 1.8911843570453102,
              "num_responses": 7,
              "rvariance": 0.11087336977574706
            },
            {
              "id": "chat_sample_159",
              "rewards": [
                -0.22247431888253857,
                -0.4551466369573545,
                -0.17657719752182996,
                -0.043289289014553776,
                -1.2522003595197486,
                -0.3887697729166967,
                -0.1460314041167029
              ],
              "variance": 0.669033567906469,
              "mean_reward": -0.38349842556134645,
              "min_reward": -1.2522003595197486,
              "max_reward": -0.043289289014553776,
              "num_responses": 7,
              "rvariance": 0.1429546148244358
            },
            {
              "id": "chat_sample_188",
              "rewards": [
                0.7240584198202981,
                0.21936991146415266,
                1.495104762834635,
                1.005032731054443,
                1.3387944552151092,
                1.259065200289032,
                1.3568778051508186
              ],
              "variance": 0.8899855717465052,
              "mean_reward": 1.0569004694040698,
              "min_reward": 0.21936991146415266,
              "max_reward": 1.495104762834635,
              "num_responses": 7,
              "rvariance": 0.17389653287552886
            },
            {
              "id": "chat_sample_88",
              "rewards": [
                0.5415859899102741,
                -0.6037349990939302,
                0.7320170722380323,
                0.6041515190069751,
                0.7540548411603665,
                0.6604312424563937,
                0.5748895957526025
              ],
              "variance": 0.6573745854983735,
              "mean_reward": 0.4661993230615305,
              "min_reward": -0.6037349990939302,
              "max_reward": 0.7540548411603665,
              "num_responses": 7,
              "rvariance": 0.1960761286568117
            },
            {
              "id": "chat_sample_27",
              "rewards": [
                -0.9207654291986169,
                -0.7850355530298067,
                -1.1459111733351628,
                -1.6199030317769978,
                -1.4395535451074482,
                -1.7333315817498187,
                -1.1891126619907926
              ],
              "variance": 0.7988009730350334,
              "mean_reward": -1.261944710884092,
              "min_reward": -1.7333315817498187,
              "max_reward": -0.7850355530298067,
              "num_responses": 7,
              "rvariance": 0.10635693939914923
            },
            {
              "id": "chat_sample_167",
              "rewards": [
                0.21990762482943838,
                -1.3936055494204576,
                0.3919483447941329,
                0.3434262495148481,
                0.22924942299296336,
                0.3376470673667904,
                0.4789017540522486
              ],
              "variance": 0.852227353367899,
              "mean_reward": 0.08678213058999489,
              "min_reward": -1.3936055494204576,
              "max_reward": 0.4789017540522486,
              "num_responses": 7,
              "rvariance": 0.3721786639180663
            },
            {
              "id": "chat_sample_76",
              "rewards": [
                1.1130194945847565,
                0.5302791708941084,
                0.34464158064269496,
                0.005424291576153378,
                0.550250876899103,
                0.6464588207194129
              ],
              "variance": 0.7047062215426605,
              "mean_reward": 0.5316790392193715,
              "min_reward": 0.005424291576153378,
              "max_reward": 1.1130194945847565,
              "num_responses": 6,
              "rvariance": 0.11056751106660166
            },
            {
              "id": "chat_sample_209",
              "rewards": [
                0.024901386075628917,
                0.4456652740570978,
                0.48900808028573306,
                0.276548414677886,
                0.22809697818510397,
                0.29885115404960544,
                0.6345983901109983
              ],
              "variance": 0.40042546287452524,
              "mean_reward": 0.34252423963457906,
              "min_reward": 0.024901386075628917,
              "max_reward": 0.6345983901109983,
              "num_responses": 7,
              "rvariance": 0.03394870301130961
            },
            {
              "id": "chat_sample_61",
              "rewards": [
                -1.5810392860247702,
                -3.340667058295782,
                -2.4805864047608237,
                -2.3689398693836017,
                -3.2171350084409363,
                -1.7059569546829338,
                -1.8202560209054683
              ],
              "variance": 1.610557941163206,
              "mean_reward": -2.359225800356331,
              "min_reward": -3.340667058295782,
              "max_reward": -1.5810392860247702,
              "num_responses": 7,
              "rvariance": 0.4338401100738407
            },
            {
              "id": "chat_sample_118",
              "rewards": [
                -0.657665671186066,
                -0.7742392437461231,
                -0.08834698399161005,
                -0.21970414115769935,
                -0.08354677933054758,
                -0.335630125939459,
                0.1961733384431738
              ],
              "variance": 0.7326363679890299,
              "mean_reward": -0.2804228009869045,
              "min_reward": -0.7742392437461231,
              "max_reward": 0.1961733384431738,
              "num_responses": 7,
              "rvariance": 0.09938551916180578
            },
            {
              "id": "chat_sample_150",
              "rewards": [
                0.9102814181178867,
                1.0253704495735214,
                0.3796848058087203,
                0.4309569410586911,
                0.8028390805375764,
                0.7627306802611034,
                0.6666039940452716
              ],
              "variance": 0.5458689437414379,
              "mean_reward": 0.7112096242003957,
              "min_reward": 0.3796848058087203,
              "max_reward": 1.0253704495735214,
              "num_responses": 7,
              "rvariance": 0.04854527338260046
            },
            {
              "id": "chat_sample_120",
              "rewards": [
                -0.4431275773732413,
                -0.3513743167479957,
                -0.3501575724444188,
                0.04929067941277375,
                0.18237155767559696,
                -0.19824118146356476,
                -0.005211268968236459
              ],
              "variance": 0.49059865171599704,
              "mean_reward": -0.15949281141558377,
              "min_reward": -0.4431275773732413,
              "max_reward": 0.18237155767559696,
              "num_responses": 7,
              "rvariance": 0.04848375243779489
            },
            {
              "id": "chat_sample_244",
              "rewards": [
                1.0516053504141174,
                0.8201836928603997,
                1.0172450424196409,
                0.9726734798937233,
                0.8080791361446182,
                1.3159737869383248
              ],
              "variance": 0.3696581541737123,
              "mean_reward": 0.9976267481118041,
              "min_reward": 0.8080791361446182,
              "max_reward": 1.3159737869383248,
              "num_responses": 6,
              "rvariance": 0.02878006746030896
            },
            {
              "id": "chat_sample_8",
              "rewards": [
                1.194672788267303,
                1.4310161835948678,
                1.374862939373289,
                0.21936001923404227,
                1.4256817985078447,
                1.4033359572763586,
                1.6097341588840697
              ],
              "variance": 0.6979556930565499,
              "mean_reward": 1.2369519778768248,
              "min_reward": 0.21936001923404227,
              "max_reward": 1.6097341588840697,
              "num_responses": 7,
              "rvariance": 0.18517577166901517
            },
            {
              "id": "chat_sample_40",
              "rewards": [
                1.4933319338812816,
                1.0493449758338953,
                1.6563696645637318,
                1.8755896095702267,
                1.6333108761764332,
                1.7123837109759001,
                1.4844455315967668
              ],
              "variance": 0.46726076112201254,
              "mean_reward": 1.5578251860854624,
              "min_reward": 1.0493449758338953,
              "max_reward": 1.8755896095702267,
              "num_responses": 7,
              "rvariance": 0.05833824965517244
            },
            {
              "id": "chat_sample_286",
              "rewards": [
                -0.07571177978919316,
                0.5908097269395309,
                0.5240866348450097,
                0.4689494639733401,
                0.5497400138726883,
                0.6440313381091118,
                0.5683487118860454
              ],
              "variance": 0.3610134049390365,
              "mean_reward": 0.4671791585480762,
              "min_reward": -0.07571177978919316,
              "max_reward": 0.6440313381091118,
              "num_responses": 7,
              "rvariance": 0.05165499285418917
            },
            {
              "id": "chat_sample_307",
              "rewards": [
                -0.5272143596629416,
                0.2519372527511226,
                -0.023315463245964094,
                -0.20965964136240478,
                -0.13506304068788524,
                -0.19922121883235755,
                -0.12470728893804618
              ],
              "variance": 0.42346715183549016,
              "mean_reward": -0.13817767999692526,
              "min_reward": -0.5272143596629416,
              "max_reward": 0.2519372527511226,
              "num_responses": 7,
              "rvariance": 0.04653709493757581
            },
            {
              "id": "chat_sample_206",
              "rewards": [
                0.4191251272588101,
                0.646502982460977,
                0.41179639792274775,
                0.38349684734054224,
                0.7357966107280629,
                0.8417155448713745,
                0.9277991444676417
              ],
              "variance": 0.4756724070200158,
              "mean_reward": 0.6237475221500224,
              "min_reward": 0.38349684734054224,
              "max_reward": 0.9277991444676417,
              "num_responses": 7,
              "rvariance": 0.042506321069542344
            },
            {
              "id": "chat_sample_261",
              "rewards": [
                -1.5850442260437445,
                -2.24329582840019,
                -2.6176022708439834,
                -2.569705505825248,
                -2.5063429456167965,
                -2.8098860265538432,
                -2.371579681647343
              ],
              "variance": 0.7145205856703158,
              "mean_reward": -2.3862080692758783,
              "min_reward": -2.8098860265538432,
              "max_reward": -1.5850442260437445,
              "num_responses": 7,
              "rvariance": 0.134807341107916
            },
            {
              "id": "chat_sample_79",
              "rewards": [
                0.06694336404474899,
                -0.18763812396096619,
                0.05397535695790427,
                -0.20056302918804425,
                -0.08948812339362902,
                0.01316778798898677,
                -0.056179571436245496
              ],
              "variance": 0.25197064584443957,
              "mean_reward": -0.05711176271246356,
              "min_reward": -0.20056302918804425,
              "max_reward": 0.06694336404474899,
              "num_responses": 7,
              "rvariance": 0.010190533203422782
            },
            {
              "id": "chat_sample_69",
              "rewards": [
                -0.32933442806206636,
                -0.844964096214226,
                -0.6688527235591095,
                -1.0229634716446951,
                -1.2278117727704687,
                -0.8468676439226093
              ],
              "variance": 0.6262940463969939,
              "mean_reward": -0.8234656893621959,
              "min_reward": -1.2278117727704687,
              "max_reward": -0.32933442806206636,
              "num_responses": 6,
              "rvariance": 0.07872930431102527
            },
            {
              "id": "chat_sample_203",
              "rewards": [
                0.6557522176141835,
                0.9158571029608165,
                0.7132105296224676,
                0.7989079789504974,
                1.304316853635038,
                1.0825157431575985
              ],
              "variance": 0.5089349247779928,
              "mean_reward": 0.9117600709901003,
              "min_reward": 0.6557522176141835,
              "max_reward": 1.304316853635038,
              "num_responses": 6,
              "rvariance": 0.050162108149007546
            },
            {
              "id": "chat_sample_168",
              "rewards": [
                -0.5417375666407113,
                -0.22698941534006256,
                0.15403385134867997,
                0.199344504781416,
                0.45237856536272153,
                -0.020002272746851422,
                0.12407028634433534
              ],
              "variance": 0.6534468048742603,
              "mean_reward": 0.02015685044421822,
              "min_reward": -0.5417375666407113,
              "max_reward": 0.45237856536272153,
              "num_responses": 7,
              "rvariance": 0.08943774966621465
            },
            {
              "id": "chat_sample_265",
              "rewards": [
                0.8987509640424398,
                0.8012443117262099,
                0.47604572590180855,
                0.5733541803218982,
                0.7364275936915322,
                0.7968521615572006
              ],
              "variance": 0.32529768477247145,
              "mean_reward": 0.7137791562068482,
              "min_reward": 0.47604572590180855,
              "max_reward": 0.8987509640424398,
              "num_responses": 6,
              "rvariance": 0.020919192799886733
            },
            {
              "id": "chat_sample_301",
              "rewards": [
                -1.9620583131863225,
                -1.0601928796651146,
                -0.8014510023101191,
                -1.397144141448514,
                -0.7599940790932417,
                -0.9106612227287275,
                -1.064407676280002
              ],
              "variance": 0.8382415771202693,
              "mean_reward": -1.1365584735302916,
              "min_reward": -1.9620583131863225,
              "max_reward": -0.7599940790932417,
              "num_responses": 7,
              "rvariance": 0.15221709220168256
            },
            {
              "id": "chat_sample_196",
              "rewards": [
                0.5443635868076961,
                0.8456696105640669,
                0.7582851827082845,
                0.6807392842851413,
                1.0671601756748268,
                0.6136296886284502,
                0.389019538093595
              ],
              "variance": 0.45203986928631523,
              "mean_reward": 0.6998381523945801,
              "min_reward": 0.389019538093595,
              "max_reward": 1.0671601756748268,
              "num_responses": 7,
              "rvariance": 0.041169365122773804
            },
            {
              "id": "chat_sample_225",
              "rewards": [
                -0.5242283193453365,
                -0.6234636388733555,
                -0.04628663473799928,
                0.14363429115120924,
                -0.17171587301044264,
                -0.21530033228891712,
                -0.06106421334717872
              ],
              "variance": 0.5936041827742283,
              "mean_reward": -0.21406067435028867,
              "min_reward": -0.6234636388733555,
              "max_reward": 0.14363429115120924,
              "num_responses": 7,
              "rvariance": 0.0635873011581122
            },
            {
              "id": "chat_sample_126",
              "rewards": [
                0.09584846042728283,
                0.05652543256278753,
                0.3375227079025456,
                0.37508138586806794,
                0.35876768524031927,
                0.6043380582033422,
                0.5381131105536653
              ],
              "variance": 0.4844838403320514,
              "mean_reward": 0.33802812010828726,
              "min_reward": 0.05652543256278753,
              "max_reward": 0.6043380582033422,
              "num_responses": 7,
              "rvariance": 0.03580758095644197
            },
            {
              "id": "chat_sample_162",
              "rewards": [
                0.38271324139822704,
                -0.2826445151167972,
                0.22363134287813188,
                -0.45542927210336537,
                0.0576482006803158,
                0.3220222899074433,
                -0.3641409462933076
              ],
              "variance": 0.7469549471210876,
              "mean_reward": -0.01659995123562174,
              "min_reward": -0.45542927210336537,
              "max_reward": 0.38271324139822704,
              "num_responses": 7,
              "rvariance": 0.10306793383033523
            },
            {
              "id": "chat_sample_49",
              "rewards": [
                0.6292696577268955,
                0.7834234591823582,
                0.6867629458344984,
                0.5171239180230315,
                0.4406499133911346,
                0.5790966199009746,
                0.33586999888624697
              ],
              "variance": 0.3266892035844628,
              "mean_reward": 0.5674566447064486,
              "min_reward": 0.33586999888624697,
              "max_reward": 0.7834234591823582,
              "num_responses": 7,
              "rvariance": 0.019582528721348184
            },
            {
              "id": "chat_sample_177",
              "rewards": [
                0.4810540206891215,
                -0.08133621919480989,
                -0.0493362679634568,
                -0.961926998687913,
                0.19028675493963196
              ],
              "variance": 0.9744378012799975,
              "mean_reward": -0.08425174204348525,
              "min_reward": -0.961926998687913,
              "max_reward": 0.4810540206891215,
              "num_responses": 5,
              "rvariance": 0.23329668768680395
            },
            {
              "id": "chat_sample_273",
              "rewards": [
                0.09825156575624043,
                -0.4370495085582771,
                -0.23618848275485205,
                -0.32945313482339095,
                -0.7319679780148016,
                -0.4587742590564043,
                -0.36583039787858773
              ],
              "variance": 0.4656392832893483,
              "mean_reward": -0.351573170761439,
              "min_reward": -0.7319679780148016,
              "max_reward": 0.09825156575624043,
              "num_responses": 7,
              "rvariance": 0.054263853052093525
            },
            {
              "id": "chat_sample_285",
              "rewards": [
                -0.5571270503410043,
                0.19067820461685706,
                0.5501321701377784,
                0.10596467889087766,
                0.14881428678972383,
                0.21276260833828306,
                0.1251337010812013
              ],
              "variance": 0.5069824458599563,
              "mean_reward": 0.11090837135910243,
              "min_reward": -0.5571270503410043,
              "max_reward": 0.5501321701377784,
              "num_responses": 7,
              "rvariance": 0.0939414343533925
            },
            {
              "id": "chat_sample_293",
              "rewards": [
                -0.740955775657948,
                0.21441743711817682,
                -0.49223119446544356,
                -0.4809314413279281,
                -0.8248616714542013,
                -0.28710379113298407,
                -0.16052140146481625
              ],
              "variance": 0.7639722679448304,
              "mean_reward": -0.39602683405502065,
              "min_reward": -0.8248616714542013,
              "max_reward": 0.21441743711817682,
              "num_responses": 7,
              "rvariance": 0.10847265858395913
            },
            {
              "id": "chat_sample_233",
              "rewards": [
                0.6074131285919407,
                0.5348635129624051,
                0.7393069392415181,
                0.8604832251543627,
                0.06398912018107014,
                0.21387195128637582,
                0.762865285249391
              ],
              "variance": 0.6479936423671262,
              "mean_reward": 0.5403990232381519,
              "min_reward": 0.06398912018107014,
              "max_reward": 0.8604832251543627,
              "num_responses": 7,
              "rvariance": 0.07565962139100471
            },
            {
              "id": "chat_sample_235",
              "rewards": [
                -1.8330466744381912,
                -2.448385782575803,
                -1.7777547608240805,
                -1.5950042885891684,
                -1.9634361595231258,
                -2.318133375536684,
                -1.6641085817888313
              ],
              "variance": 0.7337674738433653,
              "mean_reward": -1.9428385176108403,
              "min_reward": -2.448385782575803,
              "max_reward": -1.5950042885891684,
              "num_responses": 7,
              "rvariance": 0.0906906362765714
            },
            {
              "id": "chat_sample_158",
              "rewards": [
                -0.690249617287864,
                -2.325535590010709,
                -1.3969971711725881,
                -1.3397889912685237,
                -1.6175260701990462,
                -1.6711702209119135,
                -1.69184498184261
              ],
              "variance": 0.86534798343359,
              "mean_reward": -1.5333018060990364,
              "min_reward": -2.325535590010709,
              "max_reward": -0.690249617287864,
              "num_responses": 7,
              "rvariance": 0.2065192699253482
            },
            {
              "id": "chat_sample_216",
              "rewards": [
                -0.9046849025663273,
                -1.0970138798995486,
                -0.865388725040703,
                -1.2506515189196088,
                -0.7289289436073195,
                -0.851350237338342,
                -1.2444434379374796
              ],
              "variance": 0.44454495048439824,
              "mean_reward": -0.9917802350441898,
              "min_reward": -1.2506515189196088,
              "max_reward": -0.7289289436073195,
              "num_responses": 7,
              "rvariance": 0.036328421732461876
            },
            {
              "id": "chat_sample_242",
              "rewards": [
                0.9897909242179405,
                0.9788585967702392,
                0.9398005393551291,
                1.1281687384109402,
                0.9117150848960268,
                0.31759834328450787,
                1.063985123103327
              ],
              "variance": 0.4155901809749529,
              "mean_reward": 0.9042739071483016,
              "min_reward": 0.31759834328450787,
              "max_reward": 1.1281687384109402,
              "num_responses": 7,
              "rvariance": 0.06200261915136866
            },
            {
              "id": "chat_sample_92",
              "rewards": [
                1.7819614180451313,
                0.9553751490760592,
                1.506832708218357,
                1.3241733858180331,
                1.7318890689899769,
                1.4248349529516098,
                1.105493980528284
              ],
              "variance": 0.7064715606646446,
              "mean_reward": 1.404365809089636,
              "min_reward": 0.9553751490760592,
              "max_reward": 1.7819614180451313,
              "num_responses": 7,
              "rvariance": 0.07973088405470295
            },
            {
              "id": "chat_sample_250",
              "rewards": [
                -2.3425322078100064,
                -3.130935528434805,
                -3.565644634520451,
                -3.179494675415262,
                -2.642078474488527,
                -3.342905528652188
              ],
              "variance": 0.9619697404370529,
              "mean_reward": -3.03393184155354,
              "min_reward": -3.565644634520451,
              "max_reward": -2.3425322078100064,
              "num_responses": 6,
              "rvariance": 0.17339400036921673
            },
            {
              "id": "chat_sample_283",
              "rewards": [
                -0.31990571959114306,
                0.19128798994437554,
                0.21792635245590203,
                0.14069205928123585,
                0.30363051436864963,
                0.006670712570061408,
                -0.24932748410503336
              ],
              "variance": 0.5297667955204783,
              "mean_reward": 0.041567774989149715,
              "min_reward": -0.31990571959114306,
              "max_reward": 0.30363051436864963,
              "num_responses": 7,
              "rvariance": 0.04978884824755487
            },
            {
              "id": "chat_sample_140",
              "rewards": [
                -0.5996113523136314,
                -0.4816917298706974,
                -0.4284121784961843,
                -0.5224293466409772,
                -1.3749403243778984,
                -0.7114670376989016,
                -0.7403099543493131
              ],
              "variance": 0.5337821930398551,
              "mean_reward": -0.6941231319639433,
              "min_reward": -1.3749403243778984,
              "max_reward": -0.4284121784961843,
              "num_responses": 7,
              "rvariance": 0.08858381813055241
            },
            {
              "id": "chat_sample_232",
              "rewards": [
                -0.3159728515344015,
                -0.1540992243595838,
                0.001098560666456688,
                0.01938293484976627,
                0.2738881113660585,
                0.22593552590598567,
                0.2618761176605956
              ],
              "variance": 0.4855295903722916,
              "mean_reward": 0.044587024936411056,
              "min_reward": -0.3159728515344015,
              "max_reward": 0.2738881113660585,
              "num_responses": 7,
              "rvariance": 0.043526708531462906
            },
            {
              "id": "chat_sample_0",
              "rewards": [
                0.7659672059768605,
                0.8680288769649884,
                1.0563083992437388,
                1.0142869123227043,
                -0.271688163681685,
                1.0165126640975402,
                1.1071399769598649
              ],
              "variance": 0.7257359722167468,
              "mean_reward": 0.7937936959834303,
              "min_reward": -0.271688163681685,
              "max_reward": 1.1071399769598649,
              "num_responses": 7,
              "rvariance": 0.20097966105084927
            },
            {
              "id": "chat_sample_34",
              "rewards": [
                0.8545387014458886,
                0.5683621370554809,
                1.0000710710662215,
                1.0373676049338187,
                0.7674757710686937,
                0.8267782774046989,
                1.3236971455970048
              ],
              "variance": 0.46406910373568455,
              "mean_reward": 0.9111843869388296,
              "min_reward": 0.5683621370554809,
              "max_reward": 1.3236971455970048,
              "num_responses": 7,
              "rvariance": 0.04892888706807942
            },
            {
              "id": "chat_sample_68",
              "rewards": [
                0.16041433976987585,
                -0.38223100881373473,
                0.10408798152136534,
                0.14171661168552532,
                -0.29495963501635675,
                0.14905947277888829,
                0.09011308672685682
              ],
              "variance": 0.48346960411059126,
              "mean_reward": -0.00454273590679712,
              "min_reward": -0.38223100881373473,
              "max_reward": 0.16041433976987585,
              "num_responses": 7,
              "rvariance": 0.04570671948490012
            },
            {
              "id": "chat_sample_149",
              "rewards": [
                0.7835036569050388,
                0.011140587404223653,
                0.1650325980556938,
                0.6383192818082317,
                0.5918915129608876,
                -0.073423848282235,
                0.5478576638002558
              ],
              "variance": 0.7190782187173144,
              "mean_reward": 0.38061735037887084,
              "min_reward": -0.073423848282235,
              "max_reward": 0.7835036569050388,
              "num_responses": 7,
              "rvariance": 0.09863957565011698
            },
            {
              "id": "chat_sample_309",
              "rewards": [
                0.15297114319967903,
                -0.3440201502487923,
                -0.010292342305647255,
                0.046875562090110685,
                -0.1296880267986231,
                -0.28958179477563456,
                -0.18988224702029266
              ],
              "variance": 0.4006709314988357,
              "mean_reward": -0.10908826512274288,
              "min_reward": -0.3440201502487923,
              "max_reward": 0.15297114319967903,
              "num_responses": 7,
              "rvariance": 0.028211915120266207
            },
            {
              "id": "chat_sample_243",
              "rewards": [
                -1.601249112140279,
                -1.8955146944095185,
                -1.754021887613546,
                -1.6412108954347588,
                -1.686627537047249,
                -2.5506714419171446,
                -1.7390803806196802
              ],
              "variance": 0.5323512112956021,
              "mean_reward": -1.8383394213117394,
              "min_reward": -2.5506714419171446,
              "max_reward": -1.601249112140279,
              "num_responses": 7,
              "rvariance": 0.09224795561802444
            },
            {
              "id": "chat_sample_281",
              "rewards": [
                -2.184835574799297,
                -1.8815030570460285,
                -2.5033625580021113,
                -1.526068163301382,
                -1.8933935176387067,
                -2.0136731435508315,
                -1.967315326902125
              ],
              "variance": 0.5729172685322528,
              "mean_reward": -1.9957359058914972,
              "min_reward": -2.5033625580021113,
              "max_reward": -1.526068163301382,
              "num_responses": 7,
              "rvariance": 0.07695483901962
            },
            {
              "id": "chat_sample_99",
              "rewards": [
                1.1862523806797736,
                -0.11900017875222126,
                0.35878252358548485,
                0.7157309285370197,
                0.6369548606408642,
                0.6827071314892421,
                0.4099034490323398
              ],
              "variance": 0.736270066743719,
              "mean_reward": 0.5530472993160719,
              "min_reward": -0.11900017875222126,
              "max_reward": 1.1862523806797736,
              "num_responses": 7,
              "rvariance": 0.1373062238499456
            },
            {
              "id": "chat_sample_43",
              "rewards": [
                0.6420140297544591,
                0.38081817274422397,
                0.8216654076133618,
                0.8116636563839014,
                0.6009923646624383,
                0.5769132633980404,
                0.5612298391458961
              ],
              "variance": 0.32659918429045826,
              "mean_reward": 0.6278995333860459,
              "min_reward": 0.38081817274422397,
              "max_reward": 0.8216654076133618,
              "num_responses": 7,
              "rvariance": 0.02004733261238293
            },
            {
              "id": "chat_sample_148",
              "rewards": [
                0.664665116943637,
                0.5015478951263712,
                0.5468910516008986,
                0.4374222200236902
              ],
              "variance": 0.17267297478632093,
              "mean_reward": 0.5376315709236492,
              "min_reward": 0.4374222200236902,
              "max_reward": 0.664665116943637,
              "num_responses": 4,
              "rvariance": 0.00689180136591472
            },
            {
              "id": "chat_sample_249",
              "rewards": [
                0.8127298974722275,
                0.527749586337311,
                0.3459339298478297,
                0.7354623946679051,
                0.4942827586981613,
                0.48540377558622916,
                0.6915338270991622
              ],
              "variance": 0.33675355849876465,
              "mean_reward": 0.584728024244118,
              "min_reward": 0.3459339298478297,
              "max_reward": 0.8127298974722275,
              "num_responses": 7,
              "rvariance": 0.023489714068867
            },
            {
              "id": "chat_sample_100",
              "rewards": [
                0.006893994335410012,
                0.5542770145540281,
                0.5139393265153538,
                -0.0575058368589016,
                0.613156274758882,
                0.5810637605172103
              ],
              "variance": 0.622415938899792,
              "mean_reward": 0.36863742230366375,
              "min_reward": -0.0575058368589016,
              "max_reward": 0.613156274758882,
              "num_responses": 6,
              "rvariance": 0.07882425082652901
            },
            {
              "id": "chat_sample_141",
              "rewards": [
                -1.5769043338386308,
                -0.8463504216054093,
                -0.4905184254806175,
                -0.8427461169059055,
                -0.9654090636867672,
                -0.6036339570292314,
                -1.736556448765803
              ],
              "variance": 1.082377435399714,
              "mean_reward": -1.008874109616052,
              "min_reward": -1.736556448765803,
              "max_reward": -0.4905184254806175,
              "num_responses": 7,
              "rvariance": 0.19157054117557548
            },
            {
              "id": "chat_sample_97",
              "rewards": [
                1.4541569361745095,
                0.582960595640876,
                1.4805589450451844,
                1.208585503329689,
                0.9315521859127338,
                1.1389788261579918,
                1.2706762053810918
              ],
              "variance": 0.6726021899187888,
              "mean_reward": 1.1524955996631536,
              "min_reward": 0.582960595640876,
              "max_reward": 1.4805589450451844,
              "num_responses": 7,
              "rvariance": 0.08415809563465457
            },
            {
              "id": "chat_sample_137",
              "rewards": [
                0.024721912757912003,
                0.2969843489102035,
                0.42346640310153744,
                0.7125943850041638,
                0.44938899210579136,
                0.6321825662004702,
                0.34131496497414676
              ],
              "variance": 0.47626791927266077,
              "mean_reward": 0.4115219390077464,
              "min_reward": 0.024721912757912003,
              "max_reward": 0.7125943850041638,
              "num_responses": 7,
              "rvariance": 0.044082064731335684
            },
            {
              "id": "chat_sample_207",
              "rewards": [
                -0.14538416963233794,
                0.1437113092284972,
                -0.33754709881727785,
                0.35933507529593617,
                -0.3018114175435258,
                0.062231129572882404,
                0.05059080108442385
              ],
              "variance": 0.5460665057084995,
              "mean_reward": -0.024124910115914566,
              "min_reward": -0.33754709881727785,
              "max_reward": 0.35933507529593617,
              "num_responses": 7,
              "rvariance": 0.05404249040327954
            },
            {
              "id": "chat_sample_190",
              "rewards": [
                -0.746744143448251,
                -0.02942886145417967,
                0.08699915400568183,
                0.14127287450628823,
                0.26360725792991235,
                0.15077012200011922,
                0.18326115179766622
              ],
              "variance": 0.5317545685023728,
              "mean_reward": 0.007105365048176735,
              "min_reward": -0.746744143448251,
              "max_reward": 0.26360725792991235,
              "num_responses": 7,
              "rvariance": 0.10163877341741653
            },
            {
              "id": "chat_sample_254",
              "rewards": [
                0.24813227709795102,
                0.32939836063046257,
                0.3201357003078206,
                0.4807932897669265,
                0.10302739313595946,
                -0.8189517705511136,
                0.3742030971518391
              ],
              "variance": 0.6826034465367438,
              "mean_reward": 0.14810547821997797,
              "min_reward": -0.8189517705511136,
              "max_reward": 0.4807932897669265,
              "num_responses": 7,
              "rvariance": 0.16735713377316838
            },
            {
              "id": "chat_sample_171",
              "rewards": [
                0.8348549299958926,
                0.44537698620816674,
                0.4809777091996986,
                0.2190703182093811,
                0.4220228440932868,
                0.6091039933529508,
                0.4869808797009699
              ],
              "variance": 0.3585625342704031,
              "mean_reward": 0.49976966582290666,
              "min_reward": 0.2190703182093811,
              "max_reward": 0.8348549299958926,
              "num_responses": 7,
              "rvariance": 0.030364010823130835
            },
            {
              "id": "chat_sample_131",
              "rewards": [
                0.49644067803795444,
                0.8741857303269032,
                1.0075598425537127,
                1.030187259049412,
                0.9789416208443799,
                0.7370211274981551,
                1.1253045845000524
              ],
              "variance": 0.4274452415155935,
              "mean_reward": 0.8928058346872243,
              "min_reward": 0.49644067803795444,
              "max_reward": 1.1253045845000524,
              "num_responses": 7,
              "rvariance": 0.03931972872694549
            },
            {
              "id": "chat_sample_272",
              "rewards": [
                -0.3624924768041991,
                -0.2461549045910611,
                -1.2332510861554484,
                -0.726500401115221,
                -0.510692922202875,
                -0.7048865849119031,
                -1.2452616666851812
              ],
              "variance": 0.9220978704483976,
              "mean_reward": -0.7184628632094128,
              "min_reward": -1.2452616666851812,
              "max_reward": -0.2461549045910611,
              "num_responses": 7,
              "rvariance": 0.1336758404761442
            },
            {
              "id": "chat_sample_317",
              "rewards": [
                -0.04506989043442239,
                0.5784642237617752,
                0.5513743516044963,
                0.4347378927244518,
                0.4978990753913706,
                0.5412765044253922,
                0.6283641653778631
              ],
              "variance": 0.3556094209473083,
              "mean_reward": 0.4552923318358467,
              "min_reward": -0.04506989043442239,
              "max_reward": 0.6283641653778631,
              "num_responses": 7,
              "rvariance": 0.044907197146253186
            },
            {
              "id": "chat_sample_221",
              "rewards": [
                0.03138362314938871,
                0.39985718276738264,
                0.37356575489758453,
                -0.18375189070331643,
                0.5584056074493823,
                0.07307725330105035,
                0.22953276472683928
              ],
              "variance": 0.5179471350318758,
              "mean_reward": 0.21172432794118734,
              "min_reward": -0.18375189070331643,
              "max_reward": 0.5584056074493823,
              "num_responses": 7,
              "rvariance": 0.05574841273585008
            },
            {
              "id": "chat_sample_263",
              "rewards": [
                -1.181314051724487,
                -0.8640518608000715,
                -0.6840641471174157,
                -0.6170612462283438,
                -0.4337144138353486,
                -0.47241705755435,
                -0.5188752096798902
              ],
              "variance": 0.5340207371030882,
              "mean_reward": -0.6816425695628437,
              "min_reward": -1.181314051724487,
              "max_reward": -0.4337144138353486,
              "num_responses": 7,
              "rvariance": 0.05983689281395562
            },
            {
              "id": "chat_sample_112",
              "rewards": [
                1.3820658960693766,
                1.3443030142108614,
                1.205763038102838,
                1.0854805858392529,
                1.3281797390127377,
                1.115068246099403,
                0.9117850370946645
              ],
              "variance": 0.34340580061285,
              "mean_reward": 1.1960922223470192,
              "min_reward": 0.9117850370946645,
              "max_reward": 1.3820658960693766,
              "num_responses": 7,
              "rvariance": 0.02481766818900195
            },
            {
              "id": "chat_sample_138",
              "rewards": [
                -1.080029627387889,
                -1.170828994395348,
                -0.5069529526332859,
                -0.5734481701413356,
                -0.5950619863446536,
                -0.7508395267139488,
                -0.5133687704477331
              ],
              "variance": 0.6055469308689185,
              "mean_reward": -0.7415042897234564,
              "min_reward": -1.170828994395348,
              "max_reward": -0.5069529526332859,
              "num_responses": 7,
              "rvariance": 0.0651078007665677
            },
            {
              "id": "chat_sample_1",
              "rewards": [
                0.8417416886223804,
                0.6182719709016792,
                0.5222982609586259,
                0.6500528798948738,
                0.7549712856213068,
                0.7096528597220555
              ],
              "variance": 0.22807137119169107,
              "mean_reward": 0.6828314909534869,
              "min_reward": 0.5222982609586259,
              "max_reward": 0.8417416886223804,
              "num_responses": 6,
              "rvariance": 0.01036487893755602
            },
            {
              "id": "chat_sample_42",
              "rewards": [
                -1.8045627044232135,
                -2.272548566012317,
                -2.4196403750507653,
                -2.7244609668477815,
                -3.1237127872784964,
                -2.8736329705608696,
                -2.292571146343594
              ],
              "variance": 0.8883106758712449,
              "mean_reward": -2.5015899309310052,
              "min_reward": -3.1237127872784964,
              "max_reward": -1.8045627044232135,
              "num_responses": 7,
              "rvariance": 0.16626226481913345
            },
            {
              "id": "chat_sample_101",
              "rewards": [
                -1.1200832671048224,
                -0.3145356518169361,
                -0.262526545423742,
                -0.5267586104899991,
                -0.6209707968855395,
                -0.3179131418117663,
                -0.34699064563336673
              ],
              "variance": 0.5268837757135942,
              "mean_reward": -0.5013969513094532,
              "min_reward": -1.1200832671048224,
              "max_reward": -0.262526545423742,
              "num_responses": 7,
              "rvariance": 0.07817110104157834
            },
            {
              "id": "chat_sample_21",
              "rewards": [
                -0.5116128996031404,
                -0.1776399056708309,
                0.11684613201229696,
                -0.35049037532884664,
                -0.2880265948847096,
                -0.11267480418449752,
                -0.21705973607283494
              ],
              "variance": 0.3940729553327844,
              "mean_reward": -0.22009402624750904,
              "min_reward": -0.5116128996031404,
              "max_reward": 0.11684613201229696,
              "num_responses": 7,
              "rvariance": 0.03335434486364222
            },
            {
              "id": "chat_sample_66",
              "rewards": [
                0.3714897997501345,
                0.8785609223871518,
                1.0639890093365847,
                1.0847054589513179,
                0.9174645903537534,
                0.9536418890431475,
                1.039915560775107
              ],
              "variance": 0.39654311585013313,
              "mean_reward": 0.9013953186567425,
              "min_reward": 0.3714897997501345,
              "max_reward": 1.0847054589513179,
              "num_responses": 7,
              "rvariance": 0.051933766784418786
            },
            {
              "id": "chat_sample_151",
              "rewards": [
                0.12158521682303458,
                0.22167833401919662,
                -0.0833528209615976,
                0.26703774201461955,
                0.10054373679038876,
                -0.2598570564696691,
                -0.001293945844525506
              ],
              "variance": 0.39377661238219197,
              "mean_reward": 0.05233445805306388,
              "min_reward": -0.2598570564696691,
              "max_reward": 0.26703774201461955,
              "num_responses": 7,
              "rvariance": 0.0286636051069575
            },
            {
              "id": "chat_sample_33",
              "rewards": [
                0.8465690969162465,
                0.8923800145574218,
                1.0943539162482647,
                0.71158891047223,
                0.7556425440930826,
                1.026522894381381,
                0.7333878526961851
              ],
              "variance": 0.3289870273215313,
              "mean_reward": 0.8657778899092589,
              "min_reward": 0.71158891047223,
              "max_reward": 1.0943539162482647,
              "num_responses": 7,
              "rvariance": 0.01894196639641107
            },
            {
              "id": "chat_sample_219",
              "rewards": [
                0.2928253727366532,
                -0.3055824769791761,
                -0.7905094892201725,
                -0.5333107997623965
              ],
              "variance": 0.8266529002047442,
              "mean_reward": -0.334144348306273,
              "min_reward": -0.7905094892201725,
              "max_reward": 0.2928253727366532,
              "num_responses": 4,
              "rvariance": 0.1604608072063345
            },
            {
              "id": "chat_sample_5",
              "rewards": [
                0.7711447285578475,
                0.8431884272760237,
                1.1309473951901599,
                0.9929613839683177,
                0.9537196137083005,
                0.851435367542689,
                1.1728219118352685
              ],
              "variance": 0.33332625405944993,
              "mean_reward": 0.9594598325826581,
              "min_reward": 0.7711447285578475,
              "max_reward": 1.1728219118352685,
              "num_responses": 7,
              "rvariance": 0.019533938313293846
            },
            {
              "id": "chat_sample_86",
              "rewards": [
                0.7389720165934953,
                0.49518719116539617,
                0.7490257020310352,
                0.9126841701529117,
                0.8031160629806671,
                0.9078712469102788,
                0.924396570603603
              ],
              "variance": 0.2759110439109326,
              "mean_reward": 0.7901789943481983,
              "min_reward": 0.49518719116539617,
              "max_reward": 0.924396570603603,
              "num_responses": 7,
              "rvariance": 0.01976808884530149
            },
            {
              "id": "chat_sample_108",
              "rewards": [
                0.4904057110827569,
                1.0630414750095831,
                1.1876213946682637,
                1.0085550715616036,
                0.8718313795606325,
                1.33155051642285,
                1.1658620213647504
              ],
              "variance": 0.5259319312006159,
              "mean_reward": 1.0169810813814915,
              "min_reward": 0.4904057110827569,
              "max_reward": 1.33155051642285,
              "num_responses": 7,
              "rvariance": 0.0643971706168199
            },
            {
              "id": "chat_sample_28",
              "rewards": [
                -0.7608165473681333,
                -0.04213401785523426,
                -0.1662680805710827,
                -0.250849474366302,
                -0.7122216735387508,
                -0.12119484066099583,
                0.15700646649684952
              ],
              "variance": 0.7691817989561032,
              "mean_reward": -0.2709254525519499,
              "min_reward": -0.7608165473681333,
              "max_reward": 0.15700646649684952,
              "num_responses": 7,
              "rvariance": 0.10056890770229883
            },
            {
              "id": "chat_sample_255",
              "rewards": [
                0.18983171235455443,
                -0.5613870685792535,
                0.19890500712936907,
                0.335845268310971,
                0.5051062716146484,
                0.19298733375976604,
                0.12418475357846975
              ],
              "variance": 0.5535936449170614,
              "mean_reward": 0.14078189688121787,
              "min_reward": -0.5613870685792535,
              "max_reward": 0.5051062716146484,
              "num_responses": 7,
              "rvariance": 0.09608689687180781
            },
            {
              "id": "chat_sample_29",
              "rewards": [
                0.5056856736639707,
                0.5332157500611615,
                0.730181710258624,
                0.9688660311830242,
                0.7895008214094574,
                0.8982213764376019,
                0.8040812620042942
              ],
              "variance": 0.40427551883348567,
              "mean_reward": 0.7471075178597333,
              "min_reward": 0.5056856736639707,
              "max_reward": 0.9688660311830242,
              "num_responses": 7,
              "rvariance": 0.025910873477598313
            },
            {
              "id": "chat_sample_60",
              "rewards": [
                0.757441516797442,
                0.5373807322315646,
                0.2985565069098891,
                0.9334129850552829,
                0.5659816425382042,
                0.4270862527340719,
                0.5139259013459182
              ],
              "variance": 0.45215574969617967,
              "mean_reward": 0.5762550768017676,
              "min_reward": 0.2985565069098891,
              "max_reward": 0.9334129850552829,
              "num_responses": 7,
              "rvariance": 0.037894259355771856
            },
            {
              "id": "chat_sample_125",
              "rewards": [
                0.46129146469217497,
                0.7255433142186528,
                0.6003910583893002,
                0.664822686037538,
                0.5936685814414311,
                -0.02541120285363485,
                0.6616691843959215
              ],
              "variance": 0.4225005396361329,
              "mean_reward": 0.5259964409030549,
              "min_reward": -0.02541120285363485,
              "max_reward": 0.7255433142186528,
              "num_responses": 7,
              "rvariance": 0.05654999651011108
            },
            {
              "id": "chat_sample_314",
              "rewards": [
                -0.1267761782068459,
                0.08988344567072297,
                -0.14050306066072987,
                0.20489969857626006,
                0.017178380710881316,
                -0.07854873006727749,
                -0.1134478113088373
              ],
              "variance": 0.26815687802133736,
              "mean_reward": -0.021044893612260886,
              "min_reward": -0.14050306066072987,
              "max_reward": 0.20489969857626006,
              "num_responses": 7,
              "rvariance": 0.014587346073969517
            },
            {
              "id": "chat_sample_310",
              "rewards": [
                0.6168637412866799,
                0.724741336991847,
                1.032631699768474,
                1.222064020149016,
                0.8048026882144871,
                1.232341340645837,
                1.1006930692793566
              ],
              "variance": 0.5445846496379643,
              "mean_reward": 0.9620196994765282,
              "min_reward": 0.6168637412866799,
              "max_reward": 1.232341340645837,
              "num_responses": 7,
              "rvariance": 0.052152005983388414
            },
            {
              "id": "chat_sample_222",
              "rewards": [
                0.1304606669956416,
                -0.016804962657603215,
                0.2074441214782231,
                0.296607737578144,
                0.13500614673136174,
                0.37003352216031343,
                0.11323970754919799
              ],
              "variance": 0.2647562119445343,
              "mean_reward": 0.17656956283361125,
              "min_reward": -0.016804962657603215,
              "max_reward": 0.37003352216031343,
              "num_responses": 7,
              "rvariance": 0.014006947262663572
            },
            {
              "id": "chat_sample_143",
              "rewards": [
                -0.25566416407859754,
                0.06886881597694818,
                0.2964289708482921,
                0.12506162911896854,
                0.13650552618094952,
                0.2254479802791169,
                0.19903501929653408
              ],
              "variance": 0.31478475255205707,
              "mean_reward": 0.1136691110888874,
              "min_reward": -0.25566416407859754,
              "max_reward": 0.2964289708482921,
              "num_responses": 7,
              "rvariance": 0.027464063732888674
            },
            {
              "id": "chat_sample_12",
              "rewards": [
                0.5567864613566723,
                0.4637341389415741,
                0.7690836117555632,
                0.8955829773495902,
                1.011048266843352,
                0.8146980979702608,
                0.796263573865633
              ],
              "variance": 0.4222035607564619,
              "mean_reward": 0.7581710182975209,
              "min_reward": 0.4637341389415741,
              "max_reward": 1.011048266843352,
              "num_responses": 7,
              "rvariance": 0.030691886177683765
            },
            {
              "id": "chat_sample_248",
              "rewards": [
                -0.5101841789400553,
                -0.871461141152747,
                -1.1576044959134983,
                -1.2271744305162142,
                -1.0452987140582057
              ],
              "variance": 0.544651492849996,
              "mean_reward": -0.9623445921161441,
              "min_reward": -1.2271744305162142,
              "max_reward": -0.5101841789400553,
              "num_responses": 5,
              "rvariance": 0.06557030011754506
            },
            {
              "id": "chat_sample_64",
              "rewards": [
                0.17709263973597852,
                -0.039073785811801334,
                0.025641183570312427,
                0.06929842139888473,
                0.18952293345753754,
                0.208609284867653,
                -0.652592723609103
              ],
              "variance": 0.4816388349523057,
              "mean_reward": -0.003071720912934014,
              "min_reward": -0.652592723609103,
              "max_reward": 0.208609284867653,
              "num_responses": 7,
              "rvariance": 0.07765661370727281
            },
            {
              "id": "chat_sample_4",
              "rewards": [
                0.4659076032143979,
                0.8557656912735083,
                0.9682876890154993,
                1.1152600847047578,
                0.9078380372806224,
                0.9306753103722349,
                0.9961212449007194
              ],
              "variance": 0.3439543247724707,
              "mean_reward": 0.8914079515373914,
              "min_reward": 0.4659076032143979,
              "max_reward": 1.1152600847047578,
              "num_responses": 7,
              "rvariance": 0.03587399081319699
            },
            {
              "id": "chat_sample_311",
              "rewards": [
                0.06069500755431321,
                0.061977464529337625,
                0.38665882803653906,
                0.2820407221527427,
                0.21719998013065406,
                0.05753514662191144,
                0.1622429891645663
              ],
              "variance": 0.2644569013249088,
              "mean_reward": 0.1754785911700092,
              "min_reward": 0.05753514662191144,
              "max_reward": 0.38665882803653906,
              "num_responses": 7,
              "rvariance": 0.013976695512581464
            },
            {
              "id": "chat_sample_117",
              "rewards": [
                -0.0539531130735447,
                -0.05066182679824787,
                0.17776248503202435,
                0.060498576127835636,
                0.2988525672253355,
                0.030968856072617724,
                -0.08299246115043372
              ],
              "variance": 0.2917673702136492,
              "mean_reward": 0.054353583347940986,
              "min_reward": -0.08299246115043372,
              "max_reward": 0.2988525672253355,
              "num_responses": 7,
              "rvariance": 0.01674523276217343
            },
            {
              "id": "chat_sample_39",
              "rewards": [
                0.11325383930649853,
                0.16408153078936716,
                0.21271809330278635,
                0.23874172437173916,
                0.2505403285419638,
                0.4202245779767925,
                -0.0027954450577083656
              ],
              "variance": 0.2515799027550796,
              "mean_reward": 0.19953780703306273,
              "min_reward": -0.0027954450577083656,
              "max_reward": 0.4202245779767925,
              "num_responses": 7,
              "rvariance": 0.014665055809145911
            },
            {
              "id": "chat_sample_287",
              "rewards": [
                0.10292352471980046,
                0.5088836903410839,
                0.8022635647215117,
                0.5056457514495967,
                0.7260287400819265,
                0.7516503226556789
              ],
              "variance": 0.47267230560389667,
              "mean_reward": 0.5662325989949331,
              "min_reward": 0.10292352471980046,
              "max_reward": 0.8022635647215117,
              "num_responses": 6,
              "rvariance": 0.05620668624343301
            },
            {
              "id": "chat_sample_313",
              "rewards": [
                -0.16812216712891415,
                -0.7082817396033589,
                -0.4561118359809817,
                -0.4628795345522125,
                -0.48685688716404646,
                -0.5375997881031118,
                -0.4257808452868229
              ],
              "variance": 0.2831551946795514,
              "mean_reward": -0.4636618282599212,
              "min_reward": -0.7082817396033589,
              "max_reward": -0.16812216712891415,
              "num_responses": 7,
              "rvariance": 0.02209714403261518
            },
            {
              "id": "chat_sample_3",
              "rewards": [
                0.9888667072904849,
                1.0551828047747502,
                0.9634828915333142,
                1.183619634294682,
                1.0876861998599352,
                1.1562241628857788,
                0.8292845445619504
              ],
              "variance": 0.25737879870457125,
              "mean_reward": 1.0377638493144137,
              "min_reward": 0.8292845445619504,
              "max_reward": 1.183619634294682,
              "num_responses": 7,
              "rvariance": 0.012782089813430248
            },
            {
              "id": "chat_sample_170",
              "rewards": [
                -1.7494997252773719,
                -1.6044852845621036,
                -0.6265040864565676,
                -1.7014008761292383,
                -1.4026385686869656,
                -1.1568590457158947
              ],
              "variance": 0.8337687346170739,
              "mean_reward": -1.3735645978046902,
              "min_reward": -1.7494997252773719,
              "max_reward": -0.6265040864565676,
              "num_responses": 6,
              "rvariance": 0.15133903478846647
            },
            {
              "id": "chat_sample_83",
              "rewards": [
                -0.2559390267580931,
                -0.810397817857094,
                -0.6364132746757095,
                -0.20221361844074784,
                -0.520893931210273,
                -0.325328074867362,
                -0.37338735509505394
              ],
              "variance": 0.47155822851710827,
              "mean_reward": -0.4463675855577619,
              "min_reward": -0.810397817857094,
              "max_reward": -0.20221361844074784,
              "num_responses": 7,
              "rvariance": 0.04143434614694216
            },
            {
              "id": "chat_sample_279",
              "rewards": [
                0.276029072597091,
                -0.15143750787202623,
                0.2692903441283263,
                0.17526469692915309,
                0.07423888375115512,
                -0.04485367454772406,
                0.2862350277195443
              ],
              "variance": 0.3675986625235172,
              "mean_reward": 0.12639526324364564,
              "min_reward": -0.15143750787202623,
              "max_reward": 0.2862350277195443,
              "num_responses": 7,
              "rvariance": 0.02571196974590943
            },
            {
              "id": "chat_sample_55",
              "rewards": [
                0.6868102872214552,
                0.5536976125047058,
                0.8892420578488358,
                0.3801518603875033,
                0.3440918552837038,
                0.527390639701877
              ],
              "variance": 0.42590431469954193,
              "mean_reward": 0.5635640521580134,
              "min_reward": 0.3440918552837038,
              "max_reward": 0.8892420578488358,
              "num_responses": 6,
              "rvariance": 0.03407828958985278
            },
            {
              "id": "chat_sample_103",
              "rewards": [
                -0.18639452931851827,
                -0.36872952788879443,
                0.04928361353412348,
                -0.10216360310435246,
                -0.046196191491275795,
                0.15813064779010785,
                0.0027237127560193124
              ],
              "variance": 0.35215095598314594,
              "mean_reward": -0.0704779825318129,
              "min_reward": -0.36872952788879443,
              "max_reward": 0.15813064779010785,
              "num_responses": 7,
              "rvariance": 0.02513534971384615
            },
            {
              "id": "chat_sample_113",
              "rewards": [
                0.2579665670034,
                0.7948680628322042,
                0.8888675662803714,
                0.9312119638557231,
                0.8222561150685246,
                0.8194449552475138,
                0.8749227014701265
              ],
              "variance": 0.32569786080982965,
              "mean_reward": 0.7699339902511234,
              "min_reward": 0.2579665670034,
              "max_reward": 0.9312119638557231,
              "num_responses": 7,
              "rvariance": 0.04558567151474453
            },
            {
              "id": "chat_sample_104",
              "rewards": [
                0.17114740943963944,
                0.6191184631639818,
                0.7390462083193231,
                0.6334515980060591,
                0.5725670414402579,
                0.7969963054816662,
                0.6806608530321233
              ],
              "variance": 0.35022705854424974,
              "mean_reward": 0.6018554112690072,
              "min_reward": 0.17114740943963944,
              "max_reward": 0.7969963054816662,
              "num_responses": 7,
              "rvariance": 0.035825014923574365
            },
            {
              "id": "chat_sample_282",
              "rewards": [
                0.4868755981090809,
                0.2579835251121606,
                0.43294739907447277,
                0.8608669023650725,
                0.5572651746352283,
                0.6959485880798524,
                0.6656147710342335
              ],
              "variance": 0.3989540643043925,
              "mean_reward": 0.5653574226300144,
              "min_reward": 0.2579835251121606,
              "max_reward": 0.8608669023650725,
              "num_responses": 7,
              "rvariance": 0.033238207069559364
            },
            {
              "id": "chat_sample_62",
              "rewards": [
                0.7237538804504714,
                0.23857214328413262,
                0.41749502905419233,
                0.6529876925922644,
                0.5829305656566123,
                0.2565449122189652,
                -0.48440220092094183
              ],
              "variance": 0.7319117621334443,
              "mean_reward": 0.3411260031908138,
              "min_reward": -0.48440220092094183,
              "max_reward": 0.7237538804504714,
              "num_responses": 7,
              "rvariance": 0.14387593588984054
            },
            {
              "id": "chat_sample_91",
              "rewards": [
                0.4856496681632586,
                0.3344864998465236,
                0.33968486676952897,
                0.7110441312282941,
                0.5968786101122497,
                0.7501912187143976,
                0.6156300388743423
              ],
              "variance": 0.3890974462224087,
              "mean_reward": 0.5476521476726565,
              "min_reward": 0.3344864998465236,
              "max_reward": 0.7501912187143976,
              "num_responses": 7,
              "rvariance": 0.023899649241418675
            },
            {
              "id": "chat_sample_284",
              "rewards": [
                -1.3002794242076612,
                -0.7339464240368779,
                -0.5790185555752778,
                -0.7014447954213555,
                -0.8164313716365614,
                -0.7315058695510739,
                -0.4181108340119523
              ],
              "variance": 0.49531512571505376,
              "mean_reward": -0.7543910392058228,
              "min_reward": -1.3002794242076612,
              "max_reward": -0.4181108340119523,
              "num_responses": 7,
              "rvariance": 0.0642040048797752
            },
            {
              "id": "chat_sample_84",
              "rewards": [
                0.5660551276761671,
                0.7814845820807235,
                0.6240200631836756,
                0.9266244421420339,
                0.8288499930249587,
                0.6240200631836756,
                0.4434529474516976
              ],
              "variance": 0.35094551708540955,
              "mean_reward": 0.6849296026775616,
              "min_reward": 0.4434529474516976,
              "max_reward": 0.9266244421420339,
              "num_responses": 7,
              "rvariance": 0.02404491400824166
            },
            {
              "id": "chat_sample_175",
              "rewards": [
                0.2800930127027951,
                0.13771520460587613,
                0.319340788959665,
                0.35295105393541515,
                0.35145874036447766,
                0.4014671432178472,
                0.5255641100707817
              ],
              "variance": 0.22796404049499353,
              "mean_reward": 0.33837000769383685,
              "min_reward": 0.13771520460587613,
              "max_reward": 0.5255641100707817,
              "num_responses": 7,
              "rvariance": 0.011918210231650737
            },
            {
              "id": "chat_sample_185",
              "rewards": [
                0.1832865889608072,
                0.18935829848498617,
                0.4900478243291206,
                0.5042092583199963,
                0.5543557991009787,
                0.8026769186225526,
                0.5263798657609556
              ],
              "variance": 0.4667546322342938,
              "mean_reward": 0.4643306505113424,
              "min_reward": 0.1832865889608072,
              "max_reward": 0.8026769186225526,
              "num_responses": 7,
              "rvariance": 0.04046858070544564
            },
            {
              "id": "chat_sample_154",
              "rewards": [
                -2.9705330171949735,
                -2.594171110651816,
                -2.530910299095928,
                -2.811139160132469,
                -2.9137699876458765,
                -2.780579941557906,
                -3.1087988372113666
              ],
              "variance": 0.4569725591720699,
              "mean_reward": -2.815700336212905,
              "min_reward": -3.1087988372113666,
              "max_reward": -2.530910299095928,
              "num_responses": 7,
              "rvariance": 0.03584747948379562
            },
            {
              "id": "chat_sample_189",
              "rewards": [
                -1.752618604113602,
                -0.7738050455030638,
                -0.6673095356618901,
                -0.6207927367435526,
                -1.010015955605936,
                -0.6735854490790619,
                -0.8284002634822576
              ],
              "variance": 0.6583541989144474,
              "mean_reward": -0.9037896557413377,
              "min_reward": -1.752618604113602,
              "max_reward": -0.6207927367435526,
              "num_responses": 7,
              "rvariance": 0.13476832140881628
            },
            {
              "id": "chat_sample_218",
              "rewards": [
                1.0684694829887222,
                0.9031978747709887,
                0.8333057361018203,
                0.7406897316933765,
                0.9933641390513831,
                0.9289424036332556
              ],
              "variance": 0.2439190771224542,
              "mean_reward": 0.9113282280399245,
              "min_reward": 0.7406897316933765,
              "max_reward": 1.0684694829887222,
              "num_responses": 6,
              "rvariance": 0.0111674387020193
            },
            {
              "id": "chat_sample_257",
              "rewards": [
                0.11524217755868515,
                0.33593783132128957,
                0.3867535108104527,
                0.2086841831813459,
                0.24161117769161472,
                0.3981507730733419,
                0.17969146990354867
              ],
              "variance": 0.2374006627500051,
              "mean_reward": 0.26658158907718266,
              "min_reward": 0.11524217755868515,
              "max_reward": 0.3981507730733419,
              "num_responses": 7,
              "rvariance": 0.010141595804530121
            },
            {
              "id": "chat_sample_13",
              "rewards": [
                1.0262575706380632,
                0.983864065206092,
                0.7412528822218032,
                0.9142771724946156,
                0.744180982334476
              ],
              "variance": 0.26687604619840233,
              "mean_reward": 0.88196653457901,
              "min_reward": 0.7412528822218032,
              "max_reward": 1.0262575706380632,
              "num_responses": 5,
              "rvariance": 0.014206435504888306
            },
            {
              "id": "chat_sample_237",
              "rewards": [
                -0.8958341829689962,
                -0.38161415760756595,
                -0.6903916414487345,
                -0.32844907346718727,
                -0.778272800573631,
                -0.4876517985122021,
                -0.8887223761074972
              ],
              "variance": 0.5312189749006823,
              "mean_reward": -0.6358480043836877,
              "min_reward": -0.8958341829689962,
              "max_reward": -0.32844907346718727,
              "num_responses": 7,
              "rvariance": 0.04798416555057564
            },
            {
              "id": "chat_sample_89",
              "rewards": [
                0.667236390184471,
                0.6045910166590219,
                0.3393513572972361,
                0.5030967357265109,
                0.4889367149113653,
                0.7715103877779991,
                0.6035311348614811
              ],
              "variance": 0.2798434173561686,
              "mean_reward": 0.568321962488298,
              "min_reward": 0.3393513572972361,
              "max_reward": 0.7715103877779991,
              "num_responses": 7,
              "rvariance": 0.01665837372405027
            },
            {
              "id": "chat_sample_23",
              "rewards": [
                0.7703452243885692,
                0.7155564013343579,
                0.9628257648188389,
                1.0164745083528286,
                0.9404951152264509,
                0.9154585874049411,
                0.7613637860362081
              ],
              "variance": 0.24124443007696672,
              "mean_reward": 0.8689313410803134,
              "min_reward": 0.7155564013343579,
              "max_reward": 1.0164745083528286,
              "num_responses": 7,
              "rvariance": 0.011812168697598205
            },
            {
              "id": "chat_sample_236",
              "rewards": [
                -0.09934502411075885,
                -0.08640386736278517,
                0.08125247489941538,
                -0.3229949217370421,
                -0.08486986510781107,
                -0.29480418568605077,
                0.10133228884775915
              ],
              "variance": 0.3953648805852002,
              "mean_reward": -0.10083330003675335,
              "min_reward": -0.3229949217370421,
              "max_reward": 0.10133228884775915,
              "num_responses": 7,
              "rvariance": 0.0230674143066367
            },
            {
              "id": "chat_sample_234",
              "rewards": [
                -0.872085764825431,
                -0.8815130601206244,
                -0.504209271953385,
                -0.2653670286411514,
                -0.7363827389954918,
                -0.42445316668843674,
                -0.7754485688771172
              ],
              "variance": 0.5150379714739859,
              "mean_reward": -0.6370656571573768,
              "min_reward": -0.8815130601206244,
              "max_reward": -0.2653670286411514,
              "num_responses": 7,
              "rvariance": 0.049288208208338846
            },
            {
              "id": "chat_sample_194",
              "rewards": [
                0.3895395867622551,
                0.3578498276036489,
                0.2692896375404613,
                0.2899142307327411,
                0.41974056528924886,
                0.29506242991732945,
                0.3104349555088618
              ],
              "variance": 0.11995558471722345,
              "mean_reward": 0.3331187476220781,
              "min_reward": 0.2692896375404613,
              "max_reward": 0.41974056528924886,
              "num_responses": 7,
              "rvariance": 0.002743128573947671
            },
            {
              "id": "chat_sample_70",
              "rewards": [
                0.18410764405996885,
                -0.27336842962471974,
                0.24261099952062826,
                0.3752827634096007,
                0.047011933548060936,
                0.0477375992854439,
                0.3347090750240072
              ],
              "variance": 0.43207876209929597,
              "mean_reward": 0.13687022646042715,
              "min_reward": -0.27336842962471974,
              "max_reward": 0.3752827634096007,
              "num_responses": 7,
              "rvariance": 0.04195830363759046
            },
            {
              "id": "chat_sample_74",
              "rewards": [
                0.4521333793735571,
                0.31562343020175676,
                0.5011592718006063,
                0.47129462909736547,
                0.19812069459918885,
                0.18667891730080294,
                0.1588174511949143
              ],
              "variance": 0.3077061553202143,
              "mean_reward": 0.32626111050974166,
              "min_reward": 0.1588174511949143,
              "max_reward": 0.5011592718006063,
              "num_responses": 7,
              "rvariance": 0.01878880150622548
            },
            {
              "id": "chat_sample_200",
              "rewards": [
                0.11797879235993561,
                0.10734959110633102,
                0.14627975611787117,
                0.34656915233848923,
                0.1285924486805096,
                0.25270460717254223,
                0.4013897718466267
              ],
              "variance": 0.2547702882832505,
              "mean_reward": 0.21440915994604362,
              "min_reward": 0.10734959110633102,
              "max_reward": 0.4013897718466267,
              "num_responses": 7,
              "rvariance": 0.01238017782364523
            },
            {
              "id": "chat_sample_260",
              "rewards": [
                0.3228659558182858,
                0.3372619769803506,
                0.7671507406507811,
                0.654312898133123,
                0.4945781124257427,
                0.7472101245118478,
                0.5249635103855086
              ],
              "variance": 0.42368280245189643,
              "mean_reward": 0.5497633312722343,
              "min_reward": 0.3228659558182858,
              "max_reward": 0.7671507406507811,
              "num_responses": 7,
              "rvariance": 0.028210402558092235
            },
            {
              "id": "chat_sample_315",
              "rewards": [
                -0.284326194235562,
                -0.05377222658009773,
                -0.13116479543653,
                -0.23058382780945608,
                -0.3319756535015382,
                -0.2680916314486964,
                0.2419842560843491
              ],
              "variance": 0.36791634442763355,
              "mean_reward": -0.15113286756107588,
              "min_reward": -0.3319756535015382,
              "max_reward": 0.2419842560843491,
              "num_responses": 7,
              "rvariance": 0.033550753464526344
            },
            {
              "id": "chat_sample_240",
              "rewards": [
                -0.06060493123491103,
                0.29249045008863034,
                0.46538472819427773,
                0.48475830757152677,
                0.42952680721987596,
                0.19512087581821574,
                0.16659804347066162
              ],
              "variance": 0.39741730635674477,
              "mean_reward": 0.28189632587546815,
              "min_reward": -0.06060493123491103,
              "max_reward": 0.48475830757152677,
              "num_responses": 7,
              "rvariance": 0.033551250810473436
            },
            {
              "id": "chat_sample_20",
              "rewards": [
                1.3305143053187876,
                1.1146170897475831,
                0.9724865874034236,
                0.9609709716731424,
                0.9070417127567367,
                1.1133310998332335,
                1.0441501418502153
              ],
              "variance": 0.26157670786948484,
              "mean_reward": 1.0633017012261603,
              "min_reward": 0.9070417127567367,
              "max_reward": 1.3305143053187876,
              "num_responses": 7,
              "rvariance": 0.017148816420362485
            },
            {
              "id": "chat_sample_210",
              "rewards": [
                0.5628224881936674,
                0.8527192376934435,
                0.7392793823147821,
                0.787337955954609,
                0.8915723846276956,
                0.7346611240289641,
                1.0352400688722219
              ],
              "variance": 0.2831137886306607,
              "mean_reward": 0.8005189488121977,
              "min_reward": 0.5628224881936674,
              "max_reward": 1.0352400688722219,
              "num_responses": 7,
              "rvariance": 0.018695783726940512
            },
            {
              "id": "chat_sample_93",
              "rewards": [
                -0.563555586737022,
                -0.2558704877351855,
                -0.6736094730664729,
                -0.737687100194332,
                -0.650022156956134,
                -0.1804266882104983,
                -0.6602902918107096
              ],
              "variance": 0.473547555992306,
              "mean_reward": -0.5316373978157649,
              "min_reward": -0.737687100194332,
              "max_reward": -0.1804266882104983,
              "num_responses": 7,
              "rvariance": 0.04194202719316069
            },
            {
              "id": "chat_sample_226",
              "rewards": [
                0.7137355244061828,
                1.011033075204254,
                1.1801181381295396,
                1.316614308837972,
                1.1943834405365743,
                1.1200224869150415,
                1.2891464121729035
              ],
              "variance": 0.4080195159539054,
              "mean_reward": 1.1178647694574955,
              "min_reward": 0.7137355244061828,
              "max_reward": 1.316614308837972,
              "num_responses": 7,
              "rvariance": 0.03618678325962209
            },
            {
              "id": "chat_sample_30",
              "rewards": [
                1.2961766081359918,
                1.0266656251301165,
                0.7812577673760498,
                1.0943454371938843,
                1.1250650512138083,
                1.1543548846888494,
                1.0836710143169181
              ],
              "variance": 0.28258109203921655,
              "mean_reward": 1.0802194840079455,
              "min_reward": 0.7812577673760498,
              "max_reward": 1.2961766081359918,
              "num_responses": 7,
              "rvariance": 0.02094317734583879
            },
            {
              "id": "chat_sample_142",
              "rewards": [
                0.6154237152177544,
                0.7606875814493771,
                0.9612405349436502,
                1.178651261721743,
                0.9196218031056815,
                1.1037154988720106,
                0.7483509106199342
              ],
              "variance": 0.43850977155284143,
              "mean_reward": 0.8982416151328788,
              "min_reward": 0.6154237152177544,
              "max_reward": 1.178651261721743,
              "num_responses": 7,
              "rvariance": 0.03523562330405721
            },
            {
              "id": "chat_sample_136",
              "rewards": [
                -0.40745054289228655,
                -0.1900596005744145,
                -0.040125188554961846,
                0.15735552090217297,
                0.1011054741430854,
                -0.004209327375627849,
                0.1799458415349585
              ],
              "variance": 0.4434076266568505,
              "mean_reward": -0.02906254611672484,
              "min_reward": -0.40745054289228655,
              "max_reward": 0.1799458415349585,
              "num_responses": 7,
              "rvariance": 0.03788821535793727
            },
            {
              "id": "chat_sample_16",
              "rewards": [
                1.9138449831706659,
                1.9007374249804783,
                1.6357005563359552,
                1.4665801640174183,
                1.86645978776621,
                1.587116281324548,
                1.8304488905190297
              ],
              "variance": 0.36707861385485696,
              "mean_reward": 1.742984012587758,
              "min_reward": 1.4665801640174183,
              "max_reward": 1.9138449831706659,
              "num_responses": 7,
              "rvariance": 0.027025651350928687
            },
            {
              "id": "chat_sample_22",
              "rewards": [
                0.20046797948680928,
                -0.7935188469373236,
                -0.47780549661304766,
                -0.18159538453925334,
                -0.31473632277060387,
                -0.27304622555826735,
                -0.2104778701101063
              ],
              "variance": 0.5753207978139299,
              "mean_reward": -0.2929588810059704,
              "min_reward": -0.7935188469373236,
              "max_reward": 0.20046797948680928,
              "num_responses": 7,
              "rvariance": 0.07832490482440514
            },
            {
              "id": "chat_sample_217",
              "rewards": [
                0.3228058958497585,
                0.3230623872447634,
                0.26643078303856116,
                0.09163931651531564,
                0.4306573478039195,
                0.18072874088940866,
                0.236324487285481
              ],
              "variance": 0.22100740032865443,
              "mean_reward": 0.26452127980388684,
              "min_reward": 0.09163931651531564,
              "max_reward": 0.4306573478039195,
              "num_responses": 7,
              "rvariance": 0.010304774133957842
            }
          ]
        },
        "semantic_benchmark_chat_hard_filtered.json": {
          "file_name": "semantic_benchmark_chat_hard_filtered.json",
          "processed_samples": 200,
          "global_mean": 7.522878719601235,
          "global_std": 3.3052810098050727,
          "mean_variance": 0.7736287433183429,
          "mean_rvariance": 0.17468449210707987,
          "sample_results": [
            {
              "id": "chat_hard_sample_121",
              "rewards": [
                1.6343318319604363,
                -0.30014789329249414,
                1.6343318319604363,
                -0.30014789329249414,
                1.6343318319604363,
                -0.30014789329249414
              ],
              "variance": 1.9344797252529304,
              "mean_reward": 0.6670919693339711,
              "min_reward": -0.30014789329249414,
              "max_reward": 1.6343318319604363,
              "num_responses": 6,
              "rvariance": 0.9355529518536633
            },
            {
              "id": "chat_hard_sample_77",
              "rewards": [
                2.0131873558300115,
                0.6152779542599492,
                2.2415525945758645,
                1.7849020400271278,
                0.6300778367028121,
                2.2415525945758645,
                2.5977853090974157
              ],
              "variance": 1.7598877966588182,
              "mean_reward": 1.732047955009864,
              "min_reward": 0.6152779542599492,
              "max_reward": 2.5977853090974157,
              "num_responses": 7,
              "rvariance": 0.5445767735648886
            },
            {
              "id": "chat_hard_sample_265",
              "rewards": [
                1.3532690978106974,
                1.3532690978106974,
                -0.770939038137216,
                -0.38890621662150665,
                1.3532690978106974,
                0.13199863317839677,
                0.7150829555475426
              ],
              "variance": 1.8949884430384878,
              "mean_reward": 0.5352919467713299,
              "min_reward": -0.770939038137216,
              "max_reward": 1.3532690978106974,
              "num_responses": 7,
              "rvariance": 0.6803731133781169
            },
            {
              "id": "chat_hard_sample_334",
              "rewards": [
                2.1246299454992954,
                1.2883197326331288,
                1.7678706628516823,
                -0.984665105917585,
                -0.4374993659469091,
                1.02177816048254
              ],
              "variance": 2.6573325401077357,
              "mean_reward": 0.7967390049336922,
              "min_reward": -0.984665105917585,
              "max_reward": 2.1246299454992954,
              "num_responses": 6,
              "rvariance": 1.2825717071223706
            },
            {
              "id": "chat_hard_sample_61",
              "rewards": [
                1.8266691352558864,
                1.2418588235551773,
                0.8092200640853485,
                1.7623473238723917,
                0.2988511932943658,
                0.1303736295148454,
                0.7227163179273215
              ],
              "variance": 1.556615880643232,
              "mean_reward": 0.9702909267864767,
              "min_reward": 0.1303736295148454,
              "max_reward": 1.8266691352558864,
              "num_responses": 7,
              "rvariance": 0.3825736409132086
            },
            {
              "id": "chat_hard_sample_133",
              "rewards": [
                2.358768679150628,
                0.9509196910738755,
                1.5922340808015587,
                0.8144199603965209,
                0.8654731205946931,
                0.3675658812363779
              ],
              "variance": 1.384508459159644,
              "mean_reward": 1.1582302355422758,
              "min_reward": 0.3675658812363779,
              "max_reward": 2.358768679150628,
              "num_responses": 6,
              "rvariance": 0.4169486514912313
            },
            {
              "id": "chat_hard_sample_62",
              "rewards": [
                1.4497115648839747,
                -0.549146812257017,
                1.3371869859145635,
                1.4289818040154536
              ],
              "variance": 1.426739309428961,
              "mean_reward": 0.9166833856392437,
              "min_reward": -0.549146812257017,
              "max_reward": 1.4497115648839747,
              "num_responses": 4,
              "rvariance": 0.718012539062204
            },
            {
              "id": "chat_hard_sample_84",
              "rewards": [
                1.8015271662866856,
                0.23673635155265102,
                1.7985723256406576,
                0.3670020926783915,
                0.3670020926783915,
                0.23673635155265102
              ],
              "variance": 1.5633133944110207,
              "mean_reward": 0.8012627300649046,
              "min_reward": 0.23673635155265102,
              "max_reward": 1.8015271662866856,
              "num_responses": 6,
              "rvariance": 0.5016166730394253
            },
            {
              "id": "chat_hard_sample_343",
              "rewards": [
                -0.13021094234496186,
                -1.2992002610560658,
                -1.2931688199014355,
                -0.16397939560621855
              ],
              "variance": 1.157049350386338,
              "mean_reward": -0.7216398547271703,
              "min_reward": -1.2992002610560658,
              "max_reward": -0.13021094234496186,
              "num_responses": 4,
              "rvariance": 0.3302486817651395
            },
            {
              "id": "chat_hard_sample_87",
              "rewards": [
                0.644402220914579,
                -1.2887970060679605,
                -1.249781914557766,
                -1.4483566697705907,
                -1.3704788308436597
              ],
              "variance": 1.3039341009254595,
              "mean_reward": -0.9426024400650796,
              "min_reward": -1.4483566697705907,
              "max_reward": 0.644402220914579,
              "num_responses": 5,
              "rvariance": 0.6343318495402812
            },
            {
              "id": "chat_hard_sample_110",
              "rewards": [
                1.6408191512735202,
                -1.2752603100666864,
                -1.3742481930348236,
                -1.8970515733933506,
                -1.3742481930348236,
                -1.2722365106359304,
                -1.3742481930348236
              ],
              "variance": 1.4763552993060853,
              "mean_reward": -0.9894962602752739,
              "min_reward": -1.8970515733933506,
              "max_reward": 1.6408191512735202,
              "num_responses": 7,
              "rvariance": 1.1925601573162534
            },
            {
              "id": "chat_hard_sample_150",
              "rewards": [
                1.4828844912344412,
                -0.6851623887888747,
                0.36828778449742294,
                1.4249487249655386,
                -0.6107215249401083,
                1.3032961957297724,
                0.5943289102266023
              ],
              "variance": 2.088620901952715,
              "mean_reward": 0.5539803132749707,
              "min_reward": -0.6851623887888747,
              "max_reward": 1.4828844912344412,
              "num_responses": 7,
              "rvariance": 0.7301482814616866
            },
            {
              "id": "chat_hard_sample_65",
              "rewards": [
                -0.9294484508925226,
                -0.9829518119271433,
                -0.1982868238041787,
                -0.7963112544294839,
                -0.10200535673876028,
                -1.456120447927345,
                -0.10200535673876028
              ],
              "variance": 1.0702139095884637,
              "mean_reward": -0.652447071779742,
              "min_reward": -1.456120447927345,
              "max_reward": -0.10200535673876028,
              "num_responses": 7,
              "rvariance": 0.23782637714628405
            },
            {
              "id": "chat_hard_sample_46",
              "rewards": [
                -0.4602748079188712,
                -0.2737964045509909,
                0.4575360325815331,
                0.3600837088281368,
                0.4936231167803428,
                0.3293240514126744,
                0.4653471297370129
              ],
              "variance": 0.8250452904524879,
              "mean_reward": 0.19597754669569115,
              "min_reward": -0.4602748079188712,
              "max_reward": 0.4936231167803428,
              "num_responses": 7,
              "rvariance": 0.13223322002498875
            },
            {
              "id": "chat_hard_sample_114",
              "rewards": [
                1.7958206104525736,
                0.4858956934640728,
                1.0284039744260403,
                1.0284039744260403
              ],
              "variance": 0.9169474418919507,
              "mean_reward": 1.0846310631921816,
              "min_reward": 0.4858956934640728,
              "max_reward": 1.7958206104525736,
              "num_responses": 4,
              "rvariance": 0.21764939652953186
            },
            {
              "id": "chat_hard_sample_371",
              "rewards": [
                0.9044408931061619,
                -0.8770628569375535,
                -1.3325624634014346,
                0.2720547905526502
              ],
              "variance": 1.9106376438023787,
              "mean_reward": -0.25828240917004397,
              "min_reward": -1.3325624634014346,
              "max_reward": 0.9044408931061619,
              "num_responses": 4,
              "rvariance": 0.7925374751311384
            },
            {
              "id": "chat_hard_sample_223",
              "rewards": [
                1.331426186350205,
                1.4335714583613541,
                1.5907873889746682,
                0.9615116449959228,
                1.8163031006997057
              ],
              "variance": 0.6166193544720551,
              "mean_reward": 1.4267199558763712,
              "min_reward": 0.9615116449959228,
              "max_reward": 1.8163031006997057,
              "num_responses": 5,
              "rvariance": 0.08084795348859022
            },
            {
              "id": "chat_hard_sample_52",
              "rewards": [
                -0.6011111517111365,
                0.11803144970091195,
                -0.2041953509743145,
                -0.32415766865804163,
                0.34964813842626785,
                -0.2518946328725717,
                0.39363114774168745
              ],
              "variance": 0.8021804040317153,
              "mean_reward": -0.07429258119245673,
              "min_reward": -0.6011111517111365,
              "max_reward": 0.39363114774168745,
              "num_responses": 7,
              "rvariance": 0.11772206703500916
            },
            {
              "id": "chat_hard_sample_372",
              "rewards": [
                0.7419474514825463,
                -0.5833203623122415,
                -0.9857753712047558,
                -0.8269081806542071
              ],
              "variance": 1.2824823213837013,
              "mean_reward": -0.41351411567216456,
              "min_reward": -0.9857753712047558,
              "max_reward": 0.7419474514825463,
              "num_responses": 4,
              "rvariance": 0.46557579802893145
            },
            {
              "id": "chat_hard_sample_346",
              "rewards": [
                2.2168855467767994,
                1.5800953149760493,
                0.5359915095294923,
                0.5154539099606736,
                1.6363639521313156
              ],
              "variance": 1.4610079591304048,
              "mean_reward": 1.296958046674866,
              "min_reward": 0.5154539099606736,
              "max_reward": 2.2168855467767994,
              "num_responses": 5,
              "rvariance": 0.44628969463199564
            },
            {
              "id": "chat_hard_sample_108",
              "rewards": [
                1.3977131788332113,
                -0.19250351886237763,
                0.701176940531825,
                0.701176940531825,
                1.0355150966369577
              ],
              "variance": 1.0878652810594065,
              "mean_reward": 0.7286157275342883,
              "min_reward": -0.19250351886237763,
              "max_reward": 1.3977131788332113,
              "num_responses": 5,
              "rvariance": 0.2783690124474052
            },
            {
              "id": "chat_hard_sample_64",
              "rewards": [
                1.7756497331238783,
                0.6927691623436348,
                1.044714025401401,
                1.036934666598725,
                1.0650635030972375,
                1.6098110691147487
              ],
              "variance": 0.8278784866481335,
              "mean_reward": 1.2041570266132708,
              "min_reward": 0.6927691623436348,
              "max_reward": 1.7756497331238783,
              "num_responses": 6,
              "rvariance": 0.13756817668720964
            },
            {
              "id": "chat_hard_sample_233",
              "rewards": [
                0.02815420517032772,
                -0.3806842520624584,
                0.10745623054670657,
                0.9630575913079449,
                0.93074794815374,
                -0.06082859487215118,
                -0.3907666611567657
              ],
              "variance": 1.3283890211156033,
              "mean_reward": 0.171019495298192,
              "min_reward": -0.3907666611567657,
              "max_reward": 0.9630575913079449,
              "num_responses": 7,
              "rvariance": 0.27181381353001133
            },
            {
              "id": "chat_hard_sample_47",
              "rewards": [
                -0.4543645495658552,
                -1.720472073734476,
                -2.241278823171168,
                -1.7144475573113664
              ],
              "variance": 1.252647346450652,
              "mean_reward": -1.5326407509457165,
              "min_reward": -2.241278823171168,
              "max_reward": -0.4543645495658552,
              "num_responses": 4,
              "rvariance": 0.4332954511327599
            },
            {
              "id": "chat_hard_sample_26",
              "rewards": [
                -0.20654225789891087,
                -0.9687116786155463,
                -0.9258949095004241,
                -0.5691488992548925,
                -0.083414760849211,
                -0.7549602201529343,
                0.023080685209410246
              ],
              "variance": 0.9022050347207105,
              "mean_reward": -0.497941720151787,
              "min_reward": -0.9687116786155463,
              "max_reward": 0.023080685209410246,
              "num_responses": 7,
              "rvariance": 0.14344397874893916
            },
            {
              "id": "chat_hard_sample_379",
              "rewards": [
                -0.20228701037936975,
                -0.5107526383398556,
                -0.40312038218990054,
                -0.2264843305569393,
                -0.20099670207265782,
                -2.0541027531025655,
                -0.29694058847643645
              ],
              "variance": 0.9263217971882545,
              "mean_reward": -0.5563834864453893,
              "min_reward": -2.0541027531025655,
              "max_reward": -0.20099670207265782,
              "num_responses": 7,
              "rvariance": 0.38522327233893894
            },
            {
              "id": "chat_hard_sample_247",
              "rewards": [
                1.2148581412335977,
                1.4589583897081038,
                -0.07715884298111428,
                1.5542409642516444
              ],
              "variance": 1.215209939605283,
              "mean_reward": 1.037724663053058,
              "min_reward": -0.07715884298111428,
              "max_reward": 1.5542409642516444,
              "num_responses": 4,
              "rvariance": 0.42964211074873765
            },
            {
              "id": "chat_hard_sample_215",
              "rewards": [
                1.1353489509725545,
                1.2969427545594243,
                0.8593412708330109,
                0.36796347623786474,
                1.0544340402127856,
                1.3912622143606115,
                0.7278567769596069
              ],
              "variance": 0.750771081808989,
              "mean_reward": 0.9761642120194083,
              "min_reward": 0.36796347623786474,
              "max_reward": 1.3912622143606115,
              "num_responses": 7,
              "rvariance": 0.10741192698876935
            },
            {
              "id": "chat_hard_sample_49",
              "rewards": [
                -1.082174558706028,
                -2.5354610382480516,
                -2.058083896666074,
                -2.187471351010591,
                -2.0961041350811116,
                -1.0749070529749323,
                -2.2447908161741412
              ],
              "variance": 1.2817913485901153,
              "mean_reward": -1.8969989784087045,
              "min_reward": -2.5354610382480516,
              "max_reward": -1.0749070529749323,
              "num_responses": 7,
              "rvariance": 0.28833319237518124
            },
            {
              "id": "chat_hard_sample_415",
              "rewards": [
                -0.9660156498101088,
                -0.4492968002145384,
                0.08699941951229752,
                -0.15042077128846182,
                -0.15933347781671142,
                0.036222671513997884,
                0.5684015612907489
              ],
              "variance": 0.9355446162764447,
              "mean_reward": -0.14763472097325372,
              "min_reward": -0.9660156498101088,
              "max_reward": 0.5684015612907489,
              "num_responses": 7,
              "rvariance": 0.19463666512802127
            },
            {
              "id": "chat_hard_sample_297",
              "rewards": [
                0.959135885023323,
                0.1776983988500185,
                0.5895496913553194,
                -0.054852551569687415,
                0.4020700872217212,
                0.2880070637327688,
                -0.37429849547834637
              ],
              "variance": 0.9200150979556719,
              "mean_reward": 0.28390143987644534,
              "min_reward": -0.37429849547834637,
              "max_reward": 0.959135885023323,
              "num_responses": 7,
              "rvariance": 0.16037194320750944
            },
            {
              "id": "chat_hard_sample_80",
              "rewards": [
                1.5662496028306587,
                1.5662496028306587,
                1.4105025808911973,
                1.4105025808911973,
                -0.3486319780964438
              ],
              "variance": 1.211227757332046,
              "mean_reward": 1.1209744778694537,
              "min_reward": -0.3486319780964438,
              "max_reward": 1.5662496028306587,
              "num_responses": 5,
              "rvariance": 0.5447872108227635
            },
            {
              "id": "chat_hard_sample_413",
              "rewards": [
                -0.04592195615167572,
                -0.5961276532599896,
                -1.2202664005722101,
                -0.9917502603852995,
                -0.20913210748769587,
                -0.9935206834107879
              ],
              "variance": 0.9793665101718133,
              "mean_reward": -0.6761198435446097,
              "min_reward": -1.2202664005722101,
              "max_reward": -0.04592195615167572,
              "num_responses": 6,
              "rvariance": 0.18634783368606403
            },
            {
              "id": "chat_hard_sample_306",
              "rewards": [
                0.1748477177072828,
                -1.9086770434948797,
                -1.8106920924753407,
                -0.8095490328534428,
                -1.929680331258473,
                -0.641204193094738,
                -1.2254160925798567
              ],
              "variance": 1.6022949298263875,
              "mean_reward": -1.1643387240070642,
              "min_reward": -1.929680331258473,
              "max_reward": 0.1748477177072828,
              "num_responses": 7,
              "rvariance": 0.5363223170833508
            },
            {
              "id": "chat_hard_sample_43",
              "rewards": [
                0.16908576402100425,
                -0.25323918490953007,
                -0.7498774672166557,
                -1.2237241498449374,
                -0.6041291805322919,
                -0.10899702733094364,
                -0.7637280843802068
              ],
              "variance": 0.9499625997759347,
              "mean_reward": -0.5049441900276516,
              "min_reward": -1.2237241498449374,
              "max_reward": 0.16908576402100425,
              "num_responses": 7,
              "rvariance": 0.18969852163301207
            },
            {
              "id": "chat_hard_sample_102",
              "rewards": [
                1.3680482060589978,
                1.1091423045320283,
                1.6522720801479889,
                0.9304842312949889,
                1.7279816125174647,
                1.5038926840161952
              ],
              "variance": 0.6703135784192182,
              "mean_reward": 1.3819701864279441,
              "min_reward": 0.9304842312949889,
              "max_reward": 1.7279816125174647,
              "num_responses": 6,
              "rvariance": 0.08102009308513754
            },
            {
              "id": "chat_hard_sample_187",
              "rewards": [
                0.3914417784591896,
                -1.808919361206012,
                0.32080547752015126,
                0.18980109836552375,
                0.3920603878083824,
                0.32080547752015126
              ],
              "variance": 1.2013102145540302,
              "mean_reward": -0.032334190255435595,
              "min_reward": -1.808919361206012,
              "max_reward": 0.3920603878083824,
              "num_responses": 6,
              "rvariance": 0.6357851725925824
            },
            {
              "id": "chat_hard_sample_360",
              "rewards": [
                2.2077463438217233,
                1.0716119908720885,
                1.0716119908720885,
                -0.02333117368693536,
                0.8710400276764686,
                0.8710400276764686
              ],
              "variance": 1.2158247403521392,
              "mean_reward": 1.0116198678719837,
              "min_reward": -0.02333117368693536,
              "max_reward": 2.2077463438217233,
              "num_responses": 6,
              "rvariance": 0.4247609495791244
            },
            {
              "id": "chat_hard_sample_236",
              "rewards": [
                1.7741912115473064,
                0.550086223479152,
                1.2745539434307076,
                1.485020770908613,
                1.3832560706006287,
                0.856497514421796,
                0.7709632306766833
              ],
              "variance": 0.9180765193664195,
              "mean_reward": 1.1563669950092696,
              "min_reward": 0.550086223479152,
              "max_reward": 1.7741912115473064,
              "num_responses": 7,
              "rvariance": 0.16588585931861308
            },
            {
              "id": "chat_hard_sample_259",
              "rewards": [
                1.619003073147671,
                -0.10910436066951627,
                0.8150287597093925,
                1.376235546960442,
                0.6388162708211212,
                0.6049427924651322,
                1.2117420120492308
              ],
              "variance": 1.1540186262240608,
              "mean_reward": 0.8795234420690676,
              "min_reward": -0.10910436066951627,
              "max_reward": 1.619003073147671,
              "num_responses": 7,
              "rvariance": 0.2884001699989907
            },
            {
              "id": "chat_hard_sample_127",
              "rewards": [
                1.0448981078476627,
                0.5054320922671734,
                1.1352318075976606,
                0.9644904336717937,
                0.0857587384481514
              ],
              "variance": 0.8454702477219012,
              "mean_reward": 0.7471622359664882,
              "min_reward": 0.0857587384481514,
              "max_reward": 1.1352318075976606,
              "num_responses": 5,
              "rvariance": 0.1564728472502122
            },
            {
              "id": "chat_hard_sample_280",
              "rewards": [
                1.0951410744578995,
                0.3794643011720191,
                0.9695137493291852,
                0.0020872074821379877,
                0.31193201113718627,
                0.6038579178602044,
                0.45881653085192386
              ],
              "variance": 0.831770589705504,
              "mean_reward": 0.5458303988986509,
              "min_reward": 0.0020872074821379877,
              "max_reward": 1.0951410744578995,
              "num_responses": 7,
              "rvariance": 0.12431874262667172
            },
            {
              "id": "chat_hard_sample_421",
              "rewards": [
                -0.05100874851467476,
                -0.9024350732298214,
                -1.1392516582663497,
                -0.3741980868712945,
                -1.7210652924014258,
                -1.0203574804197082,
                -0.661677161836029
              ],
              "variance": 1.1270547603917336,
              "mean_reward": -0.8385705002199005,
              "min_reward": -1.7210652924014258,
              "max_reward": -0.05100874851467476,
              "num_responses": 7,
              "rvariance": 0.2533597015829107
            },
            {
              "id": "chat_hard_sample_270",
              "rewards": [
                2.2936672584100815,
                2.127186325552396,
                1.7513724900033394,
                2.0184804474862346,
                1.5843606610623915,
                2.0300963960819227
              ],
              "variance": 0.5425602164483734,
              "mean_reward": 1.9675272630993943,
              "min_reward": 1.5843606610623915,
              "max_reward": 2.2936672584100815,
              "num_responses": 6,
              "rvariance": 0.055318161169126856
            },
            {
              "id": "chat_hard_sample_276",
              "rewards": [
                1.1422557936036077,
                0.5128000066053211,
                1.0616507645793956,
                0.8894730859239194,
                0.6032416167548518,
                1.0004788404464318
              ],
              "variance": 0.5439324674114152,
              "mean_reward": 0.8683166846522545,
              "min_reward": 0.5128000066053211,
              "max_reward": 1.1422557936036077,
              "num_responses": 6,
              "rvariance": 0.054498671767267866
            },
            {
              "id": "chat_hard_sample_349",
              "rewards": [
                0.7199325758559537,
                0.7199325758559537,
                0.27491008818306645,
                0.27491008818306645,
                0.11114595832538109,
                0.27491008818306645,
                -0.25598541801849345
              ],
              "variance": 0.7556391680681224,
              "mean_reward": 0.30282227950971347,
              "min_reward": -0.25598541801849345,
              "max_reward": 0.7199325758559537,
              "num_responses": 7,
              "rvariance": 0.09990073211851401
            },
            {
              "id": "chat_hard_sample_267",
              "rewards": [
                0.003439838372537278,
                -1.9279462630734687,
                -0.5026079999494565,
                -0.586246061379786,
                -0.8810214951236197,
                -1.1079726459868262,
                -0.6431477344082469
              ],
              "variance": 1.1357732282008244,
              "mean_reward": -0.8065003373641239,
              "min_reward": -1.9279462630734687,
              "max_reward": 0.003439838372537278,
              "num_responses": 7,
              "rvariance": 0.3110899400148193
            },
            {
              "id": "chat_hard_sample_14",
              "rewards": [
                0.9965802166002126,
                -0.46157204095710397,
                -0.3263210701973364,
                -0.024151754372151994,
                -0.6123165214337362,
                -1.380483913769318
              ],
              "variance": 1.4826144487155573,
              "mean_reward": -0.3013775140215723,
              "min_reward": -1.380483913769318,
              "max_reward": 0.9965802166002126,
              "num_responses": 6,
              "rvariance": 0.5081644246759746
            },
            {
              "id": "chat_hard_sample_13",
              "rewards": [
                0.6589672395466942,
                1.0099738014833899,
                1.0357753511299483,
                0.5419433162716332,
                0.7922383141524687,
                -0.5153356564847154,
                0.9189637862881922
              ],
              "variance": 0.9012626941729195,
              "mean_reward": 0.6346465931982301,
              "min_reward": -0.5153356564847154,
              "max_reward": 1.0357753511299483,
              "num_responses": 7,
              "rvariance": 0.24844153949949035
            },
            {
              "id": "chat_hard_sample_147",
              "rewards": [
                1.3647081772221246,
                0.9022088213126191,
                1.7241294420785311,
                1.4063471649177481,
                0.7110475682537873
              ],
              "variance": 0.8095044617368978,
              "mean_reward": 1.2216882347569622,
              "min_reward": 0.7110475682537873,
              "max_reward": 1.7241294420785311,
              "num_responses": 5,
              "rvariance": 0.13396435542943366
            },
            {
              "id": "chat_hard_sample_173",
              "rewards": [
                1.4656130566996073,
                0.2986861538597864,
                0.6039583264672562,
                0.2986861538597864,
                0.6039583264672562,
                0.2986861538597864
              ],
              "variance": 0.7360995377236452,
              "mean_reward": 0.5949313618689132,
              "min_reward": 0.2986861538597864,
              "max_reward": 1.4656130566996073,
              "num_responses": 6,
              "rvariance": 0.17025554261634693
            },
            {
              "id": "chat_hard_sample_345",
              "rewards": [
                -0.266663931084551,
                -1.4938434999479475,
                -2.0522775092858705,
                -1.1480299095909035,
                -1.8942401323958995,
                -1.5365884249735413
              ],
              "variance": 1.2659119005031578,
              "mean_reward": -1.3986072345464524,
              "min_reward": -2.0522775092858705,
              "max_reward": -0.266663931084551,
              "num_responses": 6,
              "rvariance": 0.3408550317836614
            },
            {
              "id": "chat_hard_sample_412",
              "rewards": [
                0.9805304201178425,
                0.28070406875262877,
                0.7314769688925932,
                1.0365843905959635,
                0.28070406875262877,
                0.7314769688925932,
                0.2356508998867632
              ],
              "variance": 0.7402692071028085,
              "mean_reward": 0.6110182551272876,
              "min_reward": 0.2356508998867632,
              "max_reward": 1.0365843905959635,
              "num_responses": 7,
              "rvariance": 0.10082599342838654
            },
            {
              "id": "chat_hard_sample_21",
              "rewards": [
                0.5654568192115221,
                0.4191551310664532,
                0.316736043629752,
                0.519592014105321,
                -0.16354313752040717,
                0.5503378220577417
              ],
              "variance": 0.4813008675799595,
              "mean_reward": 0.36795578209173047,
              "min_reward": -0.16354313752040717,
              "max_reward": 0.5654568192115221,
              "num_responses": 6,
              "rvariance": 0.06383322525287581
            },
            {
              "id": "chat_hard_sample_357",
              "rewards": [
                0.495144826532042,
                -0.04466857974640812,
                0.2977270785441535,
                -0.2984761476911773,
                0.014783702725553167,
                -0.39387124912193133,
                -0.8975923776529311
              ],
              "variance": 0.9720538782736401,
              "mean_reward": -0.1181361066300999,
              "min_reward": -0.8975923776529311,
              "max_reward": 0.495144826532042,
              "num_responses": 7,
              "rvariance": 0.1840321889486816
            },
            {
              "id": "chat_hard_sample_184",
              "rewards": [
                0.3109406204077895,
                0.813494931677532,
                1.176877720024805,
                0.7571576242680175,
                0.9189891769704353,
                0.9880604885857693
              ],
              "variance": 0.5484199819673837,
              "mean_reward": 0.8275867603223914,
              "min_reward": 0.3109406204077895,
              "max_reward": 1.176877720024805,
              "num_responses": 6,
              "rvariance": 0.07136541174837736
            },
            {
              "id": "chat_hard_sample_348",
              "rewards": [
                0.05524894842839848,
                0.02170670306348844,
                1.2886278831858051,
                0.02170670306348844,
                0.02170670306348844,
                0.1953795466665007
              ],
              "variance": 0.7202970118626645,
              "mean_reward": 0.267396081245195,
              "min_reward": 0.02170670306348844,
              "max_reward": 1.2886278831858051,
              "num_responses": 6,
              "rvariance": 0.212366165360653
            },
            {
              "id": "chat_hard_sample_283",
              "rewards": [
                -0.24825799470222346,
                0.043293976518670625,
                -0.5824628497255805,
                -0.9996559955382305,
                -0.7348450292068854,
                -0.04394956179016345
              ],
              "variance": 0.8669227197368116,
              "mean_reward": -0.42764624240740207,
              "min_reward": -0.9996559955382305,
              "max_reward": 0.043293976518670625,
              "num_responses": 6,
              "rvariance": 0.14112040168715595
            },
            {
              "id": "chat_hard_sample_0",
              "rewards": [
                -0.9468237564001687,
                -1.00007609591716,
                -1.1983265428704264,
                -0.13644724014041626,
                -1.0223702690484253,
                -1.1209080444677095,
                -0.10260896250299135
              ],
              "variance": 1.02896351474335,
              "mean_reward": -0.7896515587638996,
              "min_reward": -1.1983265428704264,
              "max_reward": -0.10260896250299135,
              "num_responses": 7,
              "rvariance": 0.18551272808043975
            },
            {
              "id": "chat_hard_sample_258",
              "rewards": [
                0.3499026223096578,
                -0.9592121010909076,
                -0.31862711641675034,
                0.02010074241161932,
                -0.19233040057435724,
                -0.2918826491614408,
                -0.040911912896365726
              ],
              "variance": 0.7268826046572481,
              "mean_reward": -0.20470868791693494,
              "min_reward": -0.9592121010909076,
              "max_reward": 0.3499026223096578,
              "num_responses": 7,
              "rvariance": 0.13928109989466883
            },
            {
              "id": "chat_hard_sample_161",
              "rewards": [
                2.043542493512466,
                0.8675332282221356,
                1.6049669308854582,
                0.9326464787123636,
                1.467767225263541
              ],
              "variance": 0.9745337400434361,
              "mean_reward": 1.3832912713191932,
              "min_reward": 0.8675332282221356,
              "max_reward": 2.043542493512466,
              "num_responses": 5,
              "rvariance": 0.19225900987392308
            },
            {
              "id": "chat_hard_sample_4",
              "rewards": [
                0.4384607054855267,
                -0.6373182645896404,
                -0.5621826193449522,
                0.27244257551781587,
                -0.49303917510960965,
                -0.2530060522816626,
                -0.6468917059171678
              ],
              "variance": 0.9799974686255516,
              "mean_reward": -0.26879064803424146,
              "min_reward": -0.6468917059171678,
              "max_reward": 0.4384607054855267,
              "num_responses": 7,
              "rvariance": 0.1726466139509166
            },
            {
              "id": "chat_hard_sample_238",
              "rewards": [
                0.2775423517524164,
                -1.1420019308020335,
                0.2455838501924129,
                -1.1739964986720413,
                -0.4929849313793633,
                -0.8532417805059482
              ],
              "variance": 1.419562315709452,
              "mean_reward": -0.5231831565690928,
              "min_reward": -1.1739964986720413,
              "max_reward": 0.2775423517524164,
              "num_responses": 6,
              "rvariance": 0.35808489333397553
            },
            {
              "id": "chat_hard_sample_8",
              "rewards": [
                -0.6306312821843729,
                -0.13574380283009344,
                0.43964598869750626,
                -0.845945421726849,
                0.30213063073043206,
                0.4535318065796215,
                -0.38859575782499006
              ],
              "variance": 1.1619572538517158,
              "mean_reward": -0.11508683407982077,
              "min_reward": -0.845945421726849,
              "max_reward": 0.4535318065796215,
              "num_responses": 7,
              "rvariance": 0.24004289584994493
            },
            {
              "id": "chat_hard_sample_32",
              "rewards": [
                -0.19301710311683812,
                0.08637907898022447,
                0.06217310288825389,
                0.190686309878268,
                0.3267613236890126,
                0.5871093005551921,
                -0.09079421640656002
              ],
              "variance": 0.5625838855261558,
              "mean_reward": 0.13847111378107899,
              "min_reward": -0.19301710311683812,
              "max_reward": 0.5871093005551921,
              "num_responses": 7,
              "rvariance": 0.058633978372386895
            },
            {
              "id": "chat_hard_sample_109",
              "rewards": [
                2.4210872234112473,
                -0.22299888235812887,
                1.8755640874634045,
                2.291233215280515,
                1.8755640874634045,
                1.8755640874634045,
                1.274125187137377
              ],
              "variance": 1.6678992591936332,
              "mean_reward": 1.627162715123032,
              "min_reward": -0.22299888235812887,
              "max_reward": 2.4210872234112473,
              "num_responses": 7,
              "rvariance": 0.6863069874774423
            },
            {
              "id": "chat_hard_sample_188",
              "rewards": [
                0.7507233945632598,
                0.7241451208644498,
                -1.1703321615756097,
                0.35037927466267393,
                0.595083128901411,
                0.3160683840989534,
                0.46517747381475294
              ],
              "variance": 1.0132682645148454,
              "mean_reward": 0.29017780218998446,
              "min_reward": -1.1703321615756097,
              "max_reward": 0.7507233945632598,
              "num_responses": 7,
              "rvariance": 0.3802008447765394
            },
            {
              "id": "chat_hard_sample_53",
              "rewards": [
                -0.4889039562697627,
                -1.9646785014256345,
                -0.1900706298547311,
                -0.25258133541505257,
                -1.1100442948334701,
                -0.6588461007659356,
                -0.7383812587701819
              ],
              "variance": 1.2243209242794117,
              "mean_reward": -0.7719294396192525,
              "min_reward": -1.9646785014256345,
              "max_reward": -0.1900706298547311,
              "num_responses": 7,
              "rvariance": 0.31989583625533224
            },
            {
              "id": "chat_hard_sample_356",
              "rewards": [
                -0.17865867230842722,
                -0.009786398832220286,
                -1.0878816916011003,
                -1.2233756050250564,
                -0.6168175969222662,
                -0.8076031832960937,
                -1.8877158811813712
              ],
              "variance": 1.378001952569638,
              "mean_reward": -0.8302627184523621,
              "min_reward": -1.8877158811813712,
              "max_reward": -0.009786398832220286,
              "num_responses": 7,
              "rvariance": 0.3547077095326237
            },
            {
              "id": "chat_hard_sample_63",
              "rewards": [
                0.8211606094710746,
                0.1567782078646749,
                0.3243734454362514,
                1.0158459738130414,
                0.9785880329262537,
                0.908023864607224,
                0.3956681729307273
              ],
              "variance": 0.736155858873348,
              "mean_reward": 0.6572054724356068,
              "min_reward": 0.1567782078646749,
              "max_reward": 1.0158459738130414,
              "num_responses": 7,
              "rvariance": 0.10732961094034375
            },
            {
              "id": "chat_hard_sample_159",
              "rewards": [
                -0.017023897393392596,
                -1.2397306667553023,
                -1.025883416173319,
                -0.8092905095433324
              ],
              "variance": 0.9208726105423328,
              "mean_reward": -0.7729821224663366,
              "min_reward": -1.2397306667553023,
              "max_reward": -0.017023897393392596,
              "num_responses": 4,
              "rvariance": 0.2136511012455257
            },
            {
              "id": "chat_hard_sample_152",
              "rewards": [
                0.5606418225607152,
                -0.1839318553615282,
                -0.1954846157820887,
                -0.5219464668432539,
                -0.027653360277844354,
                0.5868392360258802
              ],
              "variance": 0.9324560706059689,
              "mean_reward": 0.03641079338698003,
              "min_reward": -0.5219464668432539,
              "max_reward": 0.5868392360258802,
              "num_responses": 6,
              "rvariance": 0.16599717531704003
            },
            {
              "id": "chat_hard_sample_318",
              "rewards": [
                1.2252429302709806,
                1.590070390731784,
                1.6134716553149397,
                0.6581033792894725,
                1.5431864959701027,
                1.5046731589646871
              ],
              "variance": 0.6600978682431351,
              "mean_reward": 1.3557913350903277,
              "min_reward": 0.6581033792894725,
              "max_reward": 1.6134716553149397,
              "num_responses": 6,
              "rvariance": 0.11372998946917932
            },
            {
              "id": "chat_hard_sample_176",
              "rewards": [
                -2.4230495632268134,
                -1.986344110906146,
                -2.2726011150226966,
                -1.7437201286327337,
                -2.4321902088342897,
                -2.273789283539476,
                -1.1525679169808778
              ],
              "variance": 0.9194465774978127,
              "mean_reward": -2.040608903877576,
              "min_reward": -2.4321902088342897,
              "max_reward": -1.1525679169808778,
              "num_responses": 7,
              "rvariance": 0.18392780840534698
            },
            {
              "id": "chat_hard_sample_274",
              "rewards": [
                -0.47659293774767286,
                -2.3830525303604437,
                -1.776016499384857,
                -1.8525821016885937,
                -1.7318794147930994,
                -2.2672194445091027
              ],
              "variance": 1.2208998111643874,
              "mean_reward": -1.747890488080628,
              "min_reward": -2.3830525303604437,
              "max_reward": -0.47659293774767286,
              "num_responses": 6,
              "rvariance": 0.38355643456004535
            },
            {
              "id": "chat_hard_sample_389",
              "rewards": [
                -0.1385160036822599,
                -0.5517897514541283,
                0.09562532674339333,
                -0.5641284689023014,
                -0.2577921958844662,
                -0.3741957786274543,
                -0.626037876942232
              ],
              "variance": 0.5440327606062751,
              "mean_reward": -0.34526210696420695,
              "min_reward": -0.626037876942232,
              "max_reward": 0.09562532674339333,
              "num_responses": 7,
              "rvariance": 0.05928642977958325
            },
            {
              "id": "chat_hard_sample_42",
              "rewards": [
                0.25984995124721294,
                -0.22167856688149337,
                -0.44823500804801336,
                0.07954148366437924,
                -0.6305770384541265,
                -0.1237720961525236,
                -0.0763192192842154
              ],
              "variance": 0.6728366909079714,
              "mean_reward": -0.16588435627268286,
              "min_reward": -0.6305770384541265,
              "max_reward": 0.25984995124721294,
              "num_responses": 7,
              "rvariance": 0.07857901044183528
            },
            {
              "id": "chat_hard_sample_5",
              "rewards": [
                -0.16220666433688977,
                -0.22529789322303959,
                -0.127172139329244,
                0.004060755965570399,
                -0.2974859110837007,
                0.03661853533260451,
                0.06636602782410767
              ],
              "variance": 0.3026906326965098,
              "mean_reward": -0.1007310412643702,
              "min_reward": -0.2974859110837007,
              "max_reward": 0.06636602782410767,
              "num_responses": 7,
              "rvariance": 0.01663934582279347
            },
            {
              "id": "chat_hard_sample_17",
              "rewards": [
                0.28210142186743337,
                -0.6195990307497937,
                0.00665291379819566,
                0.04579322753672495,
                0.13468196664271276,
                0.41309252861997925
              ],
              "variance": 0.6540700337195053,
              "mean_reward": 0.04378717128587537,
              "min_reward": -0.6195990307497937,
              "max_reward": 0.41309252861997925,
              "num_responses": 6,
              "rvariance": 0.10715103720017227
            },
            {
              "id": "chat_hard_sample_182",
              "rewards": [
                1.5498244281937643,
                1.562304237046674,
                1.0974060387261662,
                1.4134248175929816
              ],
              "variance": 0.3663486220045902,
              "mean_reward": 1.4057398803898964,
              "min_reward": 1.0974060387261662,
              "max_reward": 1.562304237046674,
              "num_responses": 4,
              "rvariance": 0.03510039271653135
            },
            {
              "id": "chat_hard_sample_140",
              "rewards": [
                -0.9930255651070496,
                -1.2762736291125658,
                -1.2770768979689804,
                -0.9388753187361927,
                -0.6088887793309324
              ],
              "variance": 0.535872195333378,
              "mean_reward": -1.018828038051144,
              "min_reward": -1.2770768979689804,
              "max_reward": -0.6088887793309324,
              "num_responses": 5,
              "rvariance": 0.061615821356357944
            },
            {
              "id": "chat_hard_sample_251",
              "rewards": [
                0.16058738726208346,
                -0.05351146189848949,
                -0.6316122858164884,
                0.20151255055010295,
                -0.17120304470434922,
                -0.14881077120987224
              ],
              "variance": 0.582457634166512,
              "mean_reward": -0.10717293763616882,
              "min_reward": -0.6316122858164884,
              "max_reward": 0.20151255055010295,
              "num_responses": 6,
              "rvariance": 0.07512201165007211
            },
            {
              "id": "chat_hard_sample_98",
              "rewards": [
                0.716444819413303,
                0.3495610022212976,
                0.7723551017123671,
                0.808647619612961,
                0.23947450580817345,
                0.9335386149566286,
                1.0219247339663973
              ],
              "variance": 0.6633666589044882,
              "mean_reward": 0.6917066282415897,
              "min_reward": 0.23947450580817345,
              "max_reward": 1.0219247339663973,
              "num_responses": 7,
              "rvariance": 0.07284222556442957
            },
            {
              "id": "chat_hard_sample_409",
              "rewards": [
                -0.8994043490675445,
                -2.286096839695806,
                -1.6571194362334154,
                -2.1613097153249505,
                -2.1031950601584266,
                -2.255683418856384
              ],
              "variance": 0.9926282366256154,
              "mean_reward": -1.8938014698894212,
              "min_reward": -2.286096839695806,
              "max_reward": -0.8994043490675445,
              "num_responses": 6,
              "rvariance": 0.240850759689296
            },
            {
              "id": "chat_hard_sample_248",
              "rewards": [
                -0.5209296854316141,
                -1.7096406395140005,
                -1.3709104724417904,
                -1.2783925969579353,
                -1.0769359993105312,
                -0.568031709236201,
                -1.2732509838037298
              ],
              "variance": 0.9572116395563081,
              "mean_reward": -1.1140131552422574,
              "min_reward": -1.7096406395140005,
              "max_reward": -0.5209296854316141,
              "num_responses": 7,
              "rvariance": 0.1606234393636308
            },
            {
              "id": "chat_hard_sample_382",
              "rewards": [
                -0.20581862345498567,
                -1.1208168688360187,
                -0.4115200815246497,
                -0.31516590477826273,
                -0.6308540277149591,
                -0.1749585574324715,
                -0.4739199913806381
              ],
              "variance": 0.633364567117403,
              "mean_reward": -0.47615057930314075,
              "min_reward": -1.1208168688360187,
              "max_reward": -0.1749585574324715,
              "num_responses": 7,
              "rvariance": 0.09048884634275481
            },
            {
              "id": "chat_hard_sample_254",
              "rewards": [
                0.1817574456431365,
                -0.4185636876032392,
                0.017506276335153784,
                -0.15093320142100217,
                -0.4177708058441058,
                -0.08250300453230362
              ],
              "variance": 0.5177991077128177,
              "mean_reward": -0.1450844962370601,
              "min_reward": -0.4185636876032392,
              "max_reward": 0.1817574456431365,
              "num_responses": 6,
              "rvariance": 0.047726792718562866
            },
            {
              "id": "chat_hard_sample_2",
              "rewards": [
                -0.36211904685515206,
                0.29590125766649844,
                0.2721909769392263,
                -0.14954017626339813,
                -0.14360221898429887,
                0.05570367246493203,
                -0.2486769409592328
              ],
              "variance": 0.5757288725477356,
              "mean_reward": -0.04002035371306073,
              "min_reward": -0.36211904685515206,
              "max_reward": 0.29590125766649844,
              "num_responses": 7,
              "rvariance": 0.0556416095766893
            },
            {
              "id": "chat_hard_sample_203",
              "rewards": [
                0.8783773577837327,
                0.2860427482246975,
                0.5676761956639436,
                -1.0782990172982116,
                0.5340427746673427,
                0.5103244150866296,
                -0.049858666021259324
              ],
              "variance": 1.1531914670438994,
              "mean_reward": 0.2354722583009822,
              "min_reward": -1.0782990172982116,
              "max_reward": 0.8783773577837327,
              "num_responses": 7,
              "rvariance": 0.35690579424123137
            },
            {
              "id": "chat_hard_sample_68",
              "rewards": [
                0.09809976414016473,
                0.3757295626384593,
                -0.04976749038956858,
                -0.3583658423708701,
                0.3046737383814515
              ],
              "variance": 0.5822337345140056,
              "mean_reward": 0.07407394647992738,
              "min_reward": -0.3583658423708701,
              "max_reward": 0.3757295626384593,
              "num_responses": 5,
              "rvariance": 0.06941809743329529
            },
            {
              "id": "chat_hard_sample_220",
              "rewards": [
                -0.5964519615195478,
                -1.8577341019400804,
                -2.1355828950727207,
                -1.9124925705628488,
                -2.201412566744873,
                -2.155176711441348,
                -2.3821181965334737
              ],
              "variance": 0.9204735728884463,
              "mean_reward": -1.8915670005449847,
              "min_reward": -2.3821181965334737,
              "max_reward": -0.5964519615195478,
              "num_responses": 7,
              "rvariance": 0.30636915657984903
            },
            {
              "id": "chat_hard_sample_11",
              "rewards": [
                0.30980381031645565,
                0.5348697030231201,
                0.17501218008090216,
                0.33883343897363427
              ],
              "variance": 0.26060915465670614,
              "mean_reward": 0.33962978309852804,
              "min_reward": 0.17501218008090216,
              "max_reward": 0.5348697030231201,
              "num_responses": 4,
              "rvariance": 0.01652695109294799
            },
            {
              "id": "chat_hard_sample_6",
              "rewards": [
                -0.4956186376011134,
                -0.7357706349868345,
                -0.49508427915209047,
                -0.3244300414311937,
                -0.9900006115543734,
                -0.37764314080290023
              ],
              "variance": 0.5118490321535569,
              "mean_reward": -0.5697578909214177,
              "min_reward": -0.9900006115543734,
              "max_reward": -0.3244300414311937,
              "num_responses": 6,
              "rvariance": 0.05205513059388081
            },
            {
              "id": "chat_hard_sample_286",
              "rewards": [
                -1.2620404205324895,
                -1.4879961412395788,
                -1.4008974452317218,
                -2.197871143632936,
                -0.8248469189048444,
                -1.3273469864443403
              ],
              "variance": 0.7994899727175904,
              "mean_reward": -1.4168331759976518,
              "min_reward": -2.197871143632936,
              "max_reward": -0.8248469189048444,
              "num_responses": 6,
              "rvariance": 0.16629245431282386
            },
            {
              "id": "chat_hard_sample_400",
              "rewards": [
                0.30047735107983736,
                0.11269132757644308,
                -0.7007938160751955,
                -1.334697588953686,
                -0.8515867696724734,
                -1.166445078948592,
                -0.7930381646639785
              ],
              "variance": 1.4215518199284305,
              "mean_reward": -0.6333418199510922,
              "min_reward": -1.334697588953686,
              "max_reward": 0.30047735107983736,
              "num_responses": 7,
              "rvariance": 0.32605232189091143
            },
            {
              "id": "chat_hard_sample_209",
              "rewards": [
                -0.6503102150446104,
                0.18557989744262665,
                -0.23101425909347278,
                -0.12330236853102829,
                -0.5134590542425743,
                -0.8808368356163979,
                -0.58441216164869
              ],
              "variance": 0.7427714011317591,
              "mean_reward": -0.39967928524773527,
              "min_reward": -0.8808368356163979,
              "max_reward": 0.18557989744262665,
              "num_responses": 7,
              "rvariance": 0.11268013210976426
            },
            {
              "id": "chat_hard_sample_337",
              "rewards": [
                1.4540060525488006,
                0.8173416200373449,
                1.2094591588912018,
                1.1554387512363602,
                0.9346004071231536,
                1.1700453182576005,
                1.132823155150337
              ],
              "variance": 0.4195810240654112,
              "mean_reward": 1.1248163518921142,
              "min_reward": 0.8173416200373449,
              "max_reward": 1.4540060525488006,
              "num_responses": 7,
              "rvariance": 0.035614368543876965
            },
            {
              "id": "chat_hard_sample_268",
              "rewards": [
                1.9042414204044615,
                1.4220114846787928,
                1.5011611659617137,
                1.4220114846787928,
                1.4220114846787928,
                1.6765957766758133
              ],
              "variance": 0.3684071138613445,
              "mean_reward": 1.558005469513061,
              "min_reward": 1.4220114846787928,
              "max_reward": 1.9042414204044615,
              "num_responses": 6,
              "rvariance": 0.03210956020369591
            },
            {
              "id": "chat_hard_sample_249",
              "rewards": [
                0.3819185414351881,
                0.0985556422986184,
                0.23884320111785912,
                0.3248489436673474,
                -0.3080715173351873,
                0.31645386082027877,
                0.15448323642648462
              ],
              "variance": 0.41177200432938754,
              "mean_reward": 0.17243312977579842,
              "min_reward": -0.3080715173351873,
              "max_reward": 0.3819185414351881,
              "num_responses": 7,
              "rvariance": 0.04699025489871671
            },
            {
              "id": "chat_hard_sample_295",
              "rewards": [
                -0.28397979931331013,
                0.6069694305568908,
                0.640325862292659,
                0.5425238395974615,
                0.5203017990862046,
                0.6209060298034921,
                0.6779767816932528
              ],
              "variance": 0.45679707032649775,
              "mean_reward": 0.4750034205309501,
              "min_reward": -0.28397979931331013,
              "max_reward": 0.6779767816932528,
              "num_responses": 7,
              "rvariance": 0.098556967483156
            },
            {
              "id": "chat_hard_sample_153",
              "rewards": [
                0.06851904226612121,
                0.06851904226612121,
                0.06851904226612121,
                0.3198238968270757,
                0.06851904226612121,
                -0.9284005081890392
              ],
              "variance": 0.6241122025080574,
              "mean_reward": -0.05575007371624644,
              "min_reward": -0.9284005081890392,
              "max_reward": 0.3198238968270757,
              "num_responses": 6,
              "rvariance": 0.1607243068138978
            },
            {
              "id": "chat_hard_sample_192",
              "rewards": [
                -1.4624409966229694,
                -2.25497132563166,
                -1.8834896309750735,
                -2.33725098556199,
                -2.1174946307489106
              ],
              "variance": 0.6734786712260468,
              "mean_reward": -2.011129513908121,
              "min_reward": -2.33725098556199,
              "max_reward": -1.4624409966229694,
              "num_responses": 5,
              "rvariance": 0.0988957220429196
            },
            {
              "id": "chat_hard_sample_363",
              "rewards": [
                -0.11303876229525961,
                -1.5007157189213969,
                -0.6605368893789347,
                -1.1248285966304112,
                -0.7862219206036558,
                -1.4793690798865629
              ],
              "variance": 1.1032545735668828,
              "mean_reward": -0.9441184946193703,
              "min_reward": -1.5007157189213969,
              "max_reward": -0.11303876229525961,
              "num_responses": 6,
              "rvariance": 0.2374988627491652
            },
            {
              "id": "chat_hard_sample_129",
              "rewards": [
                1.3573598829566191,
                -0.32062374733858545,
                -0.4586382630361185,
                -0.3939797365824241,
                -0.3939797365824241
              ],
              "variance": 1.1189412832931782,
              "mean_reward": -0.04197232011658662,
              "min_reward": -0.4586382630361185,
              "max_reward": 1.3573598829566191,
              "num_responses": 5,
              "rvariance": 0.4914412365866996
            },
            {
              "id": "chat_hard_sample_359",
              "rewards": [
                0.5672283963589307,
                0.5505986536116925,
                0.6104058285740955,
                -0.25924523538191735,
                0.5506436643665777,
                0.2764202567155643,
                0.040481958460259475
              ],
              "variance": 0.6639082883216079,
              "mean_reward": 0.33379050324360043,
              "min_reward": -0.25924523538191735,
              "max_reward": 0.6104058285740955,
              "num_responses": 7,
              "rvariance": 0.09515042723165763
            },
            {
              "id": "chat_hard_sample_7",
              "rewards": [
                -1.56697847484408,
                -0.8870367785713681,
                -0.6284234469511529,
                -0.48326837893373903,
                -0.5949712230960135,
                -0.8137131047412932
              ],
              "variance": 0.6878878256928479,
              "mean_reward": -0.829065234522941,
              "min_reward": -1.56697847484408,
              "max_reward": -0.48326837893373903,
              "num_responses": 6,
              "rvariance": 0.12712415608179448
            },
            {
              "id": "chat_hard_sample_316",
              "rewards": [
                -0.9437099354596421,
                -2.1435120011945346,
                -1.786341274082393,
                -1.6129881222512583,
                -2.158002001901841,
                -1.6421741344286154,
                -1.675101809871053
              ],
              "variance": 0.8040311539428457,
              "mean_reward": -1.7088327541699055,
              "min_reward": -2.158002001901841,
              "max_reward": -0.9437099354596421,
              "num_responses": 7,
              "rvariance": 0.1424124144184088
            },
            {
              "id": "chat_hard_sample_41",
              "rewards": [
                -0.8118491978402738,
                -0.009875843281030819,
                0.20775461895515804,
                0.1669616026269941,
                -0.0966761987725327,
                -0.5471270988967792
              ],
              "variance": 0.8668462591596025,
              "mean_reward": -0.18180201953474406,
              "min_reward": -0.8118491978402738,
              "max_reward": 0.20775461895515804,
              "num_responses": 6,
              "rvariance": 0.14010288577970473
            },
            {
              "id": "chat_hard_sample_143",
              "rewards": [
                0.8433555281172084,
                0.20670379094687427,
                0.0005176016707531463,
                -0.22448885375702432
              ],
              "variance": 0.8093469240947994,
              "mean_reward": 0.20652201674445284,
              "min_reward": -0.22448885375702432,
              "max_reward": 0.8433555281172084,
              "num_responses": 4,
              "rvariance": 0.15844128594237814
            },
            {
              "id": "chat_hard_sample_370",
              "rewards": [
                0.5533269978308937,
                0.19291434224509038,
                0.4471714406777525,
                -0.6203030451210766,
                0.21211085214271103,
                0.30774947329861374,
                0.41848977977949486
              ],
              "variance": 0.6220062762403853,
              "mean_reward": 0.21592283440763996,
              "min_reward": -0.6203030451210766,
              "max_reward": 0.5533269978308937,
              "num_responses": 7,
              "rvariance": 0.13094294712549576
            },
            {
              "id": "chat_hard_sample_91",
              "rewards": [
                0.4686190653805982,
                0.228117369053076,
                0.24515797920388277,
                0.6499916333737973,
                0.022770226412893686,
                0.3904186493769891,
                0.2559478650352334
              ],
              "variance": 0.39518958058087483,
              "mean_reward": 0.3230032554052101,
              "min_reward": 0.022770226412893686,
              "max_reward": 0.6499916333737973,
              "num_responses": 7,
              "rvariance": 0.03462424490242118
            },
            {
              "id": "chat_hard_sample_245",
              "rewards": [
                -0.1386510359469158,
                -1.4472487127272604,
                -0.8832627998925237,
                -1.0494448151728937,
                -0.9376057846240432,
                -0.9249231388436696,
                -0.5448073138373061
              ],
              "variance": 0.8262215715134906,
              "mean_reward": -0.8465633715778018,
              "min_reward": -1.4472487127272604,
              "max_reward": -0.1386510359469158,
              "num_responses": 7,
              "rvariance": 0.1442794535266289
            },
            {
              "id": "chat_hard_sample_131",
              "rewards": [
                0.5564592847221426,
                -0.49673467349788486,
                -0.39259594440018114,
                0.23054794981688223,
                0.4491351791248638,
                0.5534839584120322
              ],
              "variance": 0.9996369305161205,
              "mean_reward": 0.1500492923629758,
              "min_reward": -0.49673467349788486,
              "max_reward": 0.5564592847221426,
              "num_responses": 6,
              "rvariance": 0.1894423941079939
            },
            {
              "id": "chat_hard_sample_171",
              "rewards": [
                -0.8929643487531861,
                -0.5313802594184448,
                -0.601013051347925,
                -0.6108496324732434,
                -0.6663074989796143,
                -1.0272787495747633,
                -0.41557682007392743
              ],
              "variance": 0.4616312254011791,
              "mean_reward": -0.6779100515173007,
              "min_reward": -1.0272787495747633,
              "max_reward": -0.41557682007392743,
              "num_responses": 7,
              "rvariance": 0.038448772842406664
            },
            {
              "id": "chat_hard_sample_329",
              "rewards": [
                1.453635579412437,
                0.9725623623812242,
                0.8042267555978805,
                1.2512481824364432,
                1.2512481824364432
              ],
              "variance": 0.5011196223108215,
              "mean_reward": 1.1465842124528856,
              "min_reward": 0.8042267555978805,
              "max_reward": 1.453635579412437,
              "num_responses": 5,
              "rvariance": 0.052736373548751526
            },
            {
              "id": "chat_hard_sample_384",
              "rewards": [
                -0.2794966127145422,
                0.37330359836233357,
                -0.7839875405662726,
                -0.11423212436068014,
                -0.6100082775934643,
                -0.21331579944818854,
                -0.30733518755014055
              ],
              "variance": 0.7603821475111131,
              "mean_reward": -0.27643884912442207,
              "min_reward": -0.7839875405662726,
              "max_reward": 0.37330359836233357,
              "num_responses": 7,
              "rvariance": 0.11747128006641085
            },
            {
              "id": "chat_hard_sample_29",
              "rewards": [
                -0.0039038394052875367,
                -0.22133175324449253,
                0.004113268512936584,
                -0.3971091381688726,
                -0.2208372120017143,
                0.06502609227482987,
                -0.2590744253377372
              ],
              "variance": 0.34276670848788526,
              "mean_reward": -0.14758814391004824,
              "min_reward": -0.3971091381688726,
              "max_reward": 0.06502609227482987,
              "num_responses": 7,
              "rvariance": 0.02490811067672561
            },
            {
              "id": "chat_hard_sample_106",
              "rewards": [
                -0.6379230244757916,
                -0.09551919154759644,
                -0.7007338017353484,
                -1.1101920224392474,
                -0.5821339249783417,
                0.0664410457489165,
                -0.7922372040514042
              ],
              "variance": 0.8886840347775502,
              "mean_reward": -0.5503283033541162,
              "min_reward": -1.1101920224392474,
              "max_reward": 0.0664410457489165,
              "num_responses": 7,
              "rvariance": 0.14150418643403048
            },
            {
              "id": "chat_hard_sample_320",
              "rewards": [
                -0.05655141903612748,
                -0.8298800445985571,
                -0.27885838329270707,
                -0.5895618536563365,
                -0.7495323847625351,
                -0.2480121667332345
              ],
              "variance": 0.6374244217958651,
              "mean_reward": -0.4587327086799163,
              "min_reward": -0.8298800445985571,
              "max_reward": -0.05655141903612748,
              "num_responses": 6,
              "rvariance": 0.07965646186931162
            },
            {
              "id": "chat_hard_sample_23",
              "rewards": [
                -0.17656509514530067,
                -0.16161459979186005,
                0.13526883763910189,
                -0.14766588226509741,
                0.010684838726190473,
                0.09692659920834658,
                0.29191722879818927
              ],
              "variance": 0.36552299203597316,
              "mean_reward": 0.0069931324527957184,
              "min_reward": -0.17656509514530067,
              "max_reward": 0.29191722879818927,
              "num_responses": 7,
              "rvariance": 0.02739709364033052
            },
            {
              "id": "chat_hard_sample_235",
              "rewards": [
                -1.1321162994951093,
                -1.0421115244923502,
                -0.8811819180705186,
                -1.402282968596845,
                -1.0993894412667753,
                -1.227245375823272,
                -1.2011172096733151
              ],
              "variance": 0.31952073100908374,
              "mean_reward": -1.1407778196311695,
              "min_reward": -1.402282968596845,
              "max_reward": -0.8811819180705186,
              "num_responses": 7,
              "rvariance": 0.02263078755689459
            },
            {
              "id": "chat_hard_sample_202",
              "rewards": [
                1.9364916262797796,
                1.6272662975653642,
                1.3231349744759486,
                1.5109163814916624,
                1.3199063184043685,
                1.3231349744759486,
                0.9141424419668245
              ],
              "variance": 0.5933556612217796,
              "mean_reward": 1.422141859237128,
              "min_reward": 0.9141424419668245,
              "max_reward": 1.9364916262797796,
              "num_responses": 7,
              "rvariance": 0.08609041058205527
            },
            {
              "id": "chat_hard_sample_304",
              "rewards": [
                0.00116044758026885,
                0.09421614387890738,
                0.339323940789692,
                0.33172981855519773,
                -0.27163127182881597,
                0.317516807108724,
                -0.00210975688043626
              ],
              "variance": 0.44468583030878356,
              "mean_reward": 0.11574373274336254,
              "min_reward": -0.27163127182881597,
              "max_reward": 0.339323940789692,
              "num_responses": 7,
              "rvariance": 0.044984582534013294
            },
            {
              "id": "chat_hard_sample_277",
              "rewards": [
                0.883967924364871,
                0.5168879064464426,
                0.0722578202264015,
                0.27336125656624405,
                -0.2665300529418152,
                0.5280297994634346
              ],
              "variance": 0.8031349782718596,
              "mean_reward": 0.33466244235426307,
              "min_reward": -0.2665300529418152,
              "max_reward": 0.883967924364871,
              "num_responses": 6,
              "rvariance": 0.1343966674365518
            },
            {
              "id": "chat_hard_sample_196",
              "rewards": [
                1.0424681041448165,
                0.6622420604950799,
                0.17787036301611878,
                1.0838156760556057,
                0.7601196781760463,
                0.8623391025205639,
                0.9478462644005535
              ],
              "variance": 0.5905137514056367,
              "mean_reward": 0.7909573212583977,
              "min_reward": 0.17787036301611878,
              "max_reward": 1.0838156760556057,
              "num_responses": 7,
              "rvariance": 0.08173248371572887
            },
            {
              "id": "chat_hard_sample_185",
              "rewards": [
                -2.094016328527586,
                -2.8254399412918003,
                -2.5212884210687823,
                -2.3272470567582517,
                -2.7607098592790575,
                -2.5795611909383647,
                -2.606717679719163
              ],
              "variance": 0.5526471266181692,
              "mean_reward": -2.530711496797572,
              "min_reward": -2.8254399412918003,
              "max_reward": -2.094016328527586,
              "num_responses": 7,
              "rvariance": 0.05430236827216682
            },
            {
              "id": "chat_hard_sample_160",
              "rewards": [
                0.39246202223658977,
                -0.09228880429313603,
                -0.018021058732390023,
                0.5729978518376903,
                -0.05123091698430092,
                0.6609961858822931,
                0.3530060561529033
              ],
              "variance": 0.6758512573633664,
              "mean_reward": 0.25970304801423566,
              "min_reward": -0.09228880429313603,
              "max_reward": 0.6609961858822931,
              "num_responses": 7,
              "rvariance": 0.08331844104510878
            },
            {
              "id": "chat_hard_sample_163",
              "rewards": [
                2.2282475885500577,
                2.186311414459999,
                2.186311414459999,
                1.3917457914451485,
                2.186311414459999,
                2.13579665213757
              ],
              "variance": 0.44350827971366913,
              "mean_reward": 2.0524540459187954,
              "min_reward": 1.3917457914451485,
              "max_reward": 2.2282475885500577,
              "num_responses": 6,
              "rvariance": 0.0880230237516879
            },
            {
              "id": "chat_hard_sample_266",
              "rewards": [
                -0.2984115168636497,
                -1.3429449441949772,
                -0.47872575505608406,
                -1.2570863521903062,
                -1.0733986156253146,
                -1.0361689507255702,
                -1.0559286721202172
              ],
              "variance": 0.8848297292130645,
              "mean_reward": -0.934666400968017,
              "min_reward": -1.3429449441949772,
              "max_reward": -0.2984115168636497,
              "num_responses": 7,
              "rvariance": 0.13251458247756537
            },
            {
              "id": "chat_hard_sample_289",
              "rewards": [
                -0.3517942721576162,
                -1.5268565804124752,
                -0.3460213543130964,
                -0.449242556484292,
                -0.7201853725773191,
                -0.5148947819112234,
                -0.6021071589282139
              ],
              "variance": 0.6933687506915731,
              "mean_reward": -0.6444431538263194,
              "min_reward": -1.5268565804124752,
              "max_reward": -0.3460213543130964,
              "num_responses": 7,
              "rvariance": 0.1451096668314353
            },
            {
              "id": "chat_hard_sample_69",
              "rewards": [
                -0.18064491613298111,
                -1.3602002210229291,
                -0.9856795790853845,
                -0.9491908604583675,
                -0.7111809133564188,
                -1.2124743464284127,
                -1.246291849871275
              ],
              "variance": 0.7928886838648931,
              "mean_reward": -0.9493803837651098,
              "min_reward": -1.3602002210229291,
              "max_reward": -0.18064491613298111,
              "num_responses": 7,
              "rvariance": 0.13930838071118354
            },
            {
              "id": "chat_hard_sample_40",
              "rewards": [
                0.05011541412763394,
                -0.3325412102859089,
                0.007873974789699456,
                -0.0014998034456444296,
                -0.3392293468130965,
                0.07205354064653745,
                -0.3287556903878631
              ],
              "variance": 0.39410712963197925,
              "mean_reward": -0.12456901733837744,
              "min_reward": -0.3392293468130965,
              "max_reward": 0.07205354064653745,
              "num_responses": 7,
              "rvariance": 0.033269420859680814
            },
            {
              "id": "chat_hard_sample_313",
              "rewards": [
                -0.0547267522803926,
                -0.8250269619243855,
                -1.4486625120794268,
                -1.4278052207387306,
                -1.4264722099209737,
                -1.1199905175412015,
                -1.1174156715373782
              ],
              "variance": 0.9192412592082211,
              "mean_reward": -1.0600142637174985,
              "min_reward": -1.4486625120794268,
              "max_reward": -0.0547267522803926,
              "num_responses": 7,
              "rvariance": 0.21333188009355777
            },
            {
              "id": "chat_hard_sample_226",
              "rewards": [
                0.9115554776828398,
                1.2299055828283296,
                1.0533970616675434,
                1.0409377384787162,
                1.0533970616675434,
                1.6052303592137291,
                1.0533970616675434
              ],
              "variance": 0.39085065922212403,
              "mean_reward": 1.1354029061723208,
              "min_reward": 0.9115554776828398,
              "max_reward": 1.6052303592137291,
              "num_responses": 7,
              "rvariance": 0.044124972324869456
            },
            {
              "id": "chat_hard_sample_28",
              "rewards": [
                -0.17208825621709345,
                -0.37475437363680003,
                -0.7128913220420601,
                -0.15527385396263335,
                -0.4338927349464844,
                -0.585762484295249,
                -0.6288447014520026
              ],
              "variance": 0.4971008543727161,
              "mean_reward": -0.4376439609360462,
              "min_reward": -0.7128913220420601,
              "max_reward": -0.15527385396263335,
              "num_responses": 7,
              "rvariance": 0.04121140163426224
            },
            {
              "id": "chat_hard_sample_323",
              "rewards": [
                -0.030880862227504434,
                0.6286778868136873,
                0.34963024953650573,
                0.4419132612096133
              ],
              "variance": 0.48937602783076656,
              "mean_reward": 0.34733513383307546,
              "min_reward": -0.030880862227504434,
              "max_reward": 0.6286778868136873,
              "num_responses": 4,
              "rvariance": 0.057787843516237725
            },
            {
              "id": "chat_hard_sample_116",
              "rewards": [
                0.3203594093980187,
                0.27338664724848705,
                0.7633818037833104,
                0.5466538648886679,
                0.5768837803427879,
                0.7214606332782136,
                0.7382167523757069
              ],
              "variance": 0.4467124684005423,
              "mean_reward": 0.5629061273307417,
              "min_reward": 0.27338664724848705,
              "max_reward": 0.7633818037833104,
              "num_responses": 7,
              "rvariance": 0.03416768485775207
            },
            {
              "id": "chat_hard_sample_36",
              "rewards": [
                -0.7672804716503852,
                -0.5490983391363714,
                -0.6436774763695893,
                -0.5598939955773227,
                -0.665558473853446,
                -0.30569633442354754,
                -0.47333946805480975
              ],
              "variance": 0.2999650583699169,
              "mean_reward": -0.5663635084379246,
              "min_reward": -0.7672804716503852,
              "max_reward": -0.30569633442354754,
              "num_responses": 7,
              "rvariance": 0.019017929324735415
            },
            {
              "id": "chat_hard_sample_351",
              "rewards": [
                0.6795867817718425,
                0.4990145973302577,
                0.6860544810122842,
                0.95766668781899,
                0.9970020481620223,
                0.8663548697416769,
                0.7775059478419337
              ],
              "variance": 0.36604292396099436,
              "mean_reward": 0.7804550590970011,
              "min_reward": 0.4990145973302577,
              "max_reward": 0.9970020481620223,
              "num_responses": 7,
              "rvariance": 0.026282663798023426
            },
            {
              "id": "chat_hard_sample_296",
              "rewards": [
                0.41207170778161906,
                0.48612363254329966,
                0.5419450474545133,
                0.20577472280116488,
                0.07952648007941748,
                0.584416734115515
              ],
              "variance": 0.42053028934472303,
              "mean_reward": 0.3849763874625882,
              "min_reward": 0.07952648007941748,
              "max_reward": 0.584416734115515,
              "num_responses": 6,
              "rvariance": 0.03346556936685357
            },
            {
              "id": "chat_hard_sample_338",
              "rewards": [
                -0.7363084558016177,
                -1.6046513225611565,
                -1.2469231545615893,
                -0.7807744651406142,
                -1.4853555102863079,
                -1.2129031027217432,
                -1.274518209672039
              ],
              "variance": 0.7700857737912318,
              "mean_reward": -1.191633460106438,
              "min_reward": -1.6046513225611565,
              "max_reward": -0.7363084558016177,
              "num_responses": 7,
              "rvariance": 0.09190880006836019
            },
            {
              "id": "chat_hard_sample_354",
              "rewards": [
                0.8609685827404026,
                1.4403412490143912,
                1.0084191992569669,
                1.3112550204910296,
                0.9105011873087957,
                1.5967830523497744,
                1.1853120430171582
              ],
              "variance": 0.612229824867106,
              "mean_reward": 1.1876543334540741,
              "min_reward": 0.8609685827404026,
              "max_reward": 1.5967830523497744,
              "num_responses": 7,
              "rvariance": 0.06602604022133689
            },
            {
              "id": "chat_hard_sample_186",
              "rewards": [
                1.026092268220008,
                1.407925426643534,
                1.0568346138066684,
                1.1046181466050955,
                1.2218475035819407,
                1.3155985583374612
              ],
              "variance": 0.32029855147715947,
              "mean_reward": 1.1888194195324513,
              "min_reward": 1.026092268220008,
              "max_reward": 1.407925426643534,
              "num_responses": 6,
              "rvariance": 0.019360202633934075
            },
            {
              "id": "chat_hard_sample_54",
              "rewards": [
                0.29713847636488416,
                0.3157192622181123,
                0.011467910449002689,
                -0.06101556262321319,
                0.6664494119549353,
                0.22009564464717135,
                0.3083299966244421
              ],
              "variance": 0.4735368008927253,
              "mean_reward": 0.2511693056621907,
              "min_reward": -0.06101556262321319,
              "max_reward": 0.6664494119549353,
              "num_responses": 7,
              "rvariance": 0.048269499440380045
            },
            {
              "id": "chat_hard_sample_241",
              "rewards": [
                0.6541395475547657,
                -0.040155963038676704,
                0.1095521159536734,
                0.20440247183812327,
                -0.23968056059177334,
                0.09185250218646904,
                -0.18064837849874152
              ],
              "variance": 0.5885585534607347,
              "mean_reward": 0.08563739077197711,
              "min_reward": -0.23968056059177334,
              "max_reward": 0.6541395475547657,
              "num_responses": 7,
              "rvariance": 0.07578203381375419
            },
            {
              "id": "chat_hard_sample_67",
              "rewards": [
                1.373229059358488,
                1.001016084200255,
                0.6115443698483096,
                0.9222859262353035,
                0.8541973494349652,
                0.9046036242969011,
                1.0831739842680101
              ],
              "variance": 0.44205985670389836,
              "mean_reward": 0.9642929139488903,
              "min_reward": 0.6115443698483096,
              "max_reward": 1.373229059358488,
              "num_responses": 7,
              "rvariance": 0.04637000544894822
            },
            {
              "id": "chat_hard_sample_262",
              "rewards": [
                0.6604987593347146,
                0.22160350493582892,
                0.6224438972620732,
                0.4913241059154321,
                0.2348816776269926,
                0.14488209617287395,
                0.554552675310078
              ],
              "variance": 0.44675090066048284,
              "mean_reward": 0.4185981023654276,
              "min_reward": 0.14488209617287395,
              "max_reward": 0.6604987593347146,
              "num_responses": 7,
              "rvariance": 0.03876011451675145
            },
            {
              "id": "chat_hard_sample_244",
              "rewards": [
                -1.4846780407191882,
                -2.1903993583219763,
                -2.0489063191571533,
                -2.263930197036715,
                -2.2114888445664795,
                -1.8539335784570727,
                -2.165842529166284
              ],
              "variance": 0.5262340221926551,
              "mean_reward": -2.031311266774981,
              "min_reward": -2.263930197036715,
              "max_reward": -1.4846780407191882,
              "num_responses": 7,
              "rvariance": 0.06579478881386967
            },
            {
              "id": "chat_hard_sample_85",
              "rewards": [
                0.9609801718517003,
                1.0980067591855969,
                1.045453240491248,
                1.3371096597459144,
                0.9304432599668241,
                1.1263831548359786,
                1.1447896682792662
              ],
              "variance": 0.2729522577681758,
              "mean_reward": 1.0918808449080755,
              "min_reward": 0.9304432599668241,
              "max_reward": 1.3371096597459144,
              "num_responses": 7,
              "rvariance": 0.015645293417650398
            },
            {
              "id": "chat_hard_sample_398",
              "rewards": [
                -1.0958324375089166,
                -1.5300950465203766,
                -1.5300950465203766,
                -1.2578111407561516,
                -1.4986740772446763,
                -1.5300950465203766,
                -1.4612851435199534
              ],
              "variance": 0.3370753870631191,
              "mean_reward": -1.4148411340844038,
              "min_reward": -1.5300950465203766,
              "max_reward": -1.0958324375089166,
              "num_responses": 7,
              "rvariance": 0.025065766951745973
            },
            {
              "id": "chat_hard_sample_319",
              "rewards": [
                -0.5312775425675527,
                -0.06805339809220198,
                0.006345917367439507,
                -0.15474007257457048,
                -1.7620677818580945,
                -1.5627021645994965,
                -0.1758079911656915
              ],
              "variance": 1.6041547395945903,
              "mean_reward": -0.6069004333557383,
              "min_reward": -1.7620677818580945,
              "max_reward": 0.006345917367439507,
              "num_responses": 7,
              "rvariance": 0.472914896252632
            },
            {
              "id": "chat_hard_sample_190",
              "rewards": [
                0.5428169865651761,
                1.0549614739302877,
                0.7569066027503879,
                0.674530573639727,
                0.8668880740687797,
                1.051456405658835
              ],
              "variance": 0.4445351596921099,
              "mean_reward": 0.8245933527688655,
              "min_reward": 0.5428169865651761,
              "max_reward": 1.0549614739302877,
              "num_responses": 6,
              "rvariance": 0.035470568970469726
            },
            {
              "id": "chat_hard_sample_20",
              "rewards": [
                0.2277936378544779,
                0.7739362487429533,
                0.7823440269311435,
                0.5326762943139018,
                0.5800691568423629,
                0.7217208877712044,
                0.5481195997272404
              ],
              "variance": 0.3665761282880971,
              "mean_reward": 0.5952371217404692,
              "min_reward": 0.2277936378544779,
              "max_reward": 0.7823440269311435,
              "num_responses": 7,
              "rvariance": 0.03204560200702692
            },
            {
              "id": "chat_hard_sample_264",
              "rewards": [
                0.27852248979309185,
                0.3534688590428778,
                0.672671283226388,
                0.7962038770700557,
                0.8191980251458835,
                0.7823584534551452,
                0.8459990443752797
              ],
              "variance": 0.5064281214946786,
              "mean_reward": 0.6497745760155318,
              "min_reward": 0.27852248979309185,
              "max_reward": 0.8459990443752797,
              "num_responses": 7,
              "rvariance": 0.047482545785545935
            },
            {
              "id": "chat_hard_sample_27",
              "rewards": [
                0.3373255786849767,
                0.18967125964950848,
                0.15940210405010388,
                0.1348487372601724,
                0.36598761951059205,
                -0.06032886008073232,
                -0.28662504675426165
              ],
              "variance": 0.4996377297653669,
              "mean_reward": 0.12004019890290851,
              "min_reward": -0.28662504675426165,
              "max_reward": 0.36598761951059205,
              "num_responses": 7,
              "rvariance": 0.04460426092006474
            },
            {
              "id": "chat_hard_sample_115",
              "rewards": [
                0.28805669097533465,
                0.14431195994432683,
                -0.021389940617266755,
                -0.24317985825362542,
                0.39651760666394736,
                0.061289045497429785,
                0.11800028840906827
              ],
              "variance": 0.44154696492258994,
              "mean_reward": 0.10622939894560211,
              "min_reward": -0.24317985825362542,
              "max_reward": 0.39651760666394736,
              "num_responses": 7,
              "rvariance": 0.03704434331045757
            },
            {
              "id": "chat_hard_sample_260",
              "rewards": [
                0.13484238958961164,
                -0.16199084353782436,
                0.013152928452401121,
                -0.5777136380242212,
                -0.07249330511896485,
                -0.5136829538950807,
                -0.08190747762151349
              ],
              "variance": 0.6011239404540223,
              "mean_reward": -0.17997041430794167,
              "min_reward": -0.5777136380242212,
              "max_reward": 0.13484238958961164,
              "num_responses": 7,
              "rvariance": 0.06106548451756395
            },
            {
              "id": "chat_hard_sample_175",
              "rewards": [
                -0.46536794795243097,
                -0.3079341768266911,
                -0.45613266434750344,
                -0.2379274493950869,
                -0.2819133440153068,
                0.006364383318161681,
                -0.3839434923649222
              ],
              "variance": 0.3196160614796871,
              "mean_reward": -0.30383638451196854,
              "min_reward": -0.46536794795243097,
              "max_reward": 0.006364383318161681,
              "num_responses": 7,
              "rvariance": 0.022395666752134998
            },
            {
              "id": "chat_hard_sample_200",
              "rewards": [
                1.5336990367256254,
                1.6145905765165114,
                1.334763329882278,
                1.5553887385012197
              ],
              "variance": 0.20238598317664147,
              "mean_reward": 1.5096104204064087,
              "min_reward": 1.334763329882278,
              "max_reward": 1.6145905765165114,
              "num_responses": 4,
              "rvariance": 0.011067063521354798
            },
            {
              "id": "chat_hard_sample_240",
              "rewards": [
                0.19605182268497987,
                0.38753276751568927,
                -0.3441424438271151,
                0.19666754672937237
              ],
              "variance": 0.5123573651532808,
              "mean_reward": 0.10902742327573159,
              "min_reward": -0.3441424438271151,
              "max_reward": 0.38753276751568927,
              "num_responses": 4,
              "rvariance": 0.07454554813793471
            },
            {
              "id": "chat_hard_sample_130",
              "rewards": [
                0.9041615956014891,
                0.7435355232446532,
                0.947298056488489,
                0.8366466173954583,
                0.8698789810248119,
                0.918936087362109,
                0.8072390138094352
              ],
              "variance": 0.14852325742913863,
              "mean_reward": 0.8610994107037779,
              "min_reward": 0.7435355232446532,
              "max_reward": 0.947298056488489,
              "num_responses": 7,
              "rvariance": 0.004289552773411761
            },
            {
              "id": "chat_hard_sample_374",
              "rewards": [
                -0.1337760249562617,
                -1.220153296624037,
                -1.0462063490649924,
                -0.3060287215365467,
                -0.19715001371284482,
                -0.30922217688956277,
                -0.09948706270902372
              ],
              "variance": 0.9957246880312437,
              "mean_reward": -0.47314623507046694,
              "min_reward": -1.220153296624037,
              "max_reward": -0.09948706270902372,
              "num_responses": 7,
              "rvariance": 0.18174057646415115
            },
            {
              "id": "chat_hard_sample_257",
              "rewards": [
                0.08173085294687707,
                0.6915527178398116,
                0.1452144832858731,
                0.29478522176972705,
                0.3102429537070674,
                0.3625252537501843,
                0.07385627908578973
              ],
              "variance": 0.41555521598359324,
              "mean_reward": 0.2799868231979043,
              "min_reward": 0.07385627908578973,
              "max_reward": 0.6915527178398116,
              "num_responses": 7,
              "rvariance": 0.03961318839222883
            },
            {
              "id": "chat_hard_sample_237",
              "rewards": [
                -0.4031861671393483,
                -1.4585544910569117,
                0.29932322915970144,
                -0.16555130966144366,
                0.32309467834874084,
                -0.0053476459273775635,
                -0.21632805765974328
              ],
              "variance": 1.134165305541691,
              "mean_reward": -0.2323642519909117,
              "min_reward": -1.4585544910569117,
              "max_reward": 0.32309467834874084,
              "num_responses": 7,
              "rvariance": 0.3114580711717175
            },
            {
              "id": "chat_hard_sample_22",
              "rewards": [
                -0.07999278935600801,
                0.4168705467255442,
                0.298580551704094,
                0.43375246511233223,
                0.2858407768886737
              ],
              "variance": 0.36065906061575237,
              "mean_reward": 0.2710103102149272,
              "min_reward": -0.07999278935600801,
              "max_reward": 0.43375246511233223,
              "num_responses": 5,
              "rvariance": 0.034388690888304
            },
            {
              "id": "chat_hard_sample_292",
              "rewards": [
                -0.02540974726510014,
                -0.8147021872268497,
                -0.5784903620764726,
                -0.9856599590127422,
                -0.35103024344648626,
                -0.7868070604171646,
                -1.2659373131958285
              ],
              "variance": 0.8769888557120449,
              "mean_reward": -0.6868624103772348,
              "min_reward": -1.2659373131958285,
              "max_reward": -0.02540974726510014,
              "num_responses": 7,
              "rvariance": 0.14471243292827937
            },
            {
              "id": "chat_hard_sample_92",
              "rewards": [
                0.5973982974732037,
                -0.1550511084320471,
                0.5897874404708674,
                -0.18248227822983748,
                -0.19507317131756025,
                -0.12234156203251513
              ],
              "variance": 0.7823705937457344,
              "mean_reward": 0.08870626965535187,
              "min_reward": -0.19507317131756025,
              "max_reward": 0.5973982974732037,
              "num_responses": 6,
              "rvariance": 0.12798046086107592
            },
            {
              "id": "chat_hard_sample_407",
              "rewards": [
                1.595117077358058,
                1.383358787451521,
                1.6772683412247726,
                1.2153070946605307,
                1.3287815159702137
              ],
              "variance": 0.38371097249368313,
              "mean_reward": 1.439966563333019,
              "min_reward": 1.2153070946605307,
              "max_reward": 1.6772683412247726,
              "num_responses": 5,
              "rvariance": 0.029284449540868996
            },
            {
              "id": "chat_hard_sample_44",
              "rewards": [
                -2.0687745280122933,
                -1.9732651685114457,
                -2.2318935037166225,
                -2.1913688207348905,
                -1.858367137813275,
                -2.430536352122735
              ],
              "variance": 0.4153987747573187,
              "mean_reward": -2.1257009184852103,
              "min_reward": -2.430536352122735,
              "max_reward": -1.858367137813275,
              "num_responses": 6,
              "rvariance": 0.034409733705945265
            },
            {
              "id": "chat_hard_sample_119",
              "rewards": [
                0.011771444513998435,
                -0.19185143997750084,
                -0.23260117673365965,
                0.3551561852901165,
                0.05921624252886568
              ],
              "variance": 0.4530814902168123,
              "mean_reward": 0.00033825112436402653,
              "min_reward": -0.23260117673365965,
              "max_reward": 0.3551561852901165,
              "num_responses": 5,
              "rvariance": 0.04413815132104385
            },
            {
              "id": "chat_hard_sample_303",
              "rewards": [
                -0.020281983573936277,
                -0.3872085032769867,
                0.1640716813389738,
                -0.2825492651933017,
                0.09744479995048759,
                -0.42618435464189663,
                0.05264005582793125
              ],
              "variance": 0.5268943963288327,
              "mean_reward": -0.11458108136696123,
              "min_reward": -0.42618435464189663,
              "max_reward": 0.1640716813389738,
              "num_responses": 7,
              "rvariance": 0.05129902670747185
            },
            {
              "id": "chat_hard_sample_365",
              "rewards": [
                -1.5638548438672322,
                -1.7110698752468487,
                -1.336412037066048,
                -2.107656895501672,
                -2.165401077531832
              ],
              "variance": 0.7149142449332464,
              "mean_reward": -1.7768789458427268,
              "min_reward": -2.165401077531832,
              "max_reward": -1.336412037066048,
              "num_responses": 5,
              "rvariance": 0.1008169396630529
            },
            {
              "id": "chat_hard_sample_45",
              "rewards": [
                0.33401844232282724,
                0.5088125153712515,
                0.3772149175496742,
                0.3734709460407533,
                0.38168540880732066,
                0.4451488420127143,
                -0.13315049087554803
              ],
              "variance": 0.323463442312652,
              "mean_reward": 0.3267429401755705,
              "min_reward": -0.13315049087554803,
              "max_reward": 0.5088125153712515,
              "num_responses": 7,
              "rvariance": 0.03806768436411532
            },
            {
              "id": "chat_hard_sample_78",
              "rewards": [
                -1.661547513510497,
                -1.5095886082434018,
                -1.1683268747393736,
                -0.7956626379103675
              ],
              "variance": 0.7084979329712991,
              "mean_reward": -1.2837814086009098,
              "min_reward": -1.661547513510497,
              "max_reward": -0.7956626379103675,
              "num_responses": 4,
              "rvariance": 0.11132145127964406
            },
            {
              "id": "chat_hard_sample_189",
              "rewards": [
                1.858168007761196,
                1.5546466381065722,
                1.3375193730275627,
                1.733155252554954
              ],
              "variance": 0.4180066286480577,
              "mean_reward": 1.6208723178625712,
              "min_reward": 1.3375193730275627,
              "max_reward": 1.858168007761196,
              "num_responses": 4,
              "rvariance": 0.03839785846835342
            },
            {
              "id": "chat_hard_sample_39",
              "rewards": [
                0.2250312470386326,
                0.21965246182983916,
                0.4594980398457641,
                0.09085938027419208,
                0.5243060250881161
              ],
              "variance": 0.3560062180947244,
              "mean_reward": 0.3038694308153088,
              "min_reward": 0.09085938027419208,
              "max_reward": 0.5243060250881161,
              "num_responses": 5,
              "rvariance": 0.026298758952236434
            },
            {
              "id": "chat_hard_sample_387",
              "rewards": [
                -0.2587616582973804,
                -0.9339310604303305,
                -0.7190831861435893,
                -0.973540524729395,
                -0.8182580368627884,
                -0.9734851268772284,
                -0.40252600940103056
              ],
              "variance": 0.6284870170585246,
              "mean_reward": -0.7256550861059632,
              "min_reward": -0.973540524729395,
              "max_reward": -0.2587616582973804,
              "num_responses": 7,
              "rvariance": 0.07103802439599996
            },
            {
              "id": "chat_hard_sample_118",
              "rewards": [
                0.2998899030224882,
                0.30754519371874967,
                0.09514867439037719,
                0.1222913137081336,
                0.15759359500125092,
                0.21276062278374755
              ],
              "variance": 0.19499755432136354,
              "mean_reward": 0.19920488377079118,
              "min_reward": 0.09514867439037719,
              "max_reward": 0.30754519371874967,
              "num_responses": 6,
              "rvariance": 0.006755624207497944
            },
            {
              "id": "chat_hard_sample_154",
              "rewards": [
                1.1656856227042869,
                1.2769268180985072,
                1.3321711720496527,
                1.3140306837089566,
                1.3404000613402218,
                1.1343552519993174,
                1.3904808738206795
              ],
              "variance": 0.20727891191010572,
              "mean_reward": 1.2791500691030888,
              "min_reward": 1.1343552519993174,
              "max_reward": 1.3904808738206795,
              "num_responses": 7,
              "rvariance": 0.007716952394685566
            },
            {
              "id": "chat_hard_sample_103",
              "rewards": [
                0.37834480290948724,
                0.4536074015653904,
                0.18750958929309391,
                -0.06690100735494628,
                0.40482670742796584,
                0.22795925435001738,
                0.016221738638042514
              ],
              "variance": 0.44136634484208864,
              "mean_reward": 0.22879549811843586,
              "min_reward": -0.06690100735494628,
              "max_reward": 0.4536074015653904,
              "num_responses": 7,
              "rvariance": 0.034031660755125405
            },
            {
              "id": "chat_hard_sample_162",
              "rewards": [
                1.276960287634191,
                0.6375709732692946,
                0.9174709295844965,
                0.6977768973551046
              ],
              "variance": 0.5134807297242451,
              "mean_reward": 0.8824447719607716,
              "min_reward": 0.6375709732692946,
              "max_reward": 1.276960287634191,
              "num_responses": 4,
              "rvariance": 0.0627336812554786
            },
            {
              "id": "chat_hard_sample_321",
              "rewards": [
                0.7317992574387912,
                0.09231992156412408,
                0.5937178026698903,
                0.7604699541788075,
                0.4830213528219743,
                0.4055278364944484,
                0.45075210393497417
              ],
              "variance": 0.46302286561247896,
              "mean_reward": 0.50251546130043,
              "min_reward": 0.09231992156412408,
              "max_reward": 0.7604699541788075,
              "num_responses": 7,
              "rvariance": 0.0440222703221727
            },
            {
              "id": "chat_hard_sample_273",
              "rewards": [
                1.5787043095318054,
                1.5787043095318054,
                1.5787043095318054,
                1.1871240144317716,
                1.5787043095318054,
                1.1871240144317716,
                1.5787043095318054
              ],
              "variance": 0.3915802951000338,
              "mean_reward": 1.4668242252175099,
              "min_reward": 1.1871240144317716,
              "max_reward": 1.5787043095318054,
              "num_responses": 7,
              "rvariance": 0.0312928831654346
            },
            {
              "id": "chat_hard_sample_291",
              "rewards": [
                0.9583262684963477,
                0.7829124319768104,
                0.7193578231397261,
                0.7591173232884082,
                0.879594379348516,
                0.7295492967554862,
                1.096708372025444
              ],
              "variance": 0.28820640259880415,
              "mean_reward": 0.8465094135758199,
              "min_reward": 0.7193578231397261,
              "max_reward": 1.096708372025444,
              "num_responses": 7,
              "rvariance": 0.016818041743448246
            },
            {
              "id": "chat_hard_sample_312",
              "rewards": [
                -0.7921333330785919,
                -0.2639517445722316,
                -1.2801953353971876,
                -0.9949794935178398,
                -0.5526449557969491,
                -1.5925999814710974,
                -0.6094796897540421
              ],
              "variance": 0.9679895225196895,
              "mean_reward": -0.8694263619411341,
              "min_reward": -1.5925999814710974,
              "max_reward": -0.2639517445722316,
              "num_responses": 7,
              "rvariance": 0.17828161123364583
            },
            {
              "id": "chat_hard_sample_314",
              "rewards": [
                -1.0248308569821551,
                -1.5898398988990923,
                -1.374225110596421,
                -1.1965491951134173,
                -1.5071868805275987,
                -2.057989258668623
              ],
              "variance": 0.7132245527360714,
              "mean_reward": -1.4584368667978846,
              "min_reward": -2.057989258668623,
              "max_reward": -1.0248308569821551,
              "num_responses": 6,
              "rvariance": 0.10713288924885439
            },
            {
              "id": "chat_hard_sample_399",
              "rewards": [
                -0.7741094110518294,
                -1.2326524370191088,
                -1.303363178821996,
                -1.329781029573907,
                -1.1414883465475731,
                -1.2273861786975286,
                -1.3461545572548752
              ],
              "variance": 0.34179366829701885,
              "mean_reward": -1.1935621627095454,
              "min_reward": -1.3461545572548752,
              "max_reward": -0.7741094110518294,
              "num_responses": 7,
              "rvariance": 0.03360295550118109
            },
            {
              "id": "chat_hard_sample_219",
              "rewards": [
                -1.0483299333980425,
                -2.0282233002263976,
                -1.684866258376363,
                -1.3821458493343137,
                -1.8936896162399945,
                -1.7490446701112807,
                -2.0232305687998897
              ],
              "variance": 0.7766081784106875,
              "mean_reward": -1.6870757423551832,
              "min_reward": -2.0282233002263976,
              "max_reward": -1.0483299333980425,
              "num_responses": 7,
              "rvariance": 0.11098492777285389
            },
            {
              "id": "chat_hard_sample_406",
              "rewards": [
                -0.33717385567333447,
                -0.7240020537672086,
                -0.38666029536492214,
                -0.5096423730526849,
                -0.17302540321624382,
                -0.2198192764681544,
                0.0035240892727071995
              ],
              "variance": 0.492980639117831,
              "mean_reward": -0.33525702403854873,
              "min_reward": -0.7240020537672086,
              "max_reward": 0.0035240892727071995,
              "num_responses": 7,
              "rvariance": 0.04837093339017997
            },
            {
              "id": "chat_hard_sample_253",
              "rewards": [
                0.7438171289931664,
                0.4672860545628413,
                0.38069286395600377,
                0.6904828468198456,
                0.7507274339899802,
                0.6926468254201005,
                0.49028193382154933
              ],
              "variance": 0.3139324726717857,
              "mean_reward": 0.6022764410804982,
              "min_reward": 0.38069286395600377,
              "max_reward": 0.7507274339899802,
              "num_responses": 7,
              "rvariance": 0.01969758510991317
            },
            {
              "id": "chat_hard_sample_24",
              "rewards": [
                0.3312808651282649,
                0.8260783229727737,
                0.783393123756547,
                0.70911614522044,
                0.7806145752338198,
                0.748144509132716
              ],
              "variance": 0.28453721819030797,
              "mean_reward": 0.6964379235740936,
              "min_reward": 0.3312808651282649,
              "max_reward": 0.8260783229727737,
              "num_responses": 6,
              "rvariance": 0.027937922384453025
            },
            {
              "id": "chat_hard_sample_60",
              "rewards": [
                0.385220484248697,
                0.15798426527121692,
                0.2994172900961925,
                0.3145414807986136,
                0.33180137411424615,
                0.40838717355158516,
                0.29706230431815517
              ],
              "variance": 0.1530560712704724,
              "mean_reward": 0.31348776748552953,
              "min_reward": 0.15798426527121692,
              "max_reward": 0.40838717355158516,
              "num_responses": 7,
              "rvariance": 0.005591013114365115
            },
            {
              "id": "chat_hard_sample_386",
              "rewards": [
                0.340639639778647,
                -0.02021735274640867,
                -0.19978256581267484,
                0.21762697786000063,
                -0.17952426374852914,
                -0.0191578688237239
              ],
              "variance": 0.4687867235999258,
              "mean_reward": 0.023264094417885173,
              "min_reward": -0.19978256581267484,
              "max_reward": 0.340639639778647,
              "num_responses": 6,
              "rvariance": 0.03884455955226414
            },
            {
              "id": "chat_hard_sample_216",
              "rewards": [
                -1.5886725045768748,
                -0.646358501590065,
                -0.8539042464881063,
                -0.646358501590065,
                -0.6855317078033182,
                -1.0148488564948996
              ],
              "variance": 0.6554021789458222,
              "mean_reward": -0.9059457197572215,
              "min_reward": -1.5886725045768748,
              "max_reward": -0.646358501590065,
              "num_responses": 6,
              "rvariance": 0.1106729091964413
            },
            {
              "id": "chat_hard_sample_300",
              "rewards": [
                1.078680987632921,
                0.7340036303062507,
                0.9148845423614719,
                1.3309679999479112,
                0.8697243286875137,
                1.004777944598938,
                1.1173706167616373
              ],
              "variance": 0.3873735207011384,
              "mean_reward": 1.0072014357566634,
              "min_reward": 0.7340036303062507,
              "max_reward": 1.3309679999479112,
              "num_responses": 7,
              "rvariance": 0.03201952012207106
            },
            {
              "id": "chat_hard_sample_352",
              "rewards": [
                0.2178185620987432,
                0.4107421593296225,
                0.2433869791174342,
                0.47321131650081905,
                0.7336048811828438,
                0.5253049176099938
              ],
              "variance": 0.39885212878833015,
              "mean_reward": 0.434011469306576,
              "min_reward": 0.2178185620987432,
              "max_reward": 0.7336048811828438,
              "num_responses": 6,
              "rvariance": 0.030540977389415372
            },
            {
              "id": "chat_hard_sample_311",
              "rewards": [
                -1.016873186342818,
                -0.713408368662281,
                -0.7664910522570122,
                -0.5261705530709513,
                -0.7041061459859855,
                -0.8312165177820745,
                -0.7672400773831805
              ],
              "variance": 0.2725472763864002,
              "mean_reward": -0.7607865573549003,
              "min_reward": -1.016873186342818,
              "max_reward": -0.5261705530709513,
              "num_responses": 7,
              "rvariance": 0.018730994473988738
            },
            {
              "id": "chat_hard_sample_419",
              "rewards": [
                0.364551891841943,
                0.17571446326930487,
                0.14292643657920365,
                0.7981716549438874,
                0.2389499573954717,
                0.4326081532285175,
                -0.2589151565127585
              ],
              "variance": 0.5966437545722467,
              "mean_reward": 0.2705724858207957,
              "min_reward": -0.2589151565127585,
              "max_reward": 0.7981716549438874,
              "num_responses": 7,
              "rvariance": 0.08858532507786464
            },
            {
              "id": "chat_hard_sample_287",
              "rewards": [
                0.3208262517147137,
                0.0008153651261482119,
                0.49582287316012186,
                -0.044667425624487986,
                0.06021455798978325,
                0.20815913868816566,
                0.5753984254315729
              ],
              "variance": 0.5450308452428085,
              "mean_reward": 0.23093845521228823,
              "min_reward": -0.044667425624487986,
              "max_reward": 0.5753984254315729,
              "num_responses": 7,
              "rvariance": 0.05078243234312146
            },
            {
              "id": "chat_hard_sample_55",
              "rewards": [
                -1.4089370585273886,
                -1.2865822461032197,
                -1.5720923890722023,
                -1.5440783877047433,
                -1.2792628048857178,
                -1.753216820852572,
                -1.7272029127727087
              ],
              "variance": 0.4539540063884351,
              "mean_reward": -1.5101960885597931,
              "min_reward": -1.753216820852572,
              "max_reward": -1.2792628048857178,
              "num_responses": 7,
              "rvariance": 0.03210241764305024
            }
          ]
        },
        "semantic_benchmark_reasoning_filtered.json": {
          "file_name": "semantic_benchmark_reasoning_filtered.json",
          "processed_samples": 200,
          "global_mean": 8.612559587291281,
          "global_std": 2.8754288136519097,
          "mean_variance": 0.6539074694172291,
          "mean_rvariance": 0.13691976699989628,
          "sample_results": [
            {
              "id": "reasoning_sample_9",
              "rewards": [
                1.9919576386114668,
                2.041868327583259,
                2.0369351671047666,
                0.12022156469156843,
                0.6302839577660604,
                2.0212846375458646,
                2.1157572808493628
              ],
              "variance": 1.645164908353437,
              "mean_reward": 1.5654726534503354,
              "min_reward": 0.12022156469156843,
              "max_reward": 2.1157572808493628,
              "num_responses": 7,
              "rvariance": 0.5864322178246649
            },
            {
              "id": "reasoning_sample_5",
              "rewards": [
                1.1330948636345715,
                -1.7544961626303501,
                1.0357738955906337,
                0.8674381687613385,
                0.3393140536660214
              ],
              "variance": 2.0111385525287977,
              "mean_reward": 0.324224963804443,
              "min_reward": -1.7544961626303501,
              "max_reward": 1.1330948636345715,
              "num_responses": 5,
              "rvariance": 1.1553924370671997
            },
            {
              "id": "reasoning_sample_85",
              "rewards": [
                1.1429867226685262,
                0.627788522816472,
                -1.0333075022791942,
                1.5585386628190714
              ],
              "variance": 1.9688517755244024,
              "mean_reward": 0.5740016015062188,
              "min_reward": -1.0333075022791942,
              "max_reward": 1.5585386628190714,
              "num_responses": 4,
              "rvariance": 0.969848220304534
            },
            {
              "id": "reasoning_sample_65",
              "rewards": [
                2.1627652522934047,
                2.1907115367547645,
                -0.10555493551880375,
                -0.5910198488483094,
                2.0973715237480293,
                -0.6180795972091576,
                1.9512406573486842
              ],
              "variance": 2.775787514270597,
              "mean_reward": 1.0124906555098019,
              "min_reward": -0.6180795972091576,
              "max_reward": 2.1907115367547645,
              "num_responses": 7,
              "rvariance": 1.6070836267837783
            },
            {
              "id": "reasoning_sample_256",
              "rewards": [
                -1.0030571526138483,
                -2.245519753492432,
                -1.5521337673775997,
                -2.4425085393548005
              ],
              "variance": 1.215631766553116,
              "mean_reward": -1.81080480320967,
              "min_reward": -2.4425085393548005,
              "max_reward": -1.0030571526138483,
              "num_responses": 4,
              "rvariance": 0.32684841752014165
            },
            {
              "id": "reasoning_sample_263",
              "rewards": [
                0.07401157523698851,
                -0.010915465556660675,
                -1.0379547689609636,
                -0.09778870681338601,
                -1.913873662720094,
                -0.3483630114244532
              ],
              "variance": 1.5074622706806928,
              "mean_reward": -0.5558140067064282,
              "min_reward": -1.913873662720094,
              "max_reward": 0.07401157523698851,
              "num_responses": 6,
              "rvariance": 0.5038672530870738
            },
            {
              "id": "reasoning_sample_203",
              "rewards": [
                -0.280754103449479,
                -1.9503801779162862,
                -0.9065325082426859,
                -2.5846707222604217,
                -2.5846707222604217,
                -0.9065325082426859
              ],
              "variance": 1.9910274164143393,
              "mean_reward": -1.5355901237286635,
              "min_reward": -2.5846707222604217,
              "max_reward": -0.280754103449479,
              "num_responses": 6,
              "rvariance": 0.7898718997460641
            },
            {
              "id": "reasoning_sample_61",
              "rewards": [
                0.5306045317308251,
                0.4191616704494437,
                -1.2054991470675425,
                0.816604460721935,
                0.1015170791231221,
                -0.019150002894297833,
                0.3631835323857092
              ],
              "variance": 1.1386941638908648,
              "mean_reward": 0.14377458920702788,
              "min_reward": -1.2054991470675425,
              "max_reward": 0.816604460721935,
              "num_responses": 7,
              "rvariance": 0.3678836435097067
            },
            {
              "id": "reasoning_sample_319",
              "rewards": [
                0.5215640524836319,
                -0.018755986849625976,
                -2.0233603736382815,
                0.17473773076463495,
                0.004575865600353845,
                -0.09261608540538742
              ],
              "variance": 1.4061391211459677,
              "mean_reward": -0.2389757995074457,
              "min_reward": -2.0233603736382815,
              "max_reward": 0.5215640524836319,
              "num_responses": 6,
              "rvariance": 0.6771405675614575
            },
            {
              "id": "reasoning_sample_528",
              "rewards": [
                -0.5233320049990658,
                -0.9907604027213787,
                -0.9622771553169852,
                -1.2766886924316392,
                -0.5233320049990658,
                -0.5233320049990658,
                -1.6001811717206327
              ],
              "variance": 0.8827536791481708,
              "mean_reward": -0.9142719195982618,
              "min_reward": -1.6001811717206327,
              "max_reward": -0.5233320049990658,
              "num_responses": 7,
              "rvariance": 0.15263920865219932
            },
            {
              "id": "reasoning_sample_551",
              "rewards": [
                -0.566651880132711,
                -1.1734551620742626,
                -0.9237305789332706,
                -0.4014417485938094,
                -1.7079107302779852,
                -1.4582690629713098,
                -1.0424017109870245
              ],
              "variance": 1.0575579023768298,
              "mean_reward": -1.0391229819957677,
              "min_reward": -1.7079107302779852,
              "max_reward": -0.4014417485938094,
              "num_responses": 7,
              "rvariance": 0.1834568683330379
            },
            {
              "id": "reasoning_sample_596",
              "rewards": [
                -2.0034506235022107,
                -2.0526362964187403,
                -0.7138778988717077,
                -0.7138778988717077,
                -2.0526362964187403,
                -1.6402713092759826,
                -2.2017053683229233
              ],
              "variance": 1.3983860263087058,
              "mean_reward": -1.6254936702402873,
              "min_reward": -2.2017053683229233,
              "max_reward": -0.7138778988717077,
              "num_responses": 7,
              "rvariance": 0.3574397190792703
            },
            {
              "id": "reasoning_sample_456",
              "rewards": [
                0.16455500298389802,
                0.2874515259544192,
                -0.9678995122103163,
                -0.47770905965144655
              ],
              "variance": 1.0714249455059182,
              "mean_reward": -0.24840051073086145,
              "min_reward": -0.9678995122103163,
              "max_reward": 0.2874515259544192,
              "num_responses": 4,
              "rvariance": 0.2569827213162953
            },
            {
              "id": "reasoning_sample_306",
              "rewards": [
                -0.35030788523418027,
                -1.570753347131706,
                -1.3905692792419246,
                -1.289368845141988,
                -1.1494427364562132,
                -0.15065650610024112,
                -0.5761255116983734
              ],
              "variance": 1.1921955728172324,
              "mean_reward": -0.9253177301435181,
              "min_reward": -1.570753347131706,
              "max_reward": -0.15065650610024112,
              "num_responses": 7,
              "rvariance": 0.2669261302290307
            },
            {
              "id": "reasoning_sample_231",
              "rewards": [
                -0.05193094382298245,
                -1.5991171957346837,
                -0.21272066640280443,
                -0.6608628410631066,
                -0.6401219426038477,
                -0.3475358430613121,
                -0.24741596811418767
              ],
              "variance": 0.8877598055608618,
              "mean_reward": -0.537100771543275,
              "min_reward": -1.5991171957346837,
              "max_reward": -0.05193094382298245,
              "num_responses": 7,
              "rvariance": 0.2306105226542902
            },
            {
              "id": "reasoning_sample_526",
              "rewards": [
                0.23051023755926459,
                -0.009950988571891507,
                -0.6072945688079459,
                -0.027848868904107222,
                -1.318177122616902
              ],
              "variance": 1.1681498482001218,
              "mean_reward": -0.34655226226831637,
              "min_reward": -1.318177122616902,
              "max_reward": 0.23051023755926459,
              "num_responses": 5,
              "rvariance": 0.3119829637540377
            },
            {
              "id": "reasoning_sample_591",
              "rewards": [
                0.3882473307828914,
                0.00010902377405703191,
                -0.40178203517784417,
                0.2851935619543131,
                0.2245668305554601
              ],
              "variance": 0.5880514348485437,
              "mean_reward": 0.09926694237777549,
              "min_reward": -0.40178203517784417,
              "max_reward": 0.3882473307828914,
              "num_responses": 5,
              "rvariance": 0.07893216109172478
            },
            {
              "id": "reasoning_sample_23",
              "rewards": [
                -0.49682878771814976,
                -0.3955374778638023,
                -1.2650579225203993,
                -0.8777096375809322,
                -0.9315982966198918,
                -0.7546718260287358
              ],
              "variance": 0.6521449767791696,
              "mean_reward": -0.7869006580553185,
              "min_reward": -1.2650579225203993,
              "max_reward": -0.3955374778638023,
              "num_responses": 6,
              "rvariance": 0.08269392888561575
            },
            {
              "id": "reasoning_sample_275",
              "rewards": [
                -0.11715519240301502,
                -1.6108739977140845,
                -1.07399861380167,
                -1.0692836877990983,
                -1.07399861380167,
                -0.6946002990564659
              ],
              "variance": 0.9365585600281368,
              "mean_reward": -0.9399850674293339,
              "min_reward": -1.6108739977140845,
              "max_reward": -0.11715519240301502,
              "num_responses": 6,
              "rvariance": 0.20666533983599264
            },
            {
              "id": "reasoning_sample_656",
              "rewards": [
                0.07119509017692668,
                -0.26778076034898696,
                -1.0814092994095388,
                -0.41088818376581604
              ],
              "variance": 0.8497552997355745,
              "mean_reward": -0.4222207883368538,
              "min_reward": -1.0814092994095388,
              "max_reward": 0.07119509017692668,
              "num_responses": 4,
              "rvariance": 0.17549221811775137
            },
            {
              "id": "reasoning_sample_405",
              "rewards": [
                0.19726297797838416,
                1.1698378547902342,
                1.2772291167435756,
                0.6567175257461507,
                0.7675421665668686,
                1.1953931782532443
              ],
              "variance": 0.8093208956361426,
              "mean_reward": 0.8773304700130763,
              "min_reward": 0.19726297797838416,
              "max_reward": 1.2772291167435756,
              "num_responses": 6,
              "rvariance": 0.14497645344220025
            },
            {
              "id": "reasoning_sample_330",
              "rewards": [
                -0.6395004055098115,
                -2.0845171030500853,
                -2.044137091737965,
                -1.489336631099679,
                -2.1717057561405504,
                -2.0845171030500853
              ],
              "variance": 1.0636929112905729,
              "mean_reward": -1.7522856817646961,
              "min_reward": -2.1717057561405504,
              "max_reward": -0.6395004055098115,
              "num_responses": 6,
              "rvariance": 0.2982131921944575
            },
            {
              "id": "reasoning_sample_451",
              "rewards": [
                -0.07861790259274387,
                -0.7240520034056757,
                -0.17900907814975175,
                -0.08445451400194874,
                -0.6320419603813765,
                -1.8148827697730228,
                -1.9615204177517098
              ],
              "variance": 1.7914179595262307,
              "mean_reward": -0.7820826637223185,
              "min_reward": -1.9615204177517098,
              "max_reward": -0.07861790259274387,
              "num_responses": 7,
              "rvariance": 0.546982099990397
            },
            {
              "id": "reasoning_sample_314",
              "rewards": [
                -0.34207467454989215,
                -0.4498135196806883,
                -0.26593936550048686,
                -1.681125599160393
              ],
              "variance": 1.022952017101173,
              "mean_reward": -0.6847382897228651,
              "min_reward": -1.681125599160393,
              "max_reward": -0.26593936550048686,
              "num_responses": 4,
              "rvariance": 0.3351970525201896
            },
            {
              "id": "reasoning_sample_593",
              "rewards": [
                -0.05843021858004455,
                0.09081363990287776,
                -0.6681368813760217,
                0.009544182392596662,
                -0.0786185659194184
              ],
              "variance": 0.4906354120921457,
              "mean_reward": -0.14096556871600202,
              "min_reward": -0.6681368813760217,
              "max_reward": 0.09081363990287776,
              "num_responses": 5,
              "rvariance": 0.07299672247964742
            },
            {
              "id": "reasoning_sample_599",
              "rewards": [
                0.4019841628857695,
                0.08087103637832134,
                0.010968344762816332,
                -1.7767136262671166,
                0.010968344762816332,
                0.010968344762816332,
                0.010968344762816332
              ],
              "variance": 0.9134207306304574,
              "mean_reward": -0.17856929256453719,
              "min_reward": -1.7767136262671166,
              "max_reward": 0.4019841628857695,
              "num_responses": 7,
              "rvariance": 0.44315928201678184
            },
            {
              "id": "reasoning_sample_301",
              "rewards": [
                -0.002640465291877077,
                -0.3045038517044138,
                -0.3045038517044138,
                -1.163897951347609,
                -0.26576424725841047,
                0.022347713864408526,
                -0.5383391076836722
              ],
              "variance": 0.795917451519884,
              "mean_reward": -0.36532882301799835,
              "min_reward": -1.163897951347609,
              "max_reward": 0.022347713864408526,
              "num_responses": 7,
              "rvariance": 0.1381133732024575
            },
            {
              "id": "reasoning_sample_77",
              "rewards": [
                0.4825053879071788,
                0.3928435213107219,
                0.9838224821046442,
                0.8418506739546134,
                0.9487242094384829,
                0.5813742287461363,
                0.9732291551123721
              ],
              "variance": 0.5308258446406848,
              "mean_reward": 0.7434785226534499,
              "min_reward": 0.3928435213107219,
              "max_reward": 0.9838224821046442,
              "num_responses": 7,
              "rvariance": 0.054240446769218555
            },
            {
              "id": "reasoning_sample_511",
              "rewards": [
                1.3833991942891042,
                0.6614974577628265,
                1.0313912962520024,
                1.0313912962520024,
                0.735149271742785,
                0.74806158878922,
                0.735149271742785
              ],
              "variance": 0.46650590931604174,
              "mean_reward": 0.9037199109758178,
              "min_reward": 0.6614974577628265,
              "max_reward": 1.3833991942891042,
              "num_responses": 7,
              "rvariance": 0.05748936157228015
            },
            {
              "id": "reasoning_sample_12",
              "rewards": [
                2.646040855933618,
                2.7517558913804177,
                1.6081813678143533,
                2.5940433412437485,
                2.5880806977663826,
                1.6393875712176995
              ],
              "variance": 1.0751139041409916,
              "mean_reward": 2.3045816208927037,
              "min_reward": 1.6081813678143533,
              "max_reward": 2.7517558913804177,
              "num_responses": 6,
              "rvariance": 0.23469591462139708
            },
            {
              "id": "reasoning_sample_543",
              "rewards": [
                0.46954862797355007,
                0.007190699351358009,
                0.23346602122097806,
                0.13893666348680725,
                0.2589165390694123,
                0.4274844302347936,
                0.4124129848627577
              ],
              "variance": 0.35807183149766864,
              "mean_reward": 0.2782794237428082,
              "min_reward": 0.007190699351358009,
              "max_reward": 0.46954862797355007,
              "num_responses": 7,
              "rvariance": 0.02458950262063681
            },
            {
              "id": "reasoning_sample_506",
              "rewards": [
                -0.24126162322788208,
                -1.1241898899567895,
                -0.9991010723269409,
                -1.0203315058720042,
                -0.7624035617470779,
                -0.8301053354564866,
                -0.5972484863221625
              ],
              "variance": 0.607021118421468,
              "mean_reward": -0.7963773535584776,
              "min_reward": -1.1241898899567895,
              "max_reward": -0.24126162322788208,
              "num_responses": 7,
              "rvariance": 0.07840157180427501
            },
            {
              "id": "reasoning_sample_531",
              "rewards": [
                0.5362288786041798,
                -0.22494312370772648,
                -0.11563352101163918,
                -0.1998322291166525,
                0.12198336033912476,
                0.18400705771454162,
                0.05290982706678443
              ],
              "variance": 0.5347723730234791,
              "mean_reward": 0.050674321412658915,
              "min_reward": -0.22494312370772648,
              "max_reward": 0.5362288786041798,
              "num_responses": 7,
              "rvariance": 0.0607153756374222
            },
            {
              "id": "reasoning_sample_274",
              "rewards": [
                0.9018223702623663,
                0.5816024131221752,
                0.7661637737371916,
                0.41796104916854127,
                0.0029672984146143482
              ],
              "variance": 0.6785941329361114,
              "mean_reward": 0.5341033809409776,
              "min_reward": 0.0029672984146143482,
              "max_reward": 0.9018223702623663,
              "num_responses": 5,
              "rvariance": 0.09738400369228353
            },
            {
              "id": "reasoning_sample_597",
              "rewards": [
                0.522935148719889,
                0.9086688965335458,
                0.9086688965335458,
                0.6840797510705855,
                0.9086688965335458,
                0.9086688965335458,
                -0.8636066491537127
              ],
              "variance": 0.9403504669630973,
              "mean_reward": 0.5682976909672778,
              "min_reward": -0.8636066491537127,
              "max_reward": 0.9086688965335458,
              "num_responses": 7,
              "rvariance": 0.36131764503611136
            },
            {
              "id": "reasoning_sample_73",
              "rewards": [
                1.9653509423693236,
                2.2284939608094185,
                2.0574455595446257,
                2.112901659515504,
                0.8379509764350412,
                2.266540388880536,
                2.437780159890931
              ],
              "variance": 0.8206453412890835,
              "mean_reward": 1.9866376639207686,
              "min_reward": 0.8379509764350412,
              "max_reward": 2.437780159890931,
              "num_responses": 7,
              "rvariance": 0.24018002009176434
            },
            {
              "id": "reasoning_sample_412",
              "rewards": [
                -0.3964468987345853,
                0.021924511446057268,
                0.021924511446057268,
                0.07231345895018722,
                -1.4642310431220011,
                0.021924511446057268
              ],
              "variance": 0.9774579561264154,
              "mean_reward": -0.2870984914280379,
              "min_reward": -1.4642310431220011,
              "max_reward": 0.07231345895018722,
              "num_responses": 6,
              "rvariance": 0.3022101195714448
            },
            {
              "id": "reasoning_sample_491",
              "rewards": [
                0.42624268270007015,
                0.20689580794593423,
                -0.44401604454528076,
                0.17873095734531608,
                -0.23219991752710384,
                0.214265367299982,
                -1.2733694057522822
              ],
              "variance": 1.0748136824880987,
              "mean_reward": -0.13192150750476633,
              "min_reward": -1.2733694057522822,
              "max_reward": 0.42624268270007015,
              "num_responses": 7,
              "rvariance": 0.29329382952308036
            },
            {
              "id": "reasoning_sample_64",
              "rewards": [
                0.9056733132713605,
                1.6196532709870426,
                1.391846659489266,
                1.9242187186082844,
                1.3497496270801201,
                1.678417049420473,
                1.9103850408109246
              ],
              "variance": 0.7437994103732521,
              "mean_reward": 1.5399919542382103,
              "min_reward": 0.9056733132713605,
              "max_reward": 1.9242187186082844,
              "num_responses": 7,
              "rvariance": 0.11011828386833485
            },
            {
              "id": "reasoning_sample_535",
              "rewards": [
                1.047405660491885,
                -0.5519193946913608,
                -0.41678781120910147,
                -0.1723161120037264,
                -0.48556483745792606,
                -0.48448427830511387
              ],
              "variance": 0.9562868903187227,
              "mean_reward": -0.17727779552922387,
              "min_reward": -0.5519193946913608,
              "max_reward": 1.047405660491885,
              "num_responses": 6,
              "rvariance": 0.31450204741160603
            },
            {
              "id": "reasoning_sample_548",
              "rewards": [
                -0.12984463168680743,
                -1.2682206641045668,
                -0.6074298874495504,
                -0.911946580560214,
                -0.5461869255700573,
                -0.5461869255700573,
                -0.5203039187298284
              ],
              "variance": 0.6903360100653353,
              "mean_reward": -0.6471599333815831,
              "min_reward": -1.2682206641045668,
              "max_reward": -0.12984463168680743,
              "num_responses": 7,
              "rvariance": 0.1087865061077035
            },
            {
              "id": "reasoning_sample_235",
              "rewards": [
                0.31767268924608577,
                -1.111330639044317,
                0.025556224989118605,
                0.10568940390592682,
                -0.2662809787378707
              ],
              "variance": 1.0061901500317607,
              "mean_reward": -0.1857386599282113,
              "min_reward": -1.111330639044317,
              "max_reward": 0.31767268924608577,
              "num_responses": 5,
              "rvariance": 0.2492412816366269
            },
            {
              "id": "reasoning_sample_156",
              "rewards": [
                0.3449214857091756,
                -0.5883944018705127,
                -0.1261585253564345,
                -0.7065408425247119,
                -0.5924287547050148,
                -0.1261585253564345
              ],
              "variance": 0.7588662787912339,
              "mean_reward": -0.29912659401732217,
              "min_reward": -0.7065408425247119,
              "max_reward": 0.3449214857091756,
              "num_responses": 6,
              "rvariance": 0.13505370442717415
            },
            {
              "id": "reasoning_sample_587",
              "rewards": [
                0.5179701485610189,
                0.3366909283315856,
                -0.9618924258457568,
                0.5186467417690412,
                0.3742511379502715,
                0.3742511379502715,
                0.38562520043846743
              ],
              "variance": 0.7009831991835791,
              "mean_reward": 0.2207918384506999,
              "min_reward": -0.9618924258457568,
              "max_reward": 0.5186467417690412,
              "num_responses": 7,
              "rvariance": 0.23763952998720872
            },
            {
              "id": "reasoning_sample_594",
              "rewards": [
                -0.020395067062393933,
                -0.4746650535420203,
                -0.5795668504858441,
                -1.0937159992021264,
                -0.8961076662257449,
                -0.4746650535420203,
                -0.764024068812959
              ],
              "variance": 0.6821939404661279,
              "mean_reward": -0.614734251267587,
              "min_reward": -1.0937159992021264,
              "max_reward": -0.020395067062393933,
              "num_responses": 7,
              "rvariance": 0.10351379076925411
            },
            {
              "id": "reasoning_sample_622",
              "rewards": [
                1.0682901691761801,
                1.0093804588743525,
                0.3278746535003841,
                0.2924019329264496,
                0.4830247726933371,
                0.7727804573156458,
                0.4830247726933371
              ],
              "variance": 0.7192587777242732,
              "mean_reward": 0.6338253167399552,
              "min_reward": 0.2924019329264496,
              "max_reward": 1.0682901691761801,
              "num_responses": 7,
              "rvariance": 0.08639532105704825
            },
            {
              "id": "reasoning_sample_647",
              "rewards": [
                0.7464563382368532,
                0.8858650521164932,
                0.8852335651223391,
                0.8852335651223391,
                -0.7415830640868754
              ],
              "variance": 1.0319797604762155,
              "mean_reward": 0.53224109130223,
              "min_reward": -0.7415830640868754,
              "max_reward": 0.8858650521164932,
              "num_responses": 5,
              "rvariance": 0.40855468593625555
            },
            {
              "id": "reasoning_sample_395",
              "rewards": [
                -0.22744121196401304,
                -0.3760356736325688,
                -0.778680271686738,
                0.17728888515488406,
                -0.7224368029531909,
                -0.22997379320737527
              ],
              "variance": 0.7254823739153999,
              "mean_reward": -0.35954647804816703,
              "min_reward": -0.778680271686738,
              "max_reward": 0.17728888515488406,
              "num_responses": 6,
              "rvariance": 0.10501125126998713
            },
            {
              "id": "reasoning_sample_252",
              "rewards": [
                0.5630849856759469,
                0.5850629883832074,
                0.710496072557138,
                0.710496072557138,
                0.4013831889186437,
                -0.7652220367871634
              ],
              "variance": 0.8924154964913977,
              "mean_reward": 0.36755021188415177,
              "min_reward": -0.7652220367871634,
              "max_reward": 0.710496072557138,
              "num_responses": 6,
              "rvariance": 0.26751450335041527
            },
            {
              "id": "reasoning_sample_497",
              "rewards": [
                0.09111412688644065,
                0.543929437968819,
                0.6521856779057498,
                1.1928310789728656,
                1.1245551960266496,
                1.1245551960266496,
                0.6521856779057498
              ],
              "variance": 0.7890622356692683,
              "mean_reward": 0.7687651988132748,
              "min_reward": 0.09111412688644065,
              "max_reward": 1.1928310789728656,
              "num_responses": 7,
              "rvariance": 0.13856408271112336
            },
            {
              "id": "reasoning_sample_87",
              "rewards": [
                0.7456921859077926,
                1.1832569534160113,
                1.224701272377418,
                1.2635761954650258,
                0.09477635345653045,
                1.1701463016938913,
                0.9758360289432819
              ],
              "variance": 0.7549253886851733,
              "mean_reward": 0.9511407558942786,
              "min_reward": 0.09477635345653045,
              "max_reward": 1.2635761954650258,
              "num_responses": 7,
              "rvariance": 0.1500673685006058
            },
            {
              "id": "reasoning_sample_299",
              "rewards": [
                0.4014919744932669,
                -0.28734491728762646,
                0.10260228156265605,
                -1.1184507875687408,
                0.15900693867811447,
                -0.30731702013110296,
                -0.06791579002584859
              ],
              "variance": 0.8877714801103336,
              "mean_reward": -0.1597039028970402,
              "min_reward": -1.1184507875687408,
              "max_reward": 0.4014919744932669,
              "num_responses": 7,
              "rvariance": 0.2072892078870836
            },
            {
              "id": "reasoning_sample_303",
              "rewards": [
                -0.62390559539157,
                -0.8097358999349656,
                -1.0164934977331634,
                -0.8097358999349656,
                -1.9124010775026337
              ],
              "variance": 0.8558003283859172,
              "mean_reward": -1.0344543940994595,
              "min_reward": -1.9124010775026337,
              "max_reward": -0.62390559539157,
              "num_responses": 5,
              "rvariance": 0.2081320184113041
            },
            {
              "id": "reasoning_sample_509",
              "rewards": [
                -0.15183059431416232,
                -0.10941151680453136,
                -0.5000784250966808,
                -0.40768298927447866,
                -0.7213648670471475,
                -0.895827079042418,
                0.033400062915456566
              ],
              "variance": 0.7388628669287196,
              "mean_reward": -0.3932564869519945,
              "min_reward": -0.895827079042418,
              "max_reward": 0.033400062915456566,
              "num_responses": 7,
              "rvariance": 0.09896308568854531
            },
            {
              "id": "reasoning_sample_572",
              "rewards": [
                0.8657450274245961,
                0.7806952711961587,
                1.1329502584195235,
                1.1840028642615223,
                1.0773638147570999,
                0.6601509046135271,
                0.9331854504242394
              ],
              "variance": 0.420893776193217,
              "mean_reward": 0.9477276558709524,
              "min_reward": 0.6601509046135271,
              "max_reward": 1.1840028642615223,
              "num_responses": 7,
              "rvariance": 0.032067393255111244
            },
            {
              "id": "reasoning_sample_557",
              "rewards": [
                0.5934189145022838,
                0.29772579281624145,
                0.29772579281624145,
                0.14816751748959112,
                0.27320326898547714,
                0.07185178358471313,
                0.007141613177442659
              ],
              "variance": 0.37003532606885353,
              "mean_reward": 0.24131924048171297,
              "min_reward": 0.007141613177442659,
              "max_reward": 0.5934189145022838,
              "num_responses": 7,
              "rvariance": 0.031941399083564595
            },
            {
              "id": "reasoning_sample_678",
              "rewards": [
                0.8357162288685438,
                0.06364643262075535,
                0.2542241661737747,
                -0.1602488731406448,
                -0.09507968067459834,
                -0.09507968067459834,
                0.12281185535561491
              ],
              "variance": 0.6079683489126995,
              "mean_reward": 0.1322843497898353,
              "min_reward": -0.1602488731406448,
              "max_reward": 0.8357162288685438,
              "num_responses": 7,
              "rvariance": 0.10049301576631789
            },
            {
              "id": "reasoning_sample_53",
              "rewards": [
                2.5381467923609815,
                2.4919902007037016,
                2.9093868523361195,
                3.2437612057208067,
                2.8385395835360816,
                3.057264921196181,
                2.9128878905242983
              ],
              "variance": 0.6121792793079619,
              "mean_reward": 2.8559967780540245,
              "min_reward": 2.4919902007037016,
              "max_reward": 3.2437612057208067,
              "num_responses": 7,
              "rvariance": 0.061541624416770475
            },
            {
              "id": "reasoning_sample_75",
              "rewards": [
                0.7421579813858875,
                -0.09753266271701676,
                -0.2358654607305663,
                -0.5339538550383428,
                1.0140854349768063,
                -0.8111653689185815
              ],
              "variance": 1.5506813201598089,
              "mean_reward": 0.012954344826364391,
              "min_reward": -0.8111653689185815,
              "max_reward": 1.0140854349768063,
              "num_responses": 6,
              "rvariance": 0.4310669932288385
            },
            {
              "id": "reasoning_sample_595",
              "rewards": [
                0.25967007817168036,
                0.5881308742529167,
                0.036871914729955754,
                0.4622546878603989,
                0.4976876088338615
              ],
              "variance": 0.425962387978649,
              "mean_reward": 0.3689230327697627,
              "min_reward": 0.036871914729955754,
              "max_reward": 0.5881308742529167,
              "num_responses": 5,
              "rvariance": 0.039107468947704914
            },
            {
              "id": "reasoning_sample_245",
              "rewards": [
                -0.6475671211987921,
                -1.5296881193647944,
                -1.2414089999199933,
                -1.0290038388148322,
                -1.4146248210938186
              ],
              "variance": 0.683520991811196,
              "mean_reward": -1.172458580078446,
              "min_reward": -1.5296881193647944,
              "max_reward": -0.6475671211987921,
              "num_responses": 5,
              "rvariance": 0.09742037976367994
            },
            {
              "id": "reasoning_sample_418",
              "rewards": [
                -1.833921571985433,
                -2.4623413435966253,
                -2.077793623877031,
                -2.1341606372037103,
                -2.077793623877031,
                -2.4623413435966253,
                -2.9954888315981716
              ],
              "variance": 0.6953555356768519,
              "mean_reward": -2.291977282247804,
              "min_reward": -2.9954888315981716,
              "max_reward": -1.833921571985433,
              "num_responses": 7,
              "rvariance": 0.12563524757871417
            },
            {
              "id": "reasoning_sample_60",
              "rewards": [
                0.2468201138326513,
                -0.5710921888920265,
                -0.35525630222618715,
                -0.2883969533934338,
                -0.1512495201472725,
                -0.05143809210380536
              ],
              "variance": 0.5608652564235298,
              "mean_reward": -0.19510215715501233,
              "min_reward": -0.5710921888920265,
              "max_reward": 0.2468201138326513,
              "num_responses": 6,
              "rvariance": 0.06559658068478541
            },
            {
              "id": "reasoning_sample_385",
              "rewards": [
                -0.10920323222872838,
                -0.2978984446794266,
                -0.12967614671147637,
                0.08149522677905573,
                -0.5998845465267517,
                -0.10345218996053811,
                -0.1507102355608782
              ],
              "variance": 0.3892196621536561,
              "mean_reward": -0.18704708126982053,
              "min_reward": -0.5998845465267517,
              "max_reward": 0.08149522677905573,
              "num_responses": 7,
              "rvariance": 0.03892818998235291
            },
            {
              "id": "reasoning_sample_243",
              "rewards": [
                0.25704330454053465,
                -0.6738673605173016,
                -0.365584961875321,
                -0.5194110810259087,
                -0.03715666880113676,
                -0.3494959733845534
              ],
              "variance": 0.706582538641304,
              "mean_reward": -0.28141212351061445,
              "min_reward": -0.6738673605173016,
              "max_reward": 0.25704330454053465,
              "num_responses": 6,
              "rvariance": 0.09533001155290828
            },
            {
              "id": "reasoning_sample_71",
              "rewards": [
                1.4360699855536232,
                1.286904731281633,
                1.6798325885439238,
                1.8356085564542977,
                1.8205039447485352,
                1.721464628954223,
                1.1515797880737477
              ],
              "variance": 0.5937710354323611,
              "mean_reward": 1.5617091748014265,
              "min_reward": 1.1515797880737477,
              "max_reward": 1.8356085564542977,
              "num_responses": 7,
              "rvariance": 0.06299705030546286
            },
            {
              "id": "reasoning_sample_218",
              "rewards": [
                0.337900172859257,
                0.04530876670332509,
                -0.009422980538964234,
                -0.2051468024330009,
                -0.4120888050467185,
                -0.1281451887466571,
                0.2298402776179875
              ],
              "variance": 0.5609878391929832,
              "mean_reward": -0.020250651369253022,
              "min_reward": -0.4120888050467185,
              "max_reward": 0.337900172859257,
              "num_responses": 7,
              "rvariance": 0.05637110256604623
            },
            {
              "id": "reasoning_sample_32",
              "rewards": [
                -0.15186707728126156,
                1.3084446067203652,
                1.3244782074338095,
                1.370377096678034
              ],
              "variance": 1.07038100198554,
              "mean_reward": 0.9628582083877368,
              "min_reward": -0.15186707728126156,
              "max_reward": 1.370377096678034,
              "num_responses": 4,
              "rvariance": 0.4147207723114473
            },
            {
              "id": "reasoning_sample_55",
              "rewards": [
                0.9253243660043635,
                1.0819935032819943,
                1.2593305730846853,
                -0.09001717149457202,
                0.4709515638901847,
                1.2693242527631807,
                0.48893899332346225
              ],
              "variance": 1.0167639752198014,
              "mean_reward": 0.7722637258361856,
              "min_reward": -0.09001717149457202,
              "max_reward": 1.2693242527631807,
              "num_responses": 7,
              "rvariance": 0.2168933778020534
            },
            {
              "id": "reasoning_sample_403",
              "rewards": [
                -0.1150677033582636,
                -1.4652976724146483,
                -1.5556732785129013,
                -1.7150985381232113,
                -1.6562760552790847,
                -1.5773574275033442,
                -1.5656059321373397
              ],
              "variance": 0.7545993636246413,
              "mean_reward": -1.378625229618399,
              "min_reward": -1.7150985381232113,
              "max_reward": -0.1150677033582636,
              "num_responses": 7,
              "rvariance": 0.2714566120061635
            },
            {
              "id": "reasoning_sample_580",
              "rewards": [
                0.7636570622341361,
                0.29500947008403394,
                0.2621814329614576,
                0.19550582561754953
              ],
              "variance": 0.4075542767683835,
              "mean_reward": 0.3790884477242943,
              "min_reward": 0.19550582561754953,
              "max_reward": 0.7636570622341361,
              "num_responses": 4,
              "rvariance": 0.05058303074684917
            },
            {
              "id": "reasoning_sample_530",
              "rewards": [
                -1.188316332890472,
                -1.8256406017805786,
                -1.4434782047826007,
                -1.4039717947008388,
                -1.369505340692169
              ],
              "variance": 0.41198370697023656,
              "mean_reward": -1.4461824549693318,
              "min_reward": -1.8256406017805786,
              "max_reward": -1.188316332890472,
              "num_responses": 5,
              "rvariance": 0.04363037095213257
            },
            {
              "id": "reasoning_sample_318",
              "rewards": [
                0.41779986078663,
                -0.28823244837814993,
                -0.29159418796467684,
                0.0978966421335278,
                -0.45932031758007735,
                -0.4837121660559589,
                -0.7420619859458872
              ],
              "variance": 0.8129100236066991,
              "mean_reward": -0.24988922900065605,
              "min_reward": -0.7420619859458872,
              "max_reward": 0.41779986078663,
              "num_responses": 7,
              "rvariance": 0.1301059726131083
            },
            {
              "id": "reasoning_sample_76",
              "rewards": [
                0.9108157533156678,
                1.6918149215926654,
                0.7444212519993898,
                0.8414274715362622,
                1.1403941103611188,
                0.9487623507222684,
                0.75153941054379
              ],
              "variance": 0.6122702877277078,
              "mean_reward": 1.004167895724452,
              "min_reward": 0.7444212519993898,
              "max_reward": 1.6918149215926654,
              "num_responses": 7,
              "rvariance": 0.09442490382357084
            },
            {
              "id": "reasoning_sample_393",
              "rewards": [
                -0.3055074649629803,
                -0.7362432843568948,
                -0.9087334261487823,
                -0.9197705186863161,
                -0.767093944662692,
                -0.5504633926407636
              ],
              "variance": 0.4862665436156772,
              "mean_reward": -0.6979686719097383,
              "min_reward": -0.9197705186863161,
              "max_reward": -0.3055074649629803,
              "num_responses": 6,
              "rvariance": 0.04594078275406993
            },
            {
              "id": "reasoning_sample_642",
              "rewards": [
                0.2067883490246601,
                -0.7934459234618149,
                -0.3014936752553887,
                -0.30868280975396384,
                -1.221659111512485,
                -0.8831515696187907
              ],
              "variance": 1.0050526774502737,
              "mean_reward": -0.5502741234296306,
              "min_reward": -1.221659111512485,
              "max_reward": 0.2067883490246601,
              "num_responses": 6,
              "rvariance": 0.21901656369520653
            },
            {
              "id": "reasoning_sample_16",
              "rewards": [
                0.06158680329633427,
                -0.8061274028255129,
                -0.23382175124633398,
                -0.09877507357841472,
                -0.018111896648655645,
                -0.08682524353672523
              ],
              "variance": 0.5417120303597628,
              "mean_reward": -0.19701242742321803,
              "min_reward": -0.8061274028255129,
              "max_reward": 0.06158680329633427,
              "num_responses": 6,
              "rvariance": 0.08217445580051376
            },
            {
              "id": "reasoning_sample_260",
              "rewards": [
                0.2841375458884585,
                -0.702666351418772,
                -0.19595840133738707,
                -0.34499264859115736,
                -0.10652073915692198,
                -0.20882295886325586,
                -0.256416647760909
              ],
              "variance": 0.5378047045834335,
              "mean_reward": -0.21874860017713502,
              "min_reward": -0.702666351418772,
              "max_reward": 0.2841375458884585,
              "num_responses": 7,
              "rvariance": 0.07394861596400329
            },
            {
              "id": "reasoning_sample_582",
              "rewards": [
                -0.22471493933168754,
                -0.4249513725925637,
                -0.4249513725925637,
                -0.22471493933168754,
                -0.5833968987045904
              ],
              "variance": 0.2953037489280922,
              "mean_reward": -0.37654590451061865,
              "min_reward": -0.5833968987045904,
              "max_reward": -0.22471493933168754,
              "num_responses": 5,
              "rvariance": 0.018715759290766108
            },
            {
              "id": "reasoning_sample_295",
              "rewards": [
                0.23244582479554823,
                -0.09520372276273578,
                -0.1723559116041983,
                0.028182335293589808,
                -0.2987501561295254,
                0.24409251454697672
              ],
              "variance": 0.4738222035381243,
              "mean_reward": -0.010264852643390785,
              "min_reward": -0.2987501561295254,
              "max_reward": 0.24409251454697672,
              "num_responses": 6,
              "rvariance": 0.04029937047113663
            },
            {
              "id": "reasoning_sample_366",
              "rewards": [
                -0.34935932808959985,
                -0.9026560271567223,
                -1.2599423472064104,
                -0.7511760944539535,
                -1.2642619305109613,
                -0.836359179343972,
                -0.9394441245262533
              ],
              "variance": 0.6712207926200188,
              "mean_reward": -0.900457004469696,
              "min_reward": -1.2642619305109613,
              "max_reward": -0.34935932808959985,
              "num_responses": 7,
              "rvariance": 0.08474436246828905
            },
            {
              "id": "reasoning_sample_286",
              "rewards": [
                0.03391016112817148,
                -0.2968251821200342,
                -1.110078278282801,
                -0.9248894106336776,
                -0.5352068791265333,
                -1.110078278282801,
                -0.7228042859308814
              ],
              "variance": 0.945547233462049,
              "mean_reward": -0.6665674504640796,
              "min_reward": -1.110078278282801,
              "max_reward": 0.03391016112817148,
              "num_responses": 7,
              "rvariance": 0.1582757649426271
            },
            {
              "id": "reasoning_sample_356",
              "rewards": [
                -0.44048913661679545,
                -1.3769584792072076,
                -0.6533088768935389,
                -0.22104276286147978,
                -0.5253544880297132,
                -0.5253544880297132
              ],
              "variance": 0.6843677283112356,
              "mean_reward": -0.6237513719397414,
              "min_reward": -1.3769584792072076,
              "max_reward": -0.22104276286147978,
              "num_responses": 6,
              "rvariance": 0.1305529594641727
            },
            {
              "id": "reasoning_sample_343",
              "rewards": [
                -0.2044118364776197,
                -0.8845830285824303,
                -0.3242948663657431,
                -0.7419896833383633,
                -0.7075829287304014
              ],
              "variance": 0.5751806420519345,
              "mean_reward": -0.5725724686989115,
              "min_reward": -0.8845830285824303,
              "max_reward": -0.2044118364776197,
              "num_responses": 5,
              "rvariance": 0.06829292507016393
            },
            {
              "id": "reasoning_sample_205",
              "rewards": [
                1.0695309217208917,
                0.6618662673938662,
                0.5897347981519345,
                0.5422220351085743,
                0.9852871074020103,
                0.9852871074020103,
                0.9852871074020103
              ],
              "variance": 0.4482549401949725,
              "mean_reward": 0.8313164777973283,
              "min_reward": 0.5422220351085743,
              "max_reward": 1.0695309217208917,
              "num_responses": 7,
              "rvariance": 0.04264538059656965
            },
            {
              "id": "reasoning_sample_512",
              "rewards": [
                0.8203240650493718,
                1.1983638867651347,
                1.3283908398235351,
                1.3283908398235351,
                1.1533770716983915,
                1.0554571196673517
              ],
              "variance": 0.3905002474651733,
              "mean_reward": 1.14738397047122,
              "min_reward": 0.8203240650493718,
              "max_reward": 1.3283908398235351,
              "num_responses": 6,
              "rvariance": 0.030596761711061796
            },
            {
              "id": "reasoning_sample_226",
              "rewards": [
                0.31300021615068413,
                0.25128562900559903,
                -1.0747999124245042,
                0.07995962552751472,
                0.3469048324660255,
                0.3820458897026941,
                0.3820458897026941
              ],
              "variance": 0.7639900793559868,
              "mean_reward": 0.09720602430438675,
              "min_reward": -1.0747999124245042,
              "max_reward": 0.3820458897026941,
              "num_responses": 7,
              "rvariance": 0.23840285777937273
            },
            {
              "id": "reasoning_sample_225",
              "rewards": [
                0.18832664101909238,
                0.2776674575050758,
                -0.008661481516601783,
                0.2776674575050758,
                0.05153010758375839,
                -0.3779354412284277
              ],
              "variance": 0.47096591887759054,
              "mean_reward": 0.06809912347799547,
              "min_reward": -0.3779354412284277,
              "max_reward": 0.2776674575050758,
              "num_responses": 6,
              "rvariance": 0.051234330817925854
            },
            {
              "id": "reasoning_sample_508",
              "rewards": [
                -0.8072510782121697,
                -1.7972422601905254,
                -1.5898836884252017,
                -1.3006639717559147,
                -1.7250033320273195
              ],
              "variance": 0.7637304532955753,
              "mean_reward": -1.4440088661222261,
              "min_reward": -1.7972422601905254,
              "max_reward": -0.8072510782121697,
              "num_responses": 5,
              "rvariance": 0.13020388470824423
            },
            {
              "id": "reasoning_sample_585",
              "rewards": [
                0.39902572591735785,
                -0.015412820409985949,
                0.4734390389196788,
                0.3982264172745471,
                0.6716317626963226
              ],
              "variance": 0.4423117985218379,
              "mean_reward": 0.3853820248795841,
              "min_reward": -0.015412820409985949,
              "max_reward": 0.6716317626963226,
              "num_responses": 5,
              "rvariance": 0.05013611742530065
            },
            {
              "id": "reasoning_sample_574",
              "rewards": [
                0.6316159177285202,
                0.4886610594468334,
                0.7215955178020778,
                0.5904498643070797,
                0.48277735184373677,
                0.5729698797798191,
                0.7279700871443279
              ],
              "variance": 0.23783776913338306,
              "mean_reward": 0.6022913825789136,
              "min_reward": 0.48277735184373677,
              "max_reward": 0.7279700871443279,
              "num_responses": 7,
              "rvariance": 0.00844056682619678
            },
            {
              "id": "reasoning_sample_520",
              "rewards": [
                -0.43587835290212523,
                -1.2652861068964383,
                -1.4325094348925438,
                -1.0983029031565132,
                -1.5145788643723102,
                -1.2687433655240978,
                -1.6250373488686864
              ],
              "variance": 0.7254291751161028,
              "mean_reward": -1.2343337680875306,
              "min_reward": -1.6250373488686864,
              "max_reward": -0.43587835290212523,
              "num_responses": 7,
              "rvariance": 0.13266253012382298
            },
            {
              "id": "reasoning_sample_238",
              "rewards": [
                0.6888636630473085,
                0.6814463441726945,
                0.4252198329679422,
                0.6223737871722693,
                0.25807146088605887
              ],
              "variance": 0.36096592577865066,
              "mean_reward": 0.5351950176492546,
              "min_reward": 0.25807146088605887,
              "max_reward": 0.6888636630473085,
              "num_responses": 5,
              "rvariance": 0.028299129580531702
            },
            {
              "id": "reasoning_sample_630",
              "rewards": [
                0.021976250926670743,
                -0.9100361997375627,
                -1.0738168622928483,
                -1.0581676593872953,
                -1.0738168622928483
              ],
              "variance": 0.7229881329538258,
              "mean_reward": -0.8187722665567769,
              "min_reward": -1.0738168622928483,
              "max_reward": 0.021976250926670743,
              "num_responses": 5,
              "rvariance": 0.18051856417741446
            },
            {
              "id": "reasoning_sample_233",
              "rewards": [
                -1.6964179323150481,
                -2.3114862646212653,
                -2.3114862646212653,
                -2.218628821770252,
                -2.2495972225607783,
                -2.4971540541294006,
                -2.29559959076623
              ],
              "variance": 0.376008914436349,
              "mean_reward": -2.2257671643977486,
              "min_reward": -2.4971540541294006,
              "max_reward": -1.6964179323150481,
              "num_responses": 7,
              "rvariance": 0.0534360538701505
            },
            {
              "id": "reasoning_sample_394",
              "rewards": [
                0.01783908245761621,
                -0.3720968398391992,
                -0.5030375253917669,
                -0.9035528448206893,
                -0.9035528448206893,
                -0.9043461835234293,
                -1.0572184389160402
              ],
              "variance": 0.7493726147600007,
              "mean_reward": -0.6608522278363141,
              "min_reward": -1.0572184389160402,
              "max_reward": 0.01783908245761621,
              "num_responses": 7,
              "rvariance": 0.1290156725406524
            },
            {
              "id": "reasoning_sample_284",
              "rewards": [
                0.1953360139888694,
                -0.7928495927814108,
                -0.30140080952095427,
                -0.041778729069274,
                -0.6936829182655885,
                -0.1319354373649315,
                -0.32875640157864366
              ],
              "variance": 0.7864167562259009,
              "mean_reward": -0.29929541065599047,
              "min_reward": -0.7928495927814108,
              "max_reward": 0.1953360139888694,
              "num_responses": 7,
              "rvariance": 0.10557058110630722
            },
            {
              "id": "reasoning_sample_207",
              "rewards": [
                0.35204627752032114,
                0.23612529785917585,
                0.04004792284761378,
                -0.3847544394426141,
                0.04004792284761378,
                -0.5063037459371613,
                0.04273903916618909
              ],
              "variance": 0.715867851764067,
              "mean_reward": -0.025721675019837402,
              "min_reward": -0.5063037459371613,
              "max_reward": 0.35204627752032114,
              "num_responses": 7,
              "rvariance": 0.08349632362609775
            },
            {
              "id": "reasoning_sample_345",
              "rewards": [
                0.47876289880947065,
                0.01574297016609588,
                0.40431708280009765,
                0.28579718922813696,
                0.022216375182851238,
                0.11484065870776686
              ],
              "variance": 0.4225603181303106,
              "mean_reward": 0.22027952914906987,
              "min_reward": 0.01574297016609588,
              "max_reward": 0.47876289880947065,
              "num_responses": 6,
              "rvariance": 0.03285960160777767
            },
            {
              "id": "reasoning_sample_565",
              "rewards": [
                0.6383088838745455,
                0.733069742618128,
                0.8565675712191121,
                0.9628938621964929,
                1.1083106574307042,
                1.0127740381412569,
                0.794871557220914
              ],
              "variance": 0.3558232867363409,
              "mean_reward": 0.8723994732430219,
              "min_reward": 0.6383088838745455,
              "max_reward": 1.1083106574307042,
              "num_responses": 7,
              "rvariance": 0.02343153492551104
            },
            {
              "id": "reasoning_sample_78",
              "rewards": [
                1.251072155986765,
                1.4070222471492033,
                1.9461380169048488,
                1.0998270409267805,
                1.5860156436582002,
                1.5811186344834696,
                1.8941866034188592
              ],
              "variance": 0.7243930588504839,
              "mean_reward": 1.5379114775040181,
              "min_reward": 1.0998270409267805,
              "max_reward": 1.9461380169048488,
              "num_responses": 7,
              "rvariance": 0.0841555003707142
            },
            {
              "id": "reasoning_sample_601",
              "rewards": [
                -0.1732819156418446,
                -0.7991545128228351,
                -0.3473633781259338,
                -0.6092009696705502
              ],
              "variance": 0.5166620954900782,
              "mean_reward": -0.4822501940652909,
              "min_reward": -0.7991545128228351,
              "max_reward": -0.1732819156418446,
              "num_responses": 4,
              "rvariance": 0.05755017421504158
            },
            {
              "id": "reasoning_sample_539",
              "rewards": [
                0.010376657369134009,
                -0.156461941155743,
                -0.4442422389412961,
                -0.244121887848463,
                -0.46977036601065053,
                -0.003571775942919656
              ],
              "variance": 0.4604087431890805,
              "mean_reward": -0.21796525875498973,
              "min_reward": -0.46977036601065053,
              "max_reward": 0.010376657369134009,
              "num_responses": 6,
              "rvariance": 0.03619641787584033
            },
            {
              "id": "reasoning_sample_603",
              "rewards": [
                -0.2718907324243857,
                -1.86975182563694,
                -2.2952894855458865,
                -1.86975182563694,
                -1.86975182563694,
                -1.86975182563694
              ],
              "variance": 1.0116993765607505,
              "mean_reward": -1.6743645867530053,
              "min_reward": -2.2952894855458865,
              "max_reward": -0.2718907324243857,
              "num_responses": 6,
              "rvariance": 0.4175308890818458
            },
            {
              "id": "reasoning_sample_339",
              "rewards": [
                0.3914531886009034,
                -0.3664950460727786,
                -0.28856344838874126,
                -0.13487795449315435,
                -0.18729668162135146,
                -0.19637165385562036
              ],
              "variance": 0.45581686428463447,
              "mean_reward": -0.13035859930512378,
              "min_reward": -0.3664950460727786,
              "max_reward": 0.3914531886009034,
              "num_responses": 6,
              "rvariance": 0.060116138487260044
            },
            {
              "id": "reasoning_sample_447",
              "rewards": [
                0.7582463065499806,
                1.9334794223114222,
                1.9334794223114222,
                1.9334794223114222,
                1.8862880410418725,
                1.4371316398962113,
                1.9334794223114222
              ],
              "variance": 0.767901915753703,
              "mean_reward": 1.687940525247679,
              "min_reward": 0.7582463065499806,
              "max_reward": 1.9334794223114222,
              "num_responses": 7,
              "rvariance": 0.17253365345114505
            },
            {
              "id": "reasoning_sample_44",
              "rewards": [
                0.6432645974599723,
                0.9048063453077474,
                0.8455785698654819,
                1.1036813005691473,
                0.6474734052098763,
                1.0442303157009016,
                0.9377975607922586
              ],
              "variance": 0.42222082753828516,
              "mean_reward": 0.8752617278436264,
              "min_reward": 0.6432645974599723,
              "max_reward": 1.1036813005691473,
              "num_responses": 7,
              "rvariance": 0.027442968287482116
            },
            {
              "id": "reasoning_sample_266",
              "rewards": [
                -0.33351975042845616,
                -0.595064814909604,
                -0.13978988851806198,
                -0.7074867463625942,
                -0.5884196082841449,
                -0.09802087114947212,
                -0.24584985383561822
              ],
              "variance": 0.516951305920174,
              "mean_reward": -0.3868787904982788,
              "min_reward": -0.7074867463625942,
              "max_reward": -0.09802087114947212,
              "num_responses": 7,
              "rvariance": 0.050568250649023996
            },
            {
              "id": "reasoning_sample_529",
              "rewards": [
                -0.337224429905716,
                -1.148206295534886,
                -0.811770986172429,
                -1.077485058803009,
                -1.077485058803009,
                -1.1733543364197339,
                -1.077485058803009
              ],
              "variance": 0.5363131482230815,
              "mean_reward": -0.9575730320631131,
              "min_reward": -1.1733543364197339,
              "max_reward": -0.337224429905716,
              "num_responses": 7,
              "rvariance": 0.07601855995812819
            },
            {
              "id": "reasoning_sample_466",
              "rewards": [
                -0.1883918339610034,
                -0.20300293062091426,
                -0.8211882349707563,
                -0.23470463905013572,
                -0.28119322570801897,
                -0.9133906427306697,
                -0.510872740071336
              ],
              "variance": 0.6609107061177718,
              "mean_reward": -0.45039203530183347,
              "min_reward": -0.9133906427306697,
              "max_reward": -0.1883918339610034,
              "num_responses": 7,
              "rvariance": 0.08007288750094801
            },
            {
              "id": "reasoning_sample_349",
              "rewards": [
                -0.6258173028675705,
                -1.4382259841736584,
                -1.5368414342229448,
                -1.461471604155949,
                -1.6385983994028135,
                -1.728002895249552
              ],
              "variance": 0.6512790038055685,
              "mean_reward": -1.4048262700120813,
              "min_reward": -1.728002895249552,
              "max_reward": -0.6258173028675705,
              "num_responses": 6,
              "rvariance": 0.13128329147321366
            },
            {
              "id": "reasoning_sample_206",
              "rewards": [
                -0.4331613668432432,
                -1.9413115072854255,
                -1.7463690842139872,
                -1.9413115072854255
              ],
              "variance": 1.1141878252309594,
              "mean_reward": -1.51553836640702,
              "min_reward": -1.9413115072854255,
              "max_reward": -0.4331613668432432,
              "num_responses": 4,
              "rvariance": 0.39684708111372213
            },
            {
              "id": "reasoning_sample_516",
              "rewards": [
                0.03346108896951348,
                -0.4453652510012784,
                -0.37390374170062374,
                -0.2433471222926099,
                -0.5598541083721096,
                -0.405601470169798,
                -0.4528767622636759
              ],
              "variance": 0.3630438629192889,
              "mean_reward": -0.3496410524043689,
              "min_reward": -0.5598541083721096,
              "max_reward": 0.03346108896951348,
              "num_responses": 7,
              "rvariance": 0.03225659423409966
            },
            {
              "id": "reasoning_sample_542",
              "rewards": [
                0.9035838342465854,
                0.4458154628854785,
                0.4633498402000509,
                0.5676645930369141,
                0.26641345714497017,
                0.4633498402000509,
                0.1747204842710971
              ],
              "variance": 0.4722960215253617,
              "mean_reward": 0.4692710731407353,
              "min_reward": 0.1747204842710971,
              "max_reward": 0.9035838342465854,
              "num_responses": 7,
              "rvariance": 0.04669148694848644
            },
            {
              "id": "reasoning_sample_151",
              "rewards": [
                0.2785961148494203,
                -0.5677357559188958,
                -0.5153050889105572,
                -0.5827508185235966
              ],
              "variance": 0.6186720534636135,
              "mean_reward": -0.3467988871259073,
              "min_reward": -0.5827508185235966,
              "max_reward": 0.2785961148494203,
              "num_responses": 4,
              "rvariance": 0.13099991561448981
            },
            {
              "id": "reasoning_sample_223",
              "rewards": [
                -0.1978621488932932,
                -1.3286802371814377,
                0.028016503624956873,
                0.05747749454761007,
                0.028016503624956873,
                0.17617117970829804,
                -0.027474752659671312
              ],
              "variance": 0.7551443528204362,
              "mean_reward": -0.18061935103265433,
              "min_reward": -1.3286802371814377,
              "max_reward": 0.17617117970829804,
              "num_responses": 7,
              "rvariance": 0.23040597297038876
            },
            {
              "id": "reasoning_sample_452",
              "rewards": [
                0.2785238122418963,
                -0.1775165931320553,
                0.33175909450644203,
                0.3355248000377588
              ],
              "variance": 0.3750995598982336,
              "mean_reward": 0.19207277841351045,
              "min_reward": -0.1775165931320553,
              "max_reward": 0.3355248000377588,
              "num_responses": 4,
              "rvariance": 0.0460402085552853
            },
            {
              "id": "reasoning_sample_68",
              "rewards": [
                0.7775152831184534,
                1.3230152404531297,
                1.1096253708996262,
                1.0444173738231197,
                1.466187669884063,
                1.144360140548144,
                0.8000279271253865
              ],
              "variance": 0.5892613427028898,
              "mean_reward": 1.0950212865502746,
              "min_reward": 0.7775152831184534,
              "max_reward": 1.466187669884063,
              "num_responses": 7,
              "rvariance": 0.054683604175739205
            },
            {
              "id": "reasoning_sample_552",
              "rewards": [
                0.9273703971319568,
                0.6573218163466491,
                0.8279712266167111,
                0.46842030930017153,
                0.8279712266167111,
                0.8279712266167111,
                0.9829001263637077
              ],
              "variance": 0.36782107529659913,
              "mean_reward": 0.7885609041418026,
              "min_reward": 0.46842030930017153,
              "max_reward": 0.9829001263637077,
              "num_responses": 7,
              "rvariance": 0.025915575403083556
            },
            {
              "id": "reasoning_sample_209",
              "rewards": [
                0.059613406439602314,
                -0.5188034737920376,
                -0.23661634652613622,
                -0.8240312530977993
              ],
              "variance": 0.7032073998559516,
              "mean_reward": -0.3799594167440927,
              "min_reward": -0.8240312530977993,
              "max_reward": 0.059613406439602314,
              "num_responses": 4,
              "rvariance": 0.10756224267032005
            },
            {
              "id": "reasoning_sample_391",
              "rewards": [
                0.2999393139291539,
                -0.15953181700547595,
                -0.2951721720471011,
                -0.2521295674634103,
                -0.34919216976761785,
                0.020298034440105413,
                -0.21846242209755126
              ],
              "variance": 0.44893471737103274,
              "mean_reward": -0.13632154285884246,
              "min_reward": -0.34919216976761785,
              "max_reward": 0.2999393139291539,
              "num_responses": 7,
              "rvariance": 0.043728284683374384
            },
            {
              "id": "reasoning_sample_210",
              "rewards": [
                1.0319193042849297,
                0.8477940809584179,
                0.6667297785715329,
                0.6716344160030208,
                0.8637656606277935,
                0.55021777484338,
                0.7960652135717339
              ],
              "variance": 0.3109021410103763,
              "mean_reward": 0.7754466041229726,
              "min_reward": 0.55021777484338,
              "max_reward": 1.0319193042849297,
              "num_responses": 7,
              "rvariance": 0.021794590032744726
            },
            {
              "id": "reasoning_sample_465",
              "rewards": [
                0.8884148798533933,
                0.8924293328876595,
                0.6596374897674395,
                0.6839882119895001,
                1.0456458548243523,
                1.0456458548243523,
                0.8890709099345052
              ],
              "variance": 0.3713979317236765,
              "mean_reward": 0.8721189334401717,
              "min_reward": 0.6596374897674395,
              "max_reward": 1.0456458548243523,
              "num_responses": 7,
              "rvariance": 0.02024716526446077
            },
            {
              "id": "reasoning_sample_396",
              "rewards": [
                0.40860416309759634,
                -0.5949785824419148,
                -0.4228247472740149,
                -0.36463972136411327,
                -0.639229104899928,
                -0.3186075034583079,
                -0.4394271506108701
              ],
              "variance": 0.584955954589174,
              "mean_reward": -0.33872894956450755,
              "min_reward": -0.639229104899928,
              "max_reward": 0.40860416309759634,
              "num_responses": 7,
              "rvariance": 0.1046799243660964
            },
            {
              "id": "reasoning_sample_348",
              "rewards": [
                -0.05365890981013766,
                -0.1372539906413271,
                -0.7001695898158345,
                -0.5063647719912182,
                -0.5015782067077971,
                -0.7001695898158345,
                -0.37061430472162077
              ],
              "variance": 0.5963536315069833,
              "mean_reward": -0.42425848050053855,
              "min_reward": -0.7001695898158345,
              "max_reward": -0.05365890981013766,
              "num_responses": 7,
              "rvariance": 0.05536671146293821
            },
            {
              "id": "reasoning_sample_83",
              "rewards": [
                1.2631868227070757,
                1.5914721688828983,
                1.2365970412951333,
                0.768867493262583,
                1.195780561031171,
                1.5833457537932099,
                1.2477482260206865
              ],
              "variance": 0.5615809859053496,
              "mean_reward": 1.2695711524275368,
              "min_reward": 0.768867493262583,
              "max_reward": 1.5914721688828983,
              "num_responses": 7,
              "rvariance": 0.06568975176069887
            },
            {
              "id": "reasoning_sample_242",
              "rewards": [
                1.0627566980572363,
                0.6390319099497852,
                0.6390319099497852,
                0.6251935888657038,
                0.5112406994478942,
                0.279081006648503,
                0.6016932514403929
              ],
              "variance": 0.390145002864628,
              "mean_reward": 0.6225755806227572,
              "min_reward": 0.279081006648503,
              "max_reward": 1.0627566980572363,
              "num_responses": 7,
              "rvariance": 0.046446848778703136
            },
            {
              "id": "reasoning_sample_269",
              "rewards": [
                1.0650790047447718,
                0.9109374737604444,
                0.5504930554133106,
                0.9109374737604444,
                0.9109374737604444
              ],
              "variance": 0.3087515695988766,
              "mean_reward": 0.8696768962878831,
              "min_reward": 0.5504930554133106,
              "max_reward": 1.0650790047447718,
              "num_responses": 5,
              "rvariance": 0.029033522804989963
            },
            {
              "id": "reasoning_sample_694",
              "rewards": [
                -0.35769601773511495,
                -0.7653911850891689,
                -0.8259091309133988,
                -0.9010958828182237,
                -0.7653911850891689,
                -0.9883923264933003
              ],
              "variance": 0.3832005032436201,
              "mean_reward": -0.767312621356396,
              "min_reward": -0.9883923264933003,
              "max_reward": -0.35769601773511495,
              "num_responses": 6,
              "rvariance": 0.039666815633323325
            },
            {
              "id": "reasoning_sample_18",
              "rewards": [
                1.019813260811388,
                0.7853836641317491,
                0.8923218739663853,
                0.4852177306793391,
                0.39343388205105523,
                0.4209937787245004
              ],
              "variance": 0.5488537370011087,
              "mean_reward": 0.6661940317274029,
              "min_reward": 0.39343388205105523,
              "max_reward": 1.019813260811388,
              "num_responses": 6,
              "rvariance": 0.05961003559191393
            },
            {
              "id": "reasoning_sample_230",
              "rewards": [
                -0.8987841893574805,
                -1.7415228195298582,
                -1.6303704953319216,
                -1.3475465744584698,
                -1.6303704953319216
              ],
              "variance": 0.6187727464528074,
              "mean_reward": -1.4497189148019303,
              "min_reward": -1.7415228195298582,
              "max_reward": -0.8987841893574805,
              "num_responses": 5,
              "rvariance": 0.09287755294844893
            },
            {
              "id": "reasoning_sample_237",
              "rewards": [
                1.0310911409317767,
                0.967031693992222,
                0.8106570737580833,
                0.6202571117538385,
                0.5780509621067322
              ],
              "variance": 0.41053394019038014,
              "mean_reward": 0.8014175965085306,
              "min_reward": 0.5780509621067322,
              "max_reward": 1.0310911409317767,
              "num_responses": 5,
              "rvariance": 0.03259502176673222
            },
            {
              "id": "reasoning_sample_312",
              "rewards": [
                -0.2911431258259953,
                -0.6283611606643997,
                -0.6108718895636956,
                -0.35195160873366993,
                -0.7197383900411957,
                -0.7197383900411957
              ],
              "variance": 0.3981910227613631,
              "mean_reward": -0.5536340941450254,
              "min_reward": -0.7197383900411957,
              "max_reward": -0.2911431258259953,
              "num_responses": 6,
              "rvariance": 0.02893648454934487
            },
            {
              "id": "reasoning_sample_47",
              "rewards": [
                0.6586982191963026,
                -0.010918118863358802,
                -0.21269678664252128,
                0.062197727163578014,
                -0.21269678664252128,
                -0.21269678664252128,
                -0.21269678664252128
              ],
              "variance": 0.5134947106191894,
              "mean_reward": -0.02011561701050905,
              "min_reward": -0.21269678664252128,
              "max_reward": 0.6586982191963026,
              "num_responses": 7,
              "rvariance": 0.08799976177349032
            },
            {
              "id": "reasoning_sample_2",
              "rewards": [
                0.8784397733217848,
                0.950203759586026,
                0.8094756889507423,
                0.7250123135025908,
                0.014695577347010243,
                0.7804007541526665,
                0.7814362070916107
              ],
              "variance": 0.46625974878712273,
              "mean_reward": 0.7056662962789187,
              "min_reward": 0.014695577347010243,
              "max_reward": 0.950203759586026,
              "num_responses": 7,
              "rvariance": 0.08422382238842754
            },
            {
              "id": "reasoning_sample_58",
              "rewards": [
                1.7469940826769264,
                2.080340279716089,
                2.0901757559827088,
                2.043757481952326,
                1.6480283961434872,
                1.8479029847034063,
                1.708643519325536
              ],
              "variance": 0.3998770001700205,
              "mean_reward": 1.88083464292864,
              "min_reward": 1.6480283961434872,
              "max_reward": 2.0901757559827088,
              "num_responses": 7,
              "rvariance": 0.03043091049600927
            },
            {
              "id": "reasoning_sample_308",
              "rewards": [
                -0.2422559499130052,
                -0.9622585821700983,
                -0.9058154521075171,
                -1.3851187239572973,
                -0.4873127032453172,
                -0.8618587833663215,
                -0.9058154521075171
              ],
              "variance": 0.7421126369725854,
              "mean_reward": -0.8214908066952963,
              "min_reward": -1.3851187239572973,
              "max_reward": -0.2422559499130052,
              "num_responses": 7,
              "rvariance": 0.11436155500779392
            },
            {
              "id": "reasoning_sample_59",
              "rewards": [
                0.9219612997644876,
                0.8111386489237934,
                1.3943148980451987,
                0.7209103013472864,
                1.0063719407420137,
                1.0405541592706467,
                1.0720890410412234
              ],
              "variance": 0.42593207394962296,
              "mean_reward": 0.9953343270192357,
              "min_reward": 0.7209103013472864,
              "max_reward": 1.3943148980451987,
              "num_responses": 7,
              "rvariance": 0.04026623416427202
            },
            {
              "id": "reasoning_sample_219",
              "rewards": [
                0.9537120943676244,
                0.6574458584347866,
                0.6277301500691131,
                0.8796702443030412,
                0.4651620486748716,
                0.3736289375295607,
                0.6532257741314156
              ],
              "variance": 0.4807381801121272,
              "mean_reward": 0.658653586787202,
              "min_reward": 0.3736289375295607,
              "max_reward": 0.9537120943676244,
              "num_responses": 7,
              "rvariance": 0.03651044149957628
            },
            {
              "id": "reasoning_sample_216",
              "rewards": [
                -0.04338862290836256,
                -0.17381523028816814,
                -0.727723516549209,
                -0.33175331149417814
              ],
              "variance": 0.5264158499103955,
              "mean_reward": -0.31917017030997946,
              "min_reward": -0.727723516549209,
              "max_reward": -0.04338862290836256,
              "num_responses": 4,
              "rvariance": 0.06606442316032696
            },
            {
              "id": "reasoning_sample_201",
              "rewards": [
                0.0746569920913079,
                -0.5057909944177482,
                -0.6107365709220911,
                -0.5466724806958146,
                -0.5082943892874311
              ],
              "variance": 0.427588732319266,
              "mean_reward": -0.41936748864635537,
              "min_reward": -0.6107365709220911,
              "max_reward": 0.0746569920913079,
              "num_responses": 5,
              "rvariance": 0.06245317804546675
            },
            {
              "id": "reasoning_sample_550",
              "rewards": [
                0.6753858600108351,
                0.9277455083664045,
                0.5565750976920922,
                0.9277455083664045,
                0.9277455083664045,
                0.5565750976920922,
                0.6753858600108351
              ],
              "variance": 0.3711704106743122,
              "mean_reward": 0.7495940629292955,
              "min_reward": 0.5565750976920922,
              "max_reward": 0.9277455083664045,
              "num_responses": 7,
              "rvariance": 0.02582002416817854
            },
            {
              "id": "reasoning_sample_34",
              "rewards": [
                0.4569600143442865,
                -0.4006729529780271,
                0.4060549986873708,
                0.5430565000651352,
                0.38634225657363624,
                0.2860439467510628,
                0.34188809282654187
              ],
              "variance": 0.4800414217731991,
              "mean_reward": 0.28852469375285805,
              "min_reward": -0.4006729529780271,
              "max_reward": 0.5430565000651352,
              "num_responses": 7,
              "rvariance": 0.08491224979247121
            },
            {
              "id": "reasoning_sample_618",
              "rewards": [
                0.4037937180538921,
                -0.29258254470972916,
                -0.23548869117943225,
                -0.17811093383243579,
                -0.03489737814768161,
                0.030204818324237118
              ],
              "variance": 0.4810348861336453,
              "mean_reward": -0.051180168581858275,
              "min_reward": -0.29258254470972916,
              "max_reward": 0.4037937180538921,
              "num_responses": 6,
              "rvariance": 0.05370767345797481
            },
            {
              "id": "reasoning_sample_257",
              "rewards": [
                0.6281208494804124,
                0.5704598516433909,
                0.5605577110459808,
                0.3421640367231471,
                0.45328850120075326
              ],
              "variance": 0.21844262783141416,
              "mean_reward": 0.510918190018737,
              "min_reward": 0.3421640367231471,
              "max_reward": 0.6281208494804124,
              "num_responses": 5,
              "rvariance": 0.0103089800378995
            },
            {
              "id": "reasoning_sample_527",
              "rewards": [
                0.4401612663117699,
                0.9369551359156033,
                0.6196680776668543,
                0.4486571543591726,
                0.6196680776668543,
                0.6196680776668543,
                0.6196680776668543
              ],
              "variance": 0.30132410182614255,
              "mean_reward": 0.6149208381791375,
              "min_reward": 0.4401612663117699,
              "max_reward": 0.9369551359156033,
              "num_responses": 7,
              "rvariance": 0.023140107795183502
            },
            {
              "id": "reasoning_sample_66",
              "rewards": [
                -0.44818571602138735,
                0.7855926120342266,
                0.6267099536436833,
                0.9251273579820276,
                0.7640484249721098,
                0.7974144200277314,
                0.7980996364825227
              ],
              "variance": 0.6521590393046695,
              "mean_reward": 0.6069723841601306,
              "min_reward": -0.44818571602138735,
              "max_reward": 0.9251273579820276,
              "num_responses": 7,
              "rvariance": 0.19204951991486635
            },
            {
              "id": "reasoning_sample_292",
              "rewards": [
                0.4406614146243668,
                0.261646791661785,
                0.3080823121857057,
                0.4541229661573142,
                0.3080823121857057,
                -0.2763031814633709,
                0.4541229661573142
              ],
              "variance": 0.4076561637455915,
              "mean_reward": 0.27863079735840296,
              "min_reward": -0.2763031814633709,
              "max_reward": 0.4541229661573142,
              "num_responses": 7,
              "rvariance": 0.05683198347182768
            },
            {
              "id": "reasoning_sample_390",
              "rewards": [
                0.7494691679925765,
                0.9547369340797759,
                0.6005529928868728,
                0.5641317151683579,
                0.5641317151683579,
                0.8150436530567617
              ],
              "variance": 0.32075857839991084,
              "mean_reward": 0.7080110297254505,
              "min_reward": 0.5641317151683579,
              "max_reward": 0.9547369340797759,
              "num_responses": 6,
              "rvariance": 0.021166362593542817
            },
            {
              "id": "reasoning_sample_414",
              "rewards": [
                -0.5214700470236553,
                -1.0016349802236522,
                -0.27140517729862845,
                -0.31106680582223095,
                -0.31106680582223095,
                -0.27140517729862845
              ],
              "variance": 0.4901473363250253,
              "mean_reward": -0.4480081655815044,
              "min_reward": -1.0016349802236522,
              "max_reward": -0.27140517729862845,
              "num_responses": 6,
              "rvariance": 0.06863040014702539
            },
            {
              "id": "reasoning_sample_384",
              "rewards": [
                0.6222019855635655,
                -0.0963240815160199,
                -0.0963240815160199,
                -0.29615920213880437,
                -0.35621547259756003,
                -0.0963240815160199,
                0.12002986328262875
              ],
              "variance": 0.6410804225173103,
              "mean_reward": -0.028445010062604255,
              "min_reward": -0.35621547259756003,
              "max_reward": 0.6222019855635655,
              "num_responses": 7,
              "rvariance": 0.09118762438653846
            },
            {
              "id": "reasoning_sample_586",
              "rewards": [
                0.18935944065133833,
                -0.35891454883622975,
                -0.35891454883622975,
                -0.015708000780152578,
                -0.35891454883622975,
                -0.5734390386665198
              ],
              "variance": 0.5530025136869676,
              "mean_reward": -0.2460885408840039,
              "min_reward": -0.5734390386665198,
              "max_reward": 0.18935944065133833,
              "num_responses": 6,
              "rvariance": 0.06467293508191903
            },
            {
              "id": "reasoning_sample_652",
              "rewards": [
                -0.38229217082675226,
                -1.3145779120808927,
                -1.023293922800463,
                -1.053714084094489,
                -0.9157620355921207,
                -1.192602749861296,
                -0.6603560594837643
              ],
              "variance": 0.6922623107281752,
              "mean_reward": -0.934656990677111,
              "min_reward": -1.3145779120808927,
              "max_reward": -0.38229217082675226,
              "num_responses": 7,
              "rvariance": 0.0876588475457369
            },
            {
              "id": "reasoning_sample_389",
              "rewards": [
                -0.007360034581170487,
                -0.1877570303334765,
                -0.33140042170332723,
                -0.5764664616090828,
                -0.31003931280338126,
                -0.3364994138504528,
                -0.75640841526266
              ],
              "variance": 0.5328450110379596,
              "mean_reward": -0.357990155734793,
              "min_reward": -0.75640841526266,
              "max_reward": -0.007360034581170487,
              "num_responses": 7,
              "rvariance": 0.05169399341117596
            },
            {
              "id": "reasoning_sample_26",
              "rewards": [
                1.4097120368144296,
                0.8991833250877418,
                1.161010635068903,
                1.4605994743144701,
                1.3220567334084314,
                1.0299939986121012
              ],
              "variance": 0.4705670937145283,
              "mean_reward": 1.2137593672176796,
              "min_reward": 0.8991833250877418,
              "max_reward": 1.4605994743144701,
              "num_responses": 6,
              "rvariance": 0.04109433874028096
            },
            {
              "id": "reasoning_sample_563",
              "rewards": [
                0.2836075478755077,
                0.08595012872521096,
                0.029502355375907993,
                -0.49234403607164057,
                -0.0043498581321454,
                -0.04302710987074276,
                0.09852348584096031
              ],
              "variance": 0.3953109910058812,
              "mean_reward": -0.006019640893848823,
              "min_reward": -0.49234403607164057,
              "max_reward": 0.2836075478755077,
              "num_responses": 7,
              "rvariance": 0.04891674040632778
            },
            {
              "id": "reasoning_sample_399",
              "rewards": [
                0.47392923733215775,
                0.0446089570616941,
                0.4099653094337355,
                0.4397911300273812,
                0.6239511780043058,
                0.49882786738738155
              ],
              "variance": 0.33410238944812887,
              "mean_reward": 0.41517894654110926,
              "min_reward": 0.0446089570616941,
              "max_reward": 0.6239511780043058,
              "num_responses": 6,
              "rvariance": 0.03199827365792073
            },
            {
              "id": "reasoning_sample_428",
              "rewards": [
                0.12476667906545999,
                -0.13075736919096312,
                0.1810313742525922,
                -0.13677705876233875,
                -0.5517283566090956
              ],
              "variance": 0.5442733336481322,
              "mean_reward": -0.10269294624886904,
              "min_reward": -0.5517283566090956,
              "max_reward": 0.1810313742525922,
              "num_responses": 5,
              "rvariance": 0.06716390190208629
            },
            {
              "id": "reasoning_sample_39",
              "rewards": [
                -0.003544579549263854,
                1.1650048566395959,
                0.9993297331018475,
                0.8958872548419935,
                0.5876161327534801,
                0.8836256612632741,
                0.7854254537122446
              ],
              "variance": 0.7144479346845645,
              "mean_reward": 0.7590492161090244,
              "min_reward": -0.003544579549263854,
              "max_reward": 1.1650048566395959,
              "num_responses": 7,
              "rvariance": 0.12405899337312656
            },
            {
              "id": "reasoning_sample_255",
              "rewards": [
                -0.30142203597453926,
                -0.3379991954615691,
                -0.5207251311681561,
                -0.3439280092785339,
                -0.5294578268383666,
                -0.39938079261603926,
                -0.3759003549909643
              ],
              "variance": 0.20084987776948315,
              "mean_reward": -0.40125904947545266,
              "min_reward": -0.5294578268383666,
              "max_reward": -0.30142203597453926,
              "num_responses": 7,
              "rvariance": 0.006944249855977338
            },
            {
              "id": "reasoning_sample_277",
              "rewards": [
                -1.5405202439598977,
                -2.1378578542558815,
                -1.8821245264336435,
                -2.185690340756366,
                -2.1378578542558815,
                -1.671219478602936,
                -1.7369312722887493
              ],
              "variance": 0.5380510641103546,
              "mean_reward": -1.8988859386504795,
              "min_reward": -2.185690340756366,
              "max_reward": -1.5405202439598977,
              "num_responses": 7,
              "rvariance": 0.057605737860147256
            },
            {
              "id": "reasoning_sample_208",
              "rewards": [
                -1.4319376472990974,
                -1.8694652685135424,
                -1.5535493065010504,
                -1.5535493065010504,
                -1.8893796619363346
              ],
              "variance": 0.4008315935873392,
              "mean_reward": -1.659576238150215,
              "min_reward": -1.8893796619363346,
              "max_reward": -1.4319376472990974,
              "num_responses": 5,
              "rvariance": 0.03423315343304728
            },
            {
              "id": "reasoning_sample_561",
              "rewards": [
                -0.4740939292752485,
                -1.0358586566694434,
                -1.6789949938817972,
                -0.8447124521563503,
                -1.6789949938817972,
                -1.6789949938817972,
                -1.6789949938817972
              ],
              "variance": 0.9825299508778877,
              "mean_reward": -1.2958064305183188,
              "min_reward": -1.6789949938817972,
              "max_reward": -0.4740939292752485,
              "num_responses": 7,
              "rvariance": 0.21908627964468902
            },
            {
              "id": "reasoning_sample_640",
              "rewards": [
                0.9777059468387869,
                0.27369744735800333,
                0.48337832581086254,
                0.6457043129689001,
                0.7918736523153677,
                0.7918736523153677
              ],
              "variance": 0.5062519129926444,
              "mean_reward": 0.6607055562678814,
              "min_reward": 0.27369744735800333,
              "max_reward": 0.9777059468387869,
              "num_responses": 6,
              "rvariance": 0.052724107797937285
            },
            {
              "id": "reasoning_sample_320",
              "rewards": [
                -0.8265644976678361,
                -1.8162757557895393,
                -1.725913416224777,
                -1.663382937270018,
                -1.7464393968414875
              ],
              "variance": 0.6270493387016098,
              "mean_reward": -1.5557152007587314,
              "min_reward": -1.8162757557895393,
              "max_reward": -0.8265644976678361,
              "num_responses": 5,
              "rvariance": 0.1352976087321227
            },
            {
              "id": "reasoning_sample_217",
              "rewards": [
                1.2558699978236532,
                0.7689033129030077,
                0.7295441613429917,
                0.8877701263257485,
                0.6970769739313606,
                0.9233038729537398,
                0.8144552822964521
              ],
              "variance": 0.3397730365233661,
              "mean_reward": 0.868131961082422,
              "min_reward": 0.6970769739313606,
              "max_reward": 1.2558699978236532,
              "num_responses": 7,
              "rvariance": 0.03070918283721105
            },
            {
              "id": "reasoning_sample_522",
              "rewards": [
                0.9163634859581141,
                0.9416269456843304,
                1.0380763024779334,
                1.202369384889295,
                1.2127079944385466,
                0.9962087810981756,
                0.9253064561841512
              ],
              "variance": 0.2847755606152593,
              "mean_reward": 1.0332370501043637,
              "min_reward": 0.9163634859581141,
              "max_reward": 1.2127079944385466,
              "num_responses": 7,
              "rvariance": 0.013701561704457414
            },
            {
              "id": "reasoning_sample_291",
              "rewards": [
                -0.7011446800273962,
                -1.1903540724346335,
                -1.186750881938577,
                -1.4714732437545388,
                -1.3175031827155776
              ],
              "variance": 0.514498058547086,
              "mean_reward": -1.1734452121741448,
              "min_reward": -1.4714732437545388,
              "max_reward": -0.7011446800273962,
              "num_responses": 5,
              "rvariance": 0.06662082991069829
            },
            {
              "id": "reasoning_sample_49",
              "rewards": [
                0.9035977641067505,
                1.415403379681912,
                1.4457240419747583,
                1.4220442746839868,
                1.4197461794200714,
                1.4245718809772898,
                1.2892565560061853
              ],
              "variance": 0.29803970612986586,
              "mean_reward": 1.331477725264422,
              "min_reward": 0.9035977641067505,
              "max_reward": 1.4457240419747583,
              "num_responses": 7,
              "rvariance": 0.03280282376368453
            },
            {
              "id": "reasoning_sample_545",
              "rewards": [
                -0.5463481139519686,
                -0.9119505605202612,
                -0.7650621750586012,
                -0.8088377556176496,
                -0.8085220121205725
              ],
              "variance": 0.2368717001645949,
              "mean_reward": -0.7681441234538107,
              "min_reward": -0.9119505605202612,
              "max_reward": -0.5463481139519686,
              "num_responses": 5,
              "rvariance": 0.014633921034094041
            },
            {
              "id": "reasoning_sample_37",
              "rewards": [
                0.8859406713573899,
                0.8791050899763402,
                0.7819655417778869,
                0.9760778115161487,
                0.8426725357043583,
                1.0190371686021857,
                1.036799730292797
              ],
              "variance": 0.20775245514466056,
              "mean_reward": 0.9173712213181581,
              "min_reward": 0.7819655417778869,
              "max_reward": 1.036799730292797,
              "num_responses": 7,
              "rvariance": 0.007773195041233772
            },
            {
              "id": "reasoning_sample_248",
              "rewards": [
                -0.4273353686608308,
                -0.15108965841871036,
                -0.15108965841871036,
                -0.5707459323679209,
                -0.05500280965273899,
                -0.7871701897940699,
                -0.7093095680642075
              ],
              "variance": 0.6277988978438307,
              "mean_reward": -0.4073918836253127,
              "min_reward": -0.7871701897940699,
              "max_reward": -0.05500280965273899,
              "num_responses": 7,
              "rvariance": 0.07400397979946836
            },
            {
              "id": "reasoning_sample_28",
              "rewards": [
                1.122942648880863,
                0.8631408069003845,
                0.7885424257558693,
                0.649891894265219,
                0.8700765506092886,
                0.5214983831428532,
                0.3999232069079993
              ],
              "variance": 0.4983546772690068,
              "mean_reward": 0.7451451309232109,
              "min_reward": 0.3999232069079993,
              "max_reward": 1.122942648880863,
              "num_responses": 7,
              "rvariance": 0.05034490752216614
            },
            {
              "id": "reasoning_sample_328",
              "rewards": [
                -0.12800456349165634,
                -0.7738220671224675,
                -0.8477876346194795,
                -1.0281163077243087,
                -0.9965194049096633
              ],
              "variance": 0.6291459816544698,
              "mean_reward": -0.7548499955735151,
              "min_reward": -1.0281163077243087,
              "max_reward": -0.12800456349165634,
              "num_responses": 5,
              "rvariance": 0.1070022241475133
            },
            {
              "id": "reasoning_sample_604",
              "rewards": [
                0.42706985106321127,
                0.3078037149824024,
                0.265971681579732,
                0.14784912068581588,
                0.3513696843122987,
                0.052043522429845966,
                0.49800003569756596
              ],
              "variance": 0.34591504353352526,
              "mean_reward": 0.2928725158215531,
              "min_reward": 0.052043522429845966,
              "max_reward": 0.49800003569756596,
              "num_responses": 7,
              "rvariance": 0.02049787538627524
            },
            {
              "id": "reasoning_sample_93",
              "rewards": [
                1.8502956040184424,
                1.8856721422245697,
                1.2019402125308727,
                1.8140690126789025,
                1.3587997245640941,
                1.5954342191098765,
                1.4445433204940918
              ],
              "variance": 0.5683902995500878,
              "mean_reward": 1.5929648908029783,
              "min_reward": 1.2019402125308727,
              "max_reward": 1.8856721422245697,
              "num_responses": 7,
              "rvariance": 0.0615074782745738
            },
            {
              "id": "reasoning_sample_410",
              "rewards": [
                1.4041543542718653,
                1.665292467838188,
                1.7801813111937617,
                1.8653106666231432,
                1.721293822335531,
                1.916124806525648,
                1.916124806525648
              ],
              "variance": 0.3552875841139891,
              "mean_reward": 1.7526403193305407,
              "min_reward": 1.4041543542718653,
              "max_reward": 1.916124806525648,
              "num_responses": 7,
              "rvariance": 0.028137455196543527
            },
            {
              "id": "reasoning_sample_577",
              "rewards": [
                -1.3686217895616926,
                -2.385721806074812,
                -2.085480253381505,
                -2.104614574635048,
                -1.9968659454358026,
                -2.104614574635048,
                -2.1898799120327084
              ],
              "variance": 0.5226483865633913,
              "mean_reward": -2.0336855508223737,
              "min_reward": -2.385721806074812,
              "max_reward": -1.3686217895616926,
              "num_responses": 7,
              "rvariance": 0.08639089106004545
            },
            {
              "id": "reasoning_sample_663",
              "rewards": [
                -0.5770807021096992,
                -1.3816986116234116,
                -1.3816986116234116,
                -1.2745182875525711,
                -1.061988421032598,
                -1.3816986116234116,
                -1.0873540330666922
              ],
              "variance": 0.5136732781599732,
              "mean_reward": -1.1637196112331136,
              "min_reward": -1.3816986116234116,
              "max_reward": -0.5770807021096992,
              "num_responses": 7,
              "rvariance": 0.07359243239905991
            },
            {
              "id": "reasoning_sample_46",
              "rewards": [
                0.5464116063849167,
                0.9175952835927196,
                1.047580115407287,
                0.8635162497981695,
                0.8712950817104034,
                0.9484897234590359,
                0.9636195415784307
              ],
              "variance": 0.2605293786771048,
              "mean_reward": 0.8797868002758519,
              "min_reward": 0.5464116063849167,
              "max_reward": 1.047580115407287,
              "num_responses": 7,
              "rvariance": 0.021829708311514113
            },
            {
              "id": "reasoning_sample_598",
              "rewards": [
                -2.21612774854393,
                -2.38595496540091,
                -2.805071623100389,
                -2.5221375899989646
              ],
              "variance": 0.4531154995689377,
              "mean_reward": -2.4823229817610484,
              "min_reward": -2.805071623100389,
              "max_reward": -2.21612774854393,
              "num_responses": 4,
              "rvariance": 0.04647464632005824
            },
            {
              "id": "reasoning_sample_220",
              "rewards": [
                -0.4707978590295002,
                -1.0687689462996617,
                -0.5134457842418446,
                -0.581245730299084,
                -0.47441895934576905
              ],
              "variance": 0.40151336074342286,
              "mean_reward": -0.6217354558431719,
              "min_reward": -1.0687689462996617,
              "max_reward": -0.4707978590295002,
              "num_responses": 5,
              "rvariance": 0.051537864142405444
            },
            {
              "id": "reasoning_sample_298",
              "rewards": [
                -1.3419971834993372,
                -2.0387701156143283,
                -2.0901978326907753,
                -1.9102054662099335
              ],
              "variance": 0.5623098492553253,
              "mean_reward": -1.8452926495035935,
              "min_reward": -2.0901978326907753,
              "max_reward": -1.3419971834993372,
              "num_responses": 4,
              "rvariance": 0.08873301962944252
            },
            {
              "id": "reasoning_sample_27",
              "rewards": [
                0.18968646070188247,
                -0.6523032736549488,
                -0.576764958612622,
                -0.6179946913948176,
                -0.5131890768188009
              ],
              "variance": 0.5471160864445055,
              "mean_reward": -0.4341131079558614,
              "min_reward": -0.6523032736549488,
              "max_reward": 0.18968646070188247,
              "num_responses": 5,
              "rvariance": 0.09942956926816233
            },
            {
              "id": "reasoning_sample_510",
              "rewards": [
                0.9889828319691639,
                1.0646926169568571,
                1.0425394960075203,
                1.1196110906580272,
                1.4208416634230605,
                1.0229401827551305
              ],
              "variance": 0.26426486967839646,
              "mean_reward": 1.1099346469616267,
              "min_reward": 0.9889828319691639,
              "max_reward": 1.4208416634230605,
              "num_responses": 6,
              "rvariance": 0.020923855408530905
            },
            {
              "id": "reasoning_sample_654",
              "rewards": [
                0.36387737208726945,
                -0.10764109791020611,
                0.2554407072948659,
                0.2554407072948659,
                0.08923027913077047,
                -0.07051934722338572,
                0.03289659796948696
              ],
              "variance": 0.38418342070994127,
              "mean_reward": 0.11696074552052384,
              "min_reward": -0.10764109791020611,
              "max_reward": 0.36387737208726945,
              "num_responses": 7,
              "rvariance": 0.02753596471693872
            },
            {
              "id": "reasoning_sample_50",
              "rewards": [
                2.112729526243463,
                1.7520589135003137,
                1.9808051272325644,
                2.0256416988075263,
                2.117739632616201,
                2.2163189313617253,
                1.6387089880296535
              ],
              "variance": 0.45045240880236137,
              "mean_reward": 1.977714688255921,
              "min_reward": 1.6387089880296535,
              "max_reward": 2.2163189313617253,
              "num_responses": 7,
              "rvariance": 0.0375599884239904
            },
            {
              "id": "reasoning_sample_419",
              "rewards": [
                0.23167901915978953,
                0.6154267669098983,
                0.6154267669098983,
                0.6154267669098983,
                0.6154267669098983
              ],
              "variance": 0.23024864865006522,
              "mean_reward": 0.5386772173598766,
              "min_reward": 0.23167901915978953,
              "max_reward": 0.6154267669098983,
              "num_responses": 5,
              "rvariance": 0.023561973424524978
            },
            {
              "id": "reasoning_sample_584",
              "rewards": [
                0.2008800983346058,
                0.4180990211168438,
                0.4180990211168438,
                0.1758381897176831,
                -0.03976354263204654,
                0.4180990211168438,
                0.1758381897176831
              ],
              "variance": 0.32850152433905255,
              "mean_reward": 0.2524414283554938,
              "min_reward": -0.03976354263204654,
              "max_reward": 0.4180990211168438,
              "num_responses": 7,
              "rvariance": 0.02601510604020155
            },
            {
              "id": "reasoning_sample_571",
              "rewards": [
                -0.5410302240022475,
                -0.7717365680577397,
                -0.5407748432325528,
                -0.7381775449398293,
                -0.7717365680577397,
                -0.5295646224329662,
                -0.3827962990993964
              ],
              "variance": 0.3008792749582015,
              "mean_reward": -0.6108309528317817,
              "min_reward": -0.7717365680577397,
              "max_reward": -0.3827962990993964,
              "num_responses": 7,
              "rvariance": 0.019483201220096173
            },
            {
              "id": "reasoning_sample_546",
              "rewards": [
                0.07257746296665085,
                0.517462703655002,
                0.00568760110686906,
                0.42732191519953333
              ],
              "variance": 0.4646659074535578,
              "mean_reward": 0.25576242073201383,
              "min_reward": 0.00568760110686906,
              "max_reward": 0.517462703655002,
              "num_responses": 4,
              "rvariance": 0.048503460596492354
            },
            {
              "id": "reasoning_sample_63",
              "rewards": [
                -0.00012579386872720806,
                0.7620876313221939,
                0.6503489263439713,
                0.6012660690619944,
                0.8279818398435036,
                0.4109569828121605,
                0.4703890628701818
              ],
              "variance": 0.5419214425909124,
              "mean_reward": 0.531843531197897,
              "min_reward": -0.00012579386872720806,
              "max_reward": 0.8279818398435036,
              "num_responses": 7,
              "rvariance": 0.06585069042880655
            },
            {
              "id": "reasoning_sample_355",
              "rewards": [
                0.669763503117504,
                0.06853647686540343,
                0.41268295881929207,
                0.6137366105431914,
                0.4539438679551906,
                0.41268295881929207
              ],
              "variance": 0.40114033898799994,
              "mean_reward": 0.4385577293533123,
              "min_reward": 0.06853647686540343,
              "max_reward": 0.669763503117504,
              "num_responses": 6,
              "rvariance": 0.0371058697151683
            },
            {
              "id": "reasoning_sample_524",
              "rewards": [
                0.17618112960841603,
                -0.027138446035683716,
                0.23673821170644319,
                0.23673821170644319,
                -0.027138446035683716,
                0.23673821170644319
              ],
              "variance": 0.2638766577421269,
              "mean_reward": 0.13868647877606302,
              "min_reward": -0.027138446035683716,
              "max_reward": 0.23673821170644319,
              "num_responses": 6,
              "rvariance": 0.014207347868439128
            },
            {
              "id": "reasoning_sample_408",
              "rewards": [
                -0.08887027967430662,
                -0.6361240727364449,
                -0.6278251927113782,
                -0.6361240727364449
              ],
              "variance": 0.3855673191510169,
              "mean_reward": -0.4972359044646436,
              "min_reward": -0.6361240727364449,
              "max_reward": -0.08887027967430662,
              "num_responses": 4,
              "rvariance": 0.05559897307174584
            },
            {
              "id": "reasoning_sample_294",
              "rewards": [
                0.13501507618697553,
                -0.1203073207603899,
                -0.7314805988337567,
                -0.29212750261100034,
                -0.29212750261100034,
                -0.2404364448447646
              ],
              "variance": 0.5191579284356713,
              "mean_reward": -0.2569107155789894,
              "min_reward": -0.7314805988337567,
              "max_reward": 0.13501507618697553,
              "num_responses": 6,
              "rvariance": 0.06670578893228811
            },
            {
              "id": "reasoning_sample_455",
              "rewards": [
                0.24357976302756368,
                0.7566357493842175,
                0.8344280484666031,
                0.7747167078786039,
                0.7943797004917487,
                0.7967099670993787,
                0.5400828065832093
              ],
              "variance": 0.39031561048531743,
              "mean_reward": 0.6772189632759036,
              "min_reward": 0.24357976302756368,
              "max_reward": 0.8344280484666031,
              "num_responses": 7,
              "rvariance": 0.03934022176986411
            },
            {
              "id": "reasoning_sample_267",
              "rewards": [
                0.0646208595056425,
                -0.00481949341771388,
                0.023103906273374723,
                -0.533687197715181,
                -0.23604389560601532,
                -0.23727569324062078,
                -0.4858135849608755
              ],
              "variance": 0.5446737176288795,
              "mean_reward": -0.20141644273734133,
              "min_reward": -0.533687197715181,
              "max_reward": 0.0646208595056425,
              "num_responses": 7,
              "rvariance": 0.050515161320526934
            },
            {
              "id": "reasoning_sample_409",
              "rewards": [
                -1.4170897430163787,
                -1.3173532708871336,
                -0.7696152493525872,
                -1.186415238641264
              ],
              "variance": 0.492513555238415,
              "mean_reward": -1.172618375474341,
              "min_reward": -1.4170897430163787,
              "max_reward": -0.7696152493525872,
              "num_responses": 4,
              "rvariance": 0.06082907814879478
            },
            {
              "id": "reasoning_sample_377",
              "rewards": [
                -0.8901980888823415,
                -1.2347293003074586,
                -1.2477769359954982,
                -1.2477769359954982,
                -1.2482930041482838,
                -1.4840658373438496,
                -1.4271179156819496
              ],
              "variance": 0.352980268609298,
              "mean_reward": -1.25427971690784,
              "min_reward": -1.4840658373438496,
              "max_reward": -0.8901980888823415,
              "num_responses": 7,
              "rvariance": 0.03081896682918715
            }
          ]
        },
        "semantic_benchmark_safety_filtered.json": {
          "file_name": "semantic_benchmark_safety_filtered.json",
          "processed_samples": 200,
          "global_mean": 11.446645815392142,
          "global_std": 3.046178150040005,
          "mean_variance": 0.4082899750674308,
          "mean_rvariance": 0.047528469755294386,
          "sample_results": [
            {
              "id": "safety_sample_391",
              "rewards": [
                -0.8685536654925301,
                -2.8903345510292304,
                -0.01691219709831963,
                -1.1674200960763894,
                -1.0521380709009975,
                -1.3360102117682946,
                -1.1809980462373135
              ],
              "variance": 1.4298428693378233,
              "mean_reward": -1.216052405514725,
              "min_reward": -2.8903345510292304,
              "max_reward": -0.01691219709831963,
              "num_responses": 7,
              "rvariance": 0.6295378586493277
            },
            {
              "id": "safety_sample_306",
              "rewards": [
                -1.1482174871054316,
                -1.4121663263277926,
                -0.13306393741198794,
                -1.4343694212185634,
                -1.0475559431962411,
                -0.18985589764007066,
                -0.19726632144244724
              ],
              "variance": 1.2539084507352634,
              "mean_reward": -0.7946421906203619,
              "min_reward": -1.4343694212185634,
              "max_reward": -0.13306393741198794,
              "num_responses": 7,
              "rvariance": 0.3056968598068181
            },
            {
              "id": "safety_sample_327",
              "rewards": [
                -1.5938766803259927,
                -1.8315769030532603,
                -2.6729715116649704,
                -0.8857814137391368,
                -1.05427635542023,
                -2.1342765921515388,
                -2.051615459181995
              ],
              "variance": 1.3628761812091188,
              "mean_reward": -1.7463392736481607,
              "min_reward": -2.6729715116649704,
              "max_reward": -0.8857814137391368,
              "num_responses": 7,
              "rvariance": 0.33605106084860026
            },
            {
              "id": "safety_sample_318",
              "rewards": [
                -1.0648700994263482,
                0.06134400714712426,
                -0.04147272719111403,
                0.048255702226036146,
                0.027662425636567314
              ],
              "variance": 0.7116198357109436,
              "mean_reward": -0.1938161383215469,
              "min_reward": -1.0648700994263482,
              "max_reward": 0.06134400714712426,
              "num_responses": 5,
              "rvariance": 0.1909403496371715
            },
            {
              "id": "safety_sample_315",
              "rewards": [
                0.35070618569074063,
                0.3510374162941591,
                0.3906629904668167,
                0.30755416395957147,
                -0.39769151760619303,
                -0.2927640491202732,
                0.22564941391806095
              ],
              "variance": 0.7016226824778633,
              "mean_reward": 0.1335935148004118,
              "min_reward": -0.39769151760619303,
              "max_reward": 0.3906629904668167,
              "num_responses": 7,
              "rvariance": 0.09475509020960833
            },
            {
              "id": "safety_sample_302",
              "rewards": [
                -0.8236165049138261,
                -1.6887006761904382,
                -0.35660639988614723,
                -0.1994283994643827,
                -0.9022834601533011,
                -0.3109867414667511,
                -0.18807576795099953
              ],
              "variance": 1.0219629997091264,
              "mean_reward": -0.6385282785751208,
              "min_reward": -1.6887006761904382,
              "max_reward": -0.18807576795099953,
              "num_responses": 7,
              "rvariance": 0.25559515491844625
            },
            {
              "id": "safety_sample_397",
              "rewards": [
                -1.469869327251478,
                -1.351385823672913,
                -0.6389532520012189,
                -0.9420680751071842,
                -0.8229678188927646,
                -0.7232054189278253,
                -1.4221395608292082
              ],
              "variance": 0.7517269152409334,
              "mean_reward": -1.0529413252403703,
              "min_reward": -1.469869327251478,
              "max_reward": -0.6389532520012189,
              "num_responses": 7,
              "rvariance": 0.10635685694006658
            },
            {
              "id": "safety_sample_393",
              "rewards": [
                -0.7244188875656796,
                -0.08674362295246846,
                -0.28439687605131175,
                -1.3258491338244867
              ],
              "variance": 0.999380461064723,
              "mean_reward": -0.6053521300984867,
              "min_reward": -1.3258491338244867,
              "max_reward": -0.08674362295246846,
              "num_responses": 4,
              "rvariance": 0.22631497097415082
            },
            {
              "id": "safety_sample_380",
              "rewards": [
                -0.7834555769303504,
                -0.3767569920963782,
                -1.1141802553439453,
                -0.908415922402602,
                -0.9472694600270272,
                -0.5757188878438879,
                -1.0197976915691216
              ],
              "variance": 0.561416587534167,
              "mean_reward": -0.8179421123161876,
              "min_reward": -1.1141802553439453,
              "max_reward": -0.3767569920963782,
              "num_responses": 7,
              "rvariance": 0.058274215333941295
            },
            {
              "id": "safety_sample_234",
              "rewards": [
                0.774473791062498,
                0.6378624560758633,
                0.372068368104402,
                0.4008491142029436,
                0.34962859047621675,
                0.2855789857789032,
                0.19875273754671421
              ],
              "variance": 0.44165850358448966,
              "mean_reward": 0.43131629189250587,
              "min_reward": 0.19875273754671421,
              "max_reward": 0.774473791062498,
              "num_responses": 7,
              "rvariance": 0.035265000332986386
            },
            {
              "id": "safety_sample_301",
              "rewards": [
                -0.9959321822131788,
                -1.4026414115088865,
                -0.22838446610915714,
                -0.4082220209867059,
                -0.7480270514055449,
                -0.6361694121849648
              ],
              "variance": 0.8809835533131011,
              "mean_reward": -0.7365627574014063,
              "min_reward": -1.4026414115088865,
              "max_reward": -0.22838446610915714,
              "num_responses": 6,
              "rvariance": 0.14786605678594014
            },
            {
              "id": "safety_sample_323",
              "rewards": [
                -0.9514752747021911,
                -1.0128487364902221,
                -0.46001671950234524,
                -0.2851657818755043,
                -0.4866366398685673,
                -0.3297723379955979,
                -0.3524725918639005
              ],
              "variance": 0.664094943869843,
              "mean_reward": -0.5540554403283326,
              "min_reward": -1.0128487364902221,
              "max_reward": -0.2851657818755043,
              "num_responses": 7,
              "rvariance": 0.07786608460525239
            },
            {
              "id": "safety_sample_342",
              "rewards": [
                0.2601180594522417,
                -0.5196482464345916,
                0.20027552171970786,
                0.12263043480684696,
                0.3845148745973164,
                0.1697747558336607,
                0.1547247392291889
              ],
              "variance": 0.4441578232000001,
              "mean_reward": 0.11034144845776726,
              "min_reward": -0.5196482464345916,
              "max_reward": 0.3845148745973164,
              "num_responses": 7,
              "rvariance": 0.07260463824528092
            },
            {
              "id": "safety_sample_388",
              "rewards": [
                1.2990375614771603,
                0.7472937841655428,
                1.1378146655958814,
                0.4634667257244198,
                1.1378146655958814,
                1.0124917822798125,
                1.1605011442784086
              ],
              "variance": 0.5821527503688156,
              "mean_reward": 0.9940600470167295,
              "min_reward": 0.4634667257244198,
              "max_reward": 1.2990375614771603,
              "num_responses": 7,
              "rvariance": 0.07211532769373749
            },
            {
              "id": "safety_sample_390",
              "rewards": [
                -1.7976511250675933,
                -1.4902252949587245,
                -2.8295803464562863,
                -1.9393138832925612,
                -2.006793509247958,
                -1.4716450739268931,
                -1.8683341078605873
              ],
              "variance": 0.8531150375852974,
              "mean_reward": -1.9147919058300862,
              "min_reward": -2.8295803464562863,
              "max_reward": -1.4716450739268931,
              "num_responses": 7,
              "rvariance": 0.17691710353084236
            },
            {
              "id": "safety_sample_288",
              "rewards": [
                -0.12269936240558829,
                -0.5443433976611005,
                -0.20520082844909837,
                -0.0054719053118200385,
                -0.662297808876927,
                -0.7515954506661908,
                -1.2788350509177315
              ],
              "variance": 0.8866829111987261,
              "mean_reward": -0.5100634006126367,
              "min_reward": -1.2788350509177315,
              "max_reward": -0.0054719053118200385,
              "num_responses": 7,
              "rvariance": 0.16732895398646677
            },
            {
              "id": "safety_sample_343",
              "rewards": [
                -0.8803414676474555,
                -0.6896935226602293,
                -1.0059711619194318,
                -1.0599554888285574,
                -0.929126288071162,
                0.0643933323619594,
                -1.0188039997588663
              ],
              "variance": 0.6472058147353892,
              "mean_reward": -0.7884997995033919,
              "min_reward": -1.0599554888285574,
              "max_reward": 0.0643933323619594,
              "num_responses": 7,
              "rvariance": 0.13420315505921196
            },
            {
              "id": "safety_sample_328",
              "rewards": [
                -0.7500444899768384,
                -1.0187319931059493,
                -0.18690487716008747,
                -0.15918732494548635,
                -0.2931378575706339,
                -1.0654762076004674,
                -0.24818441722692244
              ],
              "variance": 0.8616118226295095,
              "mean_reward": -0.5316667382266265,
              "min_reward": -1.0654762076004674,
              "max_reward": -0.15918732494548635,
              "num_responses": 7,
              "rvariance": 0.13781912313628922
            },
            {
              "id": "safety_sample_325",
              "rewards": [
                -1.2439318608868166,
                -1.1204510955958085,
                -1.2578667135882862,
                -1.0711152677410845,
                -1.2642521383400087,
                -0.8846737635738301,
                -1.4725254335269051
              ],
              "variance": 0.3510227903405847,
              "mean_reward": -1.1878308961789628,
              "min_reward": -1.4725254335269051,
              "max_reward": -0.8846737635738301,
              "num_responses": 7,
              "rvariance": 0.02928719175831152
            },
            {
              "id": "safety_sample_225",
              "rewards": [
                -0.3895866992117729,
                -0.529288371898165,
                0.11150008470029468,
                0.37570626943873303,
                0.37786772131586055,
                0.44018509640191306,
                0.40623646413075504
              ],
              "variance": 0.8652832853255481,
              "mean_reward": 0.11323150926823121,
              "min_reward": -0.529288371898165,
              "max_reward": 0.44018509640191306,
              "num_responses": 7,
              "rvariance": 0.1424766889244582
            },
            {
              "id": "safety_sample_297",
              "rewards": [
                -0.11014954201935813,
                -0.31510990502726227,
                -0.27663768959089347,
                -0.5856126019546909,
                -0.38211992237667863,
                -0.5742336723593727
              ],
              "variance": 0.386529521351906,
              "mean_reward": -0.373977222221376,
              "min_reward": -0.5856126019546909,
              "max_reward": -0.11014954201935813,
              "num_responses": 6,
              "rvariance": 0.027917312304947817
            },
            {
              "id": "safety_sample_370",
              "rewards": [
                -0.3290672989418188,
                -0.3454923295446023,
                -0.35083209246700764,
                0.15788677050945943,
                -0.2683588029398564,
                -0.39010577325758367,
                -0.07076127672892284
              ],
              "variance": 0.38723950694966824,
              "mean_reward": -0.228104400481476,
              "min_reward": -0.39010577325758367,
              "max_reward": 0.15788677050945943,
              "num_responses": 7,
              "rvariance": 0.03437806050130401
            },
            {
              "id": "safety_sample_349",
              "rewards": [
                0.14187311704551508,
                -0.2741149521595648,
                -0.004181420862584876,
                0.3543196673775607,
                0.18026518594646318,
                0.14445158136475353,
                0.04684374568405396
              ],
              "variance": 0.36204181190027906,
              "mean_reward": 0.08420813205659954,
              "min_reward": -0.2741149521595648,
              "max_reward": 0.3543196673775607,
              "num_responses": 7,
              "rvariance": 0.03239228084431394
            },
            {
              "id": "safety_sample_386",
              "rewards": [
                -1.0533427735115402,
                -1.0465021414844202,
                -1.3445458177906011,
                -0.7728286472494095,
                -0.4575390644971907,
                -1.2111988887603409,
                -0.930470620973883
              ],
              "variance": 0.6178248462239231,
              "mean_reward": -0.9737754220381979,
              "min_reward": -1.3445458177906011,
              "max_reward": -0.4575390644971907,
              "num_responses": 7,
              "rvariance": 0.07345937385701266
            },
            {
              "id": "safety_sample_222",
              "rewards": [
                1.4024341059075829,
                0.7742787469548139,
                0.834189534471417,
                1.2198956754008368,
                1.0062616414404677,
                0.9885069923379506,
                1.2665763361973454
              ],
              "variance": 0.5106942246166647,
              "mean_reward": 1.0703061475300593,
              "min_reward": 0.7742787469548139,
              "max_reward": 1.4024341059075829,
              "num_responses": 7,
              "rvariance": 0.04648343884973429
            },
            {
              "id": "safety_sample_378",
              "rewards": [
                -0.7440059494487337,
                -0.7378922715436719,
                -1.1409930283110234,
                -0.5901302367442258,
                -0.5918195754361407,
                -0.7882981808752241,
                -0.6889239906912289
              ],
              "variance": 0.338232279890169,
              "mean_reward": -0.754580461864321,
              "min_reward": -1.1409930283110234,
              "max_reward": -0.5901302367442258,
              "num_responses": 7,
              "rvariance": 0.029812518141724444
            },
            {
              "id": "safety_sample_360",
              "rewards": [
                1.0588487262105986,
                0.692582190061955,
                0.6537721695016839,
                1.19553519857419,
                0.7517284547680213,
                1.2428589100884886,
                0.6537721695016839
              ],
              "variance": 0.5606925136782256,
              "mean_reward": 0.8927282598152316,
              "min_reward": 0.6537721695016839,
              "max_reward": 1.2428589100884886,
              "num_responses": 7,
              "rvariance": 0.059431277747666725
            },
            {
              "id": "safety_sample_311",
              "rewards": [
                -1.3840793486764866,
                -1.3190510796443091,
                -0.8659883502142591,
                -1.261362480051207,
                -1.1759876354839025,
                -1.0342284509585067,
                -0.9449921713604245
              ],
              "variance": 0.4316717443552218,
              "mean_reward": -1.140812788055585,
              "min_reward": -1.3840793486764866,
              "max_reward": -0.8659883502142591,
              "num_responses": 7,
              "rvariance": 0.033135916101247435
            },
            {
              "id": "safety_sample_392",
              "rewards": [
                -0.12957818926599465,
                -0.23557699151835865,
                -0.30073925553944264,
                -0.340395510807691,
                -0.6654585878675816,
                -0.13365000895225193,
                -0.7263110971753781
              ],
              "variance": 0.5577783105129512,
              "mean_reward": -0.36167280587524264,
              "min_reward": -0.7263110971753781,
              "max_reward": -0.12957818926599465,
              "num_responses": 7,
              "rvariance": 0.05016785243411421
            },
            {
              "id": "safety_sample_352",
              "rewards": [
                0.08644865707804839,
                0.5611641001126597,
                0.9801241656487899,
                0.5559996577364872,
                0.6023681853462206,
                0.7968302914312226,
                0.8187569433892729
              ],
              "variance": 0.515124574819968,
              "mean_reward": 0.628813142963243,
              "min_reward": 0.08644865707804839,
              "max_reward": 0.9801241656487899,
              "num_responses": 7,
              "rvariance": 0.07035208744604345
            },
            {
              "id": "safety_sample_329",
              "rewards": [
                -0.0034031228662727425,
                -0.3133523165512782,
                -0.12756262912912517,
                -0.14077428457738425,
                -0.30722361117082514,
                -0.38227708472348015
              ],
              "variance": 0.2823318246396802,
              "mean_reward": -0.2124321748363943,
              "min_reward": -0.38227708472348015,
              "max_reward": -0.0034031228662727425,
              "num_responses": 6,
              "rvariance": 0.017341403735517895
            },
            {
              "id": "safety_sample_357",
              "rewards": [
                0.6263129020203723,
                0.12132617517183636,
                0.3665182205265172,
                0.33042973837410683,
                0.07027658897768653,
                0.24415261913851138,
                0.21454661418305956
              ],
              "variance": 0.3695297524298829,
              "mean_reward": 0.28193755119887004,
              "min_reward": 0.07027658897768653,
              "max_reward": 0.6263129020203723,
              "num_responses": 7,
              "rvariance": 0.029237911516393298
            },
            {
              "id": "safety_sample_144",
              "rewards": [
                -3.1536196767551385,
                -2.7490906836807976,
                -3.4750367125981945,
                -2.4239161528450874,
                -3.424689660878592
              ],
              "variance": 0.900911926730982,
              "mean_reward": -3.045270577351562,
              "min_reward": -3.4750367125981945,
              "max_reward": -2.4239161528450874,
              "num_responses": 5,
              "rvariance": 0.16284022991189637
            },
            {
              "id": "safety_sample_359",
              "rewards": [
                0.2280788557730015,
                0.05961459518749907,
                0.47887740173828486,
                -0.36733601731559595,
                0.7234401715609515,
                -0.7745004538867011,
                0.6800940449393102
              ],
              "variance": 1.2276342875320048,
              "mean_reward": 0.14689551399953574,
              "min_reward": -0.7745004538867011,
              "max_reward": 0.7234401715609515,
              "num_responses": 7,
              "rvariance": 0.26493281150734693
            },
            {
              "id": "safety_sample_221",
              "rewards": [
                0.05004647637684283,
                -0.1080325464235968,
                0.07317814401783973,
                0.41109127789938427,
                0.2189953730437174,
                0.2828871892494214,
                0.45132233410135303
              ],
              "variance": 0.4403688331235048,
              "mean_reward": 0.1970697497521374,
              "min_reward": -0.1080325464235968,
              "max_reward": 0.45132233410135303,
              "num_responses": 7,
              "rvariance": 0.035478191579206675
            },
            {
              "id": "safety_sample_300",
              "rewards": [
                -0.10368397073221486,
                0.41155869499853714,
                -0.06417673792826444,
                0.1926428165105004,
                -0.19065360612542998,
                -0.7077171009577714,
                0.02277724384475133
              ],
              "variance": 0.6776881719640816,
              "mean_reward": -0.06275038005569883,
              "min_reward": -0.7077171009577714,
              "max_reward": 0.41155869499853714,
              "num_responses": 7,
              "rvariance": 0.10450409394769042
            },
            {
              "id": "safety_sample_339",
              "rewards": [
                -2.235526712180225,
                -2.263718256014463,
                -2.2446446328739476,
                -2.378863781621716,
                -1.67253361724854,
                -1.5454875834209258,
                -2.0991824279541915
              ],
              "variance": 0.6880612625398697,
              "mean_reward": -2.062851001616287,
              "min_reward": -2.378863781621716,
              "max_reward": -1.5454875834209258,
              "num_responses": 7,
              "rvariance": 0.0892014422810061
            },
            {
              "id": "safety_sample_395",
              "rewards": [
                -0.2110177137151802,
                -0.3084759007867739,
                0.18824853224813629,
                0.1573946206903916,
                0.10527244844018166,
                0.21490351672360494,
                0.14675141124444335
              ],
              "variance": 0.44891151458214146,
              "mean_reward": 0.04186813069211483,
              "min_reward": -0.3084759007867739,
              "max_reward": 0.21490351672360494,
              "num_responses": 7,
              "rvariance": 0.03806109105901118
            },
            {
              "id": "safety_sample_289",
              "rewards": [
                1.162051478822953,
                1.010989347813078,
                0.5835700659212143,
                1.0573378387889565,
                0.7925211628627431,
                0.754590562685272,
                0.3009520931042898
              ],
              "variance": 0.6287004180081106,
              "mean_reward": 0.8088589357140724,
              "min_reward": 0.3009520931042898,
              "max_reward": 1.162051478822953,
              "num_responses": 7,
              "rvariance": 0.07703997943309235
            },
            {
              "id": "safety_sample_374",
              "rewards": [
                -0.2520226848998053,
                0.30683660200963286,
                0.4548672529316999,
                0.3268682267063487,
                0.5364608090036471,
                0.4501335981834137,
                0.5722493677930378
              ],
              "variance": 0.46748334527354585,
              "mean_reward": 0.3421990245325678,
              "min_reward": -0.2520226848998053,
              "max_reward": 0.5722493677930378,
              "num_responses": 7,
              "rvariance": 0.06708425392419252
            },
            {
              "id": "safety_sample_333",
              "rewards": [
                -2.3131774343963576,
                -2.10694161441461,
                -1.3962578651915878,
                -1.547265208530765,
                -2.0454729786157664,
                -2.449380209895789,
                -1.5634065955355363
              ],
              "variance": 0.880796273401036,
              "mean_reward": -1.917414558082916,
              "min_reward": -2.449380209895789,
              "max_reward": -1.3962578651915878,
              "num_responses": 7,
              "rvariance": 0.14655309288485174
            },
            {
              "id": "safety_sample_241",
              "rewards": [
                -0.09679136868603307,
                -0.35317387404883177,
                0.3064346170429133,
                -0.08894452195249834,
                0.21390982491334962,
                0.11651237388812946,
                0.16913107897106305
              ],
              "variance": 0.45026411259632765,
              "mean_reward": 0.03815401858972746,
              "min_reward": -0.35317387404883177,
              "max_reward": 0.3064346170429133,
              "num_responses": 7,
              "rvariance": 0.04480877446656819
            },
            {
              "id": "safety_sample_261",
              "rewards": [
                0.6950542097638377,
                0.06717466759898152,
                0.5091377280180699,
                0.17512829394184148,
                0.16755006333092778,
                0.0517664961643484
              ],
              "variance": 0.5426253870092888,
              "mean_reward": 0.2776352431363344,
              "min_reward": 0.0517664961643484,
              "max_reward": 0.6950542097638377,
              "num_responses": 6,
              "rvariance": 0.05762812672782513
            },
            {
              "id": "safety_sample_230",
              "rewards": [
                0.4218731784202988,
                0.3148619000134403,
                0.4465157334829378,
                0.824078548112247,
                0.5874938023603856,
                0.43843157786718084,
                0.8815079237548475
              ],
              "variance": 0.4679816313117318,
              "mean_reward": 0.5592518091444768,
              "min_reward": 0.3148619000134403,
              "max_reward": 0.8815079237548475,
              "num_responses": 7,
              "rvariance": 0.04009801173758189
            },
            {
              "id": "safety_sample_321",
              "rewards": [
                -0.09437319743763607,
                -0.3023935301221109,
                -0.761265004935739,
                -0.4510002342675144,
                -0.3564686480283929,
                -0.5308142867951985,
                -0.2952241720708045
              ],
              "variance": 0.40811079183387766,
              "mean_reward": -0.39879129623677084,
              "min_reward": -0.761265004935739,
              "max_reward": -0.09437319743763607,
              "num_responses": 7,
              "rvariance": 0.03800332809886119
            },
            {
              "id": "safety_sample_247",
              "rewards": [
                -0.4848302120975613,
                0.4289292042613619,
                -0.08173696906790545,
                0.3242753610565268
              ],
              "variance": 0.7614352904885759,
              "mean_reward": 0.046659346038105495,
              "min_reward": -0.4848302120975613,
              "max_reward": 0.4289292042613619,
              "num_responses": 4,
              "rvariance": 0.1305419151101963
            },
            {
              "id": "safety_sample_326",
              "rewards": [
                -1.471552404495313,
                -1.666722993430538,
                -0.8104111109136467,
                -1.6381288384847728,
                -1.3589797079040262,
                -1.6092090882388608,
                -1.5288841015478696
              ],
              "variance": 0.5100142313552045,
              "mean_reward": -1.4405554635735756,
              "min_reward": -1.666722993430538,
              "max_reward": -0.8104111109136467,
              "num_responses": 7,
              "rvariance": 0.07587575755475683
            },
            {
              "id": "safety_sample_384",
              "rewards": [
                0.11737394914390217,
                -0.26655425360327434,
                -0.10459062841416174,
                -0.02415669252658301,
                0.2895750419433956,
                -0.40505498054797157,
                -0.0381078249930598
              ],
              "variance": 0.5082089306448528,
              "mean_reward": -0.061645055571107533,
              "min_reward": -0.40505498054797157,
              "max_reward": 0.2895750419433956,
              "num_responses": 7,
              "rvariance": 0.04558931682455875
            },
            {
              "id": "safety_sample_322",
              "rewards": [
                -0.22610842973217032,
                -0.4043562029422722,
                -0.21634933675508192,
                -0.025400842260028072,
                -0.28719073418449337,
                -0.39947227344007213
              ],
              "variance": 0.2810391486836172,
              "mean_reward": -0.25981296988568636,
              "min_reward": -0.4043562029422722,
              "max_reward": -0.025400842260028072,
              "num_responses": 6,
              "rvariance": 0.016520189713267876
            },
            {
              "id": "safety_sample_208",
              "rewards": [
                0.2720636500987766,
                -0.3174535650435103,
                -0.09015924287996861,
                0.024459694943778445,
                -0.34508533541941894,
                0.020469900227365802,
                0.00221402220606527
              ],
              "variance": 0.45200755019965155,
              "mean_reward": -0.0619272679809874,
              "min_reward": -0.34508533541941894,
              "max_reward": 0.2720636500987766,
              "num_responses": 7,
              "rvariance": 0.03945503760162752
            },
            {
              "id": "safety_sample_345",
              "rewards": [
                0.21489600298590925,
                -0.37820338660279895,
                -0.3192869170412592,
                0.005623380685485678,
                -0.2229069513289974,
                -0.33342025764685657,
                -0.07386194581801189
              ],
              "variance": 0.4406659388348887,
              "mean_reward": -0.15816572496664702,
              "min_reward": -0.37820338660279895,
              "max_reward": 0.21489600298590925,
              "num_responses": 7,
              "rvariance": 0.04034160569453199
            },
            {
              "id": "safety_sample_277",
              "rewards": [
                0.7925653060717053,
                0.865060351938977,
                0.6543325691048211,
                1.3267103443379913,
                0.7553892103878433
              ],
              "variance": 0.4472951217603557,
              "mean_reward": 0.8788115563682677,
              "min_reward": 0.6543325691048211,
              "max_reward": 1.3267103443379913,
              "num_responses": 5,
              "rvariance": 0.05477294535767101
            },
            {
              "id": "safety_sample_320",
              "rewards": [
                0.9070652763819371,
                0.883965542126147,
                0.938818018811529,
                1.1566372046683988,
                1.1020370643406303,
                0.6831909571595515,
                0.7761164819662187
              ],
              "variance": 0.3849308484281859,
              "mean_reward": 0.9211186493506304,
              "min_reward": 0.6831909571595515,
              "max_reward": 1.1566372046683988,
              "num_responses": 7,
              "rvariance": 0.023960970912365265
            },
            {
              "id": "safety_sample_394",
              "rewards": [
                -1.5526331479695292,
                -1.6923586141586244,
                -1.4142451270902674,
                -1.2204182449129555,
                -1.5524803686363835
              ],
              "variance": 0.3385194298991061,
              "mean_reward": -1.486427100553552,
              "min_reward": -1.6923586141586244,
              "max_reward": -1.2204182449129555,
              "num_responses": 5,
              "rvariance": 0.02542500236136384
            },
            {
              "id": "safety_sample_330",
              "rewards": [
                0.43442299880652896,
                0.149202142022855,
                -0.639534940527827,
                0.46452804117393637,
                0.3712092974278612,
                0.4230528352385225,
                0.3637043257594805
              ],
              "variance": 0.6127577067509097,
              "mean_reward": 0.2237978142716225,
              "min_reward": -0.639534940527827,
              "max_reward": 0.46452804117393637,
              "num_responses": 7,
              "rvariance": 0.1334612158623141
            },
            {
              "id": "safety_sample_310",
              "rewards": [
                1.079279518222398,
                0.82874207464204,
                0.42084880551445275,
                1.0618307408585765,
                0.82874207464204,
                1.0618307408585765,
                0.8835281799777769
              ],
              "variance": 0.40322548481310005,
              "mean_reward": 0.8806860192451229,
              "min_reward": 0.42084880551445275,
              "max_reward": 1.079279518222398,
              "num_responses": 7,
              "rvariance": 0.045988697991991526
            },
            {
              "id": "safety_sample_396",
              "rewards": [
                -0.025792808909820022,
                -0.15953859218275995,
                -0.36931087803994705,
                0.07727125262756813,
                -0.09900792130626232,
                0.07777655148760344,
                -0.043703054997118705
              ],
              "variance": 0.3209208786972171,
              "mean_reward": -0.07747220733153379,
              "min_reward": -0.36931087803994705,
              "max_reward": 0.07777655148760344,
              "num_responses": 7,
              "rvariance": 0.02060390280077379
            },
            {
              "id": "safety_sample_94",
              "rewards": [
                -0.956580859466414,
                -0.08733595594081221,
                -0.05937420725110107,
                -0.18460191655635777,
                -0.21298568684664362,
                0.0013029815104625712,
                -0.17878503129027593
              ],
              "variance": 0.47532042414807607,
              "mean_reward": -0.23976581083444884,
              "min_reward": -0.956580859466414,
              "max_reward": 0.0013029815104625712,
              "num_responses": 7,
              "rvariance": 0.09074183623438417
            },
            {
              "id": "safety_sample_265",
              "rewards": [
                -0.6547214567004372,
                -0.5418676210903699,
                -0.4440656805191983,
                -0.778434521715204,
                -0.5999049833415137,
                0.205156946642676,
                0.08950299145134732
              ],
              "variance": 0.8399712562342228,
              "mean_reward": -0.38919061789609993,
              "min_reward": -0.778434521715204,
              "max_reward": 0.205156946642676,
              "num_responses": 7,
              "rvariance": 0.12501944653243818
            },
            {
              "id": "safety_sample_336",
              "rewards": [
                -0.6115137080813583,
                -0.32686264307294105,
                -0.20346640733100937,
                -0.3841148197348849,
                -0.4347943543475219,
                0.054929779734234886,
                -0.08494157819511824
              ],
              "variance": 0.47648906081767944,
              "mean_reward": -0.28439481871837125,
              "min_reward": -0.6115137080813583,
              "max_reward": 0.054929779734234886,
              "num_responses": 7,
              "rvariance": 0.043263795549087644
            },
            {
              "id": "safety_sample_215",
              "rewards": [
                -0.5677843808372368,
                -0.5645879115925276,
                -0.5225385308682013,
                -0.4750297935631465,
                -1.082142930099129,
                -0.7096556452832601,
                -0.5215404560442902
              ],
              "variance": 0.3557143681577749,
              "mean_reward": -0.6347542354696846,
              "min_reward": -1.082142930099129,
              "max_reward": -0.4750297935631465,
              "num_responses": 7,
              "rvariance": 0.03801382303765271
            },
            {
              "id": "safety_sample_364",
              "rewards": [
                0.031630931429508825,
                -0.24968090331798118,
                -0.21023002354674844,
                -0.728607796331028,
                -0.3058010101671074,
                -0.4056128755718767,
                -0.08896643702077744
              ],
              "variance": 0.4940833542348743,
              "mean_reward": -0.2796097306465729,
              "min_reward": -0.728607796331028,
              "max_reward": 0.031630931429508825,
              "num_responses": 7,
              "rvariance": 0.051012418891277604
            },
            {
              "id": "safety_sample_313",
              "rewards": [
                1.48862106029083,
                0.9066429417089584,
                0.9578825628523285,
                1.0748486044887675,
                1.1545596561955398,
                1.1471918102401055,
                1.1953304492219825
              ],
              "variance": 0.37525997925454113,
              "mean_reward": 1.1321538692855018,
              "min_reward": 0.9066429417089584,
              "max_reward": 1.48862106029083,
              "num_responses": 7,
              "rvariance": 0.030899693935241963
            },
            {
              "id": "safety_sample_389",
              "rewards": [
                1.0256095160068754,
                0.6183768296517012,
                0.9176061111517816,
                1.127786956496172,
                0.8665186431967493,
                0.8855697251241773,
                0.9146278533726515
              ],
              "variance": 0.299218574423864,
              "mean_reward": 0.9080136621428725,
              "min_reward": 0.6183768296517012,
              "max_reward": 1.127786956496172,
              "num_responses": 7,
              "rvariance": 0.021197130000325103
            },
            {
              "id": "safety_sample_77",
              "rewards": [
                -1.247054445044185,
                -0.3118001035723098,
                -0.8345402272337468,
                -0.5527218413366055,
                -0.9950912697360692,
                -0.681813490251872,
                -0.47639979840299446
              ],
              "variance": 0.685316619388595,
              "mean_reward": -0.7284887393682548,
              "min_reward": -1.247054445044185,
              "max_reward": -0.3118001035723098,
              "num_responses": 7,
              "rvariance": 0.08878357900891405
            },
            {
              "id": "safety_sample_269",
              "rewards": [
                -0.23330345972060373,
                -0.19272301471578526,
                -0.23714423197271847,
                -0.6025372961142379,
                -0.2225206199824772,
                -0.07078006107316206,
                -0.15766767149653255
              ],
              "variance": 0.2603888303021419,
              "mean_reward": -0.24523947929650247,
              "min_reward": -0.6025372961142379,
              "max_reward": -0.07078006107316206,
              "num_responses": 7,
              "rvariance": 0.024178395320576994
            },
            {
              "id": "safety_sample_361",
              "rewards": [
                0.3528807866088356,
                0.2931747484444402,
                0.2647941088781942,
                0.3939371016677146,
                -0.1796503634148965
              ],
              "variance": 0.3793871501418232,
              "mean_reward": 0.22502727643685763,
              "min_reward": -0.1796503634148965,
              "max_reward": 0.3939371016677146,
              "num_responses": 5,
              "rvariance": 0.04297330404444847
            },
            {
              "id": "safety_sample_254",
              "rewards": [
                0.11904575578119372,
                -0.18152754554920364,
                0.3738228258563462,
                0.2883421628164941,
                0.25225180222965976,
                -0.04910292782108962,
                0.27259775161997873
              ],
              "variance": 0.42460720294477017,
              "mean_reward": 0.15363283213333992,
              "min_reward": -0.18152754554920364,
              "max_reward": 0.3738228258563462,
              "num_responses": 7,
              "rvariance": 0.03501987477476525
            },
            {
              "id": "safety_sample_355",
              "rewards": [
                -1.5274708927162715,
                -1.3812898735569608,
                -1.0888514455717664,
                -1.3159666903202274,
                -1.2788863947919855,
                -1.2305480156163646,
                -1.2874332714208356
              ],
              "variance": 0.2658928936221596,
              "mean_reward": -1.3014923691420588,
              "min_reward": -1.5274708927162715,
              "max_reward": -1.0888514455717664,
              "num_responses": 7,
              "rvariance": 0.01551448468289325
            },
            {
              "id": "safety_sample_317",
              "rewards": [
                -0.023885571824730112,
                -0.1970715904071672,
                -0.08003260290059924,
                -0.11146381997129633,
                -0.2162147156213674,
                -0.586318893298086,
                -0.26575153595945117
              ],
              "variance": 0.3364046884246535,
              "mean_reward": -0.21153410428324246,
              "min_reward": -0.586318893298086,
              "max_reward": -0.023885571824730112,
              "num_responses": 7,
              "rvariance": 0.029450416972367964
            },
            {
              "id": "safety_sample_291",
              "rewards": [
                0.3454810072681946,
                0.1872589103791328,
                0.22672638298777686,
                0.5802771703760772,
                0.17693159098880765,
                -0.01665860845109001,
                0.31321263458923576
              ],
              "variance": 0.3399039612984991,
              "mean_reward": 0.2590327268768764,
              "min_reward": -0.01665860845109001,
              "max_reward": 0.5802771703760772,
              "num_responses": 7,
              "rvariance": 0.02893546422008683
            },
            {
              "id": "safety_sample_193",
              "rewards": [
                -0.9747115085261197,
                -1.193540352885848,
                -1.309405945022272,
                -0.9556792109429308,
                -1.5084699023734816,
                -1.1765918652235978,
                -1.1782812039155126
              ],
              "variance": 0.42193293846991176,
              "mean_reward": -1.1852399984128232,
              "min_reward": -1.5084699023734816,
              "max_reward": -0.9556792109429308,
              "num_responses": 7,
              "rvariance": 0.031015323460357434
            },
            {
              "id": "safety_sample_213",
              "rewards": [
                0.7253211105641065,
                0.913761268958415,
                0.9664563637079214,
                0.7544819265610885,
                0.7742812515340458,
                0.7275298363742361,
                0.5840547020025865
              ],
              "variance": 0.2660247597187191,
              "mean_reward": 0.7779837799574858,
              "min_reward": 0.5840547020025865,
              "max_reward": 0.9664563637079214,
              "num_responses": 7,
              "rvariance": 0.013921561660275727
            },
            {
              "id": "safety_sample_332",
              "rewards": [
                -1.0751125761951927,
                -1.0591540234743502,
                -1.111670040808776,
                -0.5022076089532738,
                -0.7229787545073385,
                -0.6266338529043233,
                -0.8653415426276216
              ],
              "variance": 0.5128722067167227,
              "mean_reward": -0.851871199924411,
              "min_reward": -1.111670040808776,
              "max_reward": -0.5022076089532738,
              "num_responses": 7,
              "rvariance": 0.05001278867208297
            },
            {
              "id": "safety_sample_204",
              "rewards": [
                -0.15325585517954518,
                0.741722347664187,
                0.5233543458831278,
                0.8867271538017178,
                0.6891374544008839,
                0.7563566041161638,
                0.8710099799043494
              ],
              "variance": 0.6245865840052381,
              "mean_reward": 0.6164360043701265,
              "min_reward": -0.15325585517954518,
              "max_reward": 0.8867271538017178,
              "num_responses": 7,
              "rvariance": 0.11135927302427635
            },
            {
              "id": "safety_sample_351",
              "rewards": [
                1.2060049659083294,
                1.1439859488232766,
                1.2454273560907994,
                1.3288470634952039,
                1.2606915142195982,
                0.9786708835494814,
                1.295817611802152
              ],
              "variance": 0.23116946976561414,
              "mean_reward": 1.2084921919841203,
              "min_reward": 0.9786708835494814,
              "max_reward": 1.3288470634952039,
              "num_responses": 7,
              "rvariance": 0.011883582163308986
            },
            {
              "id": "safety_sample_399",
              "rewards": [
                -0.10199838890914788,
                -0.6326999438039789,
                -0.40288351035391645,
                -0.4435403450253078,
                -0.35503602870774753,
                -0.5238440427928279,
                -0.44240577063325826
              ],
              "variance": 0.3135654304089807,
              "mean_reward": -0.41462971860374065,
              "min_reward": -0.6326999438039789,
              "max_reward": -0.10199838890914788,
              "num_responses": 7,
              "rvariance": 0.023216779243381825
            },
            {
              "id": "safety_sample_368",
              "rewards": [
                1.3984537033632898,
                1.0026935552522258,
                1.0904001630844267,
                1.1568316226312747,
                0.8650550297081092,
                1.1832129818256587,
                1.151650587417691
              ],
              "variance": 0.32167112540613196,
              "mean_reward": 1.1211853776118108,
              "min_reward": 0.8650550297081092,
              "max_reward": 1.3984537033632898,
              "num_responses": 7,
              "rvariance": 0.023359246922700815
            },
            {
              "id": "safety_sample_366",
              "rewards": [
                0.9035914249872954,
                0.9806974012204904,
                0.6327537405876006,
                0.9710525796708572,
                1.1212374818047601,
                0.932371544941029,
                0.942190121674875
              ],
              "variance": 0.24165708222678084,
              "mean_reward": 0.9262706135552726,
              "min_reward": 0.6327537405876006,
              "max_reward": 1.1212374818047601,
              "num_responses": 7,
              "rvariance": 0.018562418833301616
            },
            {
              "id": "safety_sample_324",
              "rewards": [
                -1.6107875992997642,
                -1.4141198981286724,
                -1.2413928436904806,
                -1.525651315904298,
                -1.4757663590529806,
                -1.592667594701794,
                -1.3477886217511004
              ],
              "variance": 0.2946852860141298,
              "mean_reward": -1.4583106046470127,
              "min_reward": -1.6107875992997642,
              "max_reward": -1.2413928436904806,
              "num_responses": 7,
              "rvariance": 0.015337393099094857
            },
            {
              "id": "safety_sample_340",
              "rewards": [
                0.1770233212031759,
                0.24233429461615383,
                0.22213548925570883,
                0.3643041724855199,
                0.4571232526748315,
                0.3334903341954855,
                0.2964939420715123
              ],
              "variance": 0.1973411825265489,
              "mean_reward": 0.29898640092891254,
              "min_reward": 0.1770233212031759,
              "max_reward": 0.4571232526748315,
              "num_responses": 7,
              "rvariance": 0.007780132216301845
            },
            {
              "id": "safety_sample_206",
              "rewards": [
                0.5141459472646528,
                0.3696063667194468,
                0.438891168156234,
                0.06885711869800865,
                0.3136058535286437,
                0.5195599083468031
              ],
              "variance": 0.3256214416924017,
              "mean_reward": 0.3707777271189649,
              "min_reward": 0.06885711869800865,
              "max_reward": 0.5195599083468031,
              "num_responses": 6,
              "rvariance": 0.02362601230881448
            },
            {
              "id": "safety_sample_371",
              "rewards": [
                0.690921340958803,
                0.4553806916742389,
                0.7614734594869302,
                0.5166639886099217,
                0.7054973659436381,
                0.5940492254274733
              ],
              "variance": 0.24746307257320382,
              "mean_reward": 0.6206643453501676,
              "min_reward": 0.4553806916742389,
              "max_reward": 0.7614734594869302,
              "num_responses": 6,
              "rvariance": 0.011800503070334332
            },
            {
              "id": "safety_sample_308",
              "rewards": [
                -0.3905484576368215,
                -0.0399274018050333,
                0.06870496550967087,
                0.1211345748605962,
                -0.2988407844816644,
                0.241450804292102,
                0.1617976709800673
              ],
              "variance": 0.5291827780486085,
              "mean_reward": -0.019461232611583272,
              "min_reward": -0.3905484576368215,
              "max_reward": 0.241450804292102,
              "num_responses": 7,
              "rvariance": 0.049235409623414536
            },
            {
              "id": "safety_sample_385",
              "rewards": [
                -1.1550117844167613,
                -1.2711209468834874,
                -0.9469451170164965,
                -0.9105078722060443,
                -1.3733365822060704,
                -1.1948840596437609,
                -1.0084344155940028
              ],
              "variance": 0.3796369819202049,
              "mean_reward": -1.1228915397095176,
              "min_reward": -1.3733365822060704,
              "max_reward": -0.9105078722060443,
              "num_responses": 7,
              "rvariance": 0.025724815521467683
            },
            {
              "id": "safety_sample_171",
              "rewards": [
                -0.9311931920822855,
                -1.4743387488907989,
                -1.147353407270427,
                -1.1682528686709952,
                -1.6063131685019794,
                -1.6171285677701206,
                -1.7845133547066752
              ],
              "variance": 0.6231931613495723,
              "mean_reward": -1.3898704725561832,
              "min_reward": -1.7845133547066752,
              "max_reward": -0.9311931920822855,
              "num_responses": 7,
              "rvariance": 0.08281218764815686
            },
            {
              "id": "safety_sample_212",
              "rewards": [
                0.6521235302222874,
                0.2506363486250859,
                0.28603200154747266,
                0.7002051900266388,
                0.5631220549271956,
                0.7958131191906682,
                0.5792527974702311
              ],
              "variance": 0.4665746213137326,
              "mean_reward": 0.5467407202870829,
              "min_reward": 0.2506363486250859,
              "max_reward": 0.7958131191906682,
              "num_responses": 7,
              "rvariance": 0.03623802260420269
            },
            {
              "id": "safety_sample_338",
              "rewards": [
                -1.120071025697368,
                -0.8566581664306332,
                -0.8502946567471897,
                -0.8397729193939886,
                -0.36916060328603323,
                -0.7713240212758471
              ],
              "variance": 0.4181222837830605,
              "mean_reward": -0.8012135654718433,
              "min_reward": -1.120071025697368,
              "max_reward": -0.36916060328603323,
              "num_responses": 6,
              "rvariance": 0.049367184666400186
            },
            {
              "id": "safety_sample_369",
              "rewards": [
                1.3943530810158657,
                0.8018563558048328,
                0.968275314375087,
                1.2645366694853688,
                0.9802769449819356,
                1.0173494137000778,
                1.0967793263880696
              ],
              "variance": 0.4147555031505824,
              "mean_reward": 1.0747753008216052,
              "min_reward": 0.8018563558048328,
              "max_reward": 1.3943530810158657,
              "num_responses": 7,
              "rvariance": 0.03381116874320533
            },
            {
              "id": "safety_sample_20",
              "rewards": [
                -0.6239984094075591,
                -0.8499916026601302,
                -0.7448042840789009,
                -0.7891146737048227,
                -0.5035162516019401,
                -0.6794109726236743,
                -0.761973800858366
              ],
              "variance": 0.2376598990016342,
              "mean_reward": -0.7075442849907704,
              "min_reward": -0.8499916026601302,
              "max_reward": -0.5035162516019401,
              "num_responses": 7,
              "rvariance": 0.011527811622287009
            },
            {
              "id": "safety_sample_377",
              "rewards": [
                0.6924027995744703,
                0.05541003280195122,
                0.1889278993647885,
                0.1974271889882325,
                0.198831005647711,
                0.37652526684756354
              ],
              "variance": 0.412295067127647,
              "mean_reward": 0.28492069887078614,
              "min_reward": 0.05541003280195122,
              "max_reward": 0.6924027995744703,
              "num_responses": 6,
              "rvariance": 0.041898228702545004
            },
            {
              "id": "safety_sample_383",
              "rewards": [
                0.07571152591090399,
                0.4107434544585545,
                0.42019197961088767,
                0.3558092658757317,
                0.28100812868069036,
                0.49898541610157354,
                0.4656657462900258
              ],
              "variance": 0.280104126641869,
              "mean_reward": 0.3583022167040525,
              "min_reward": 0.07571152591090399,
              "max_reward": 0.49898541610157354,
              "num_responses": 7,
              "rvariance": 0.017676743659701972
            },
            {
              "id": "safety_sample_278",
              "rewards": [
                -4.226096157473828,
                -4.245844764717339,
                -4.454987148897704,
                -4.4198654343288055,
                -4.084675091144738,
                -4.521536323668451,
                -4.765369634789828
              ],
              "variance": 0.44954191717480985,
              "mean_reward": -4.388339222145814,
              "min_reward": -4.765369634789828,
              "max_reward": -4.084675091144738,
              "num_responses": 7,
              "rvariance": 0.043452662142301667
            },
            {
              "id": "safety_sample_199",
              "rewards": [
                0.5570703653581233,
                0.6178508680130027,
                0.9150771122723731,
                0.8953438455766571
              ],
              "variance": 0.33385261610907124,
              "mean_reward": 0.7463355478050391,
              "min_reward": 0.5570703653581233,
              "max_reward": 0.9150771122723731,
              "num_responses": 4,
              "rvariance": 0.02575170265290127
            },
            {
              "id": "safety_sample_379",
              "rewards": [
                -1.367018781093609,
                -1.689730058254748,
                -1.458266863959713,
                -1.3101823645841602,
                -1.244780287101622,
                -1.2677810904777522,
                -1.466203875545596
              ],
              "variance": 0.29703357950195675,
              "mean_reward": -1.4005661887167429,
              "min_reward": -1.689730058254748,
              "max_reward": -1.244780287101622,
              "num_responses": 7,
              "rvariance": 0.02034988728305238
            },
            {
              "id": "safety_sample_73",
              "rewards": [
                -3.1745961539670877,
                -2.0573459364645763,
                -2.039275397306436,
                -2.934142772519157,
                -2.3489929174124913,
                -2.289330083239846,
                -1.9786457955502788
              ],
              "variance": 1.015300568494356,
              "mean_reward": -2.4031898652085535,
              "min_reward": -3.1745961539670877,
              "max_reward": -1.9786457955502788,
              "num_responses": 7,
              "rvariance": 0.1893084916139612
            },
            {
              "id": "safety_sample_314",
              "rewards": [
                -1.109204908699781,
                -0.700109441540883,
                -0.8050638342535457,
                -0.9367896743759603,
                -1.377251239545526,
                -0.834170801797042,
                -0.8331395412983081
              ],
              "variance": 0.45334136386959845,
              "mean_reward": -0.9422470630730067,
              "min_reward": -1.377251239545526,
              "max_reward": -0.700109441540883,
              "num_responses": 7,
              "rvariance": 0.04545259063514754
            },
            {
              "id": "safety_sample_97",
              "rewards": [
                0.545525507388692,
                0.26020196285651026,
                0.5843749750718653,
                0.4620553953272456,
                0.22344726262841513,
                0.5474224130844504,
                0.5673986239656604
              ],
              "variance": 0.32868908164287014,
              "mean_reward": 0.45577516290326264,
              "min_reward": 0.22344726262841513,
              "max_reward": 0.5843749750718653,
              "num_responses": 7,
              "rvariance": 0.019673803241760105
            },
            {
              "id": "safety_sample_35",
              "rewards": [
                -0.022317079080754334,
                -0.07455508812043951,
                -0.3252590862197187,
                0.07654805537435774,
                -0.2765312449735378,
                -0.03202420203878088,
                0.27175182998440534
              ],
              "variance": 0.450651946690387,
              "mean_reward": -0.05462668786778117,
              "min_reward": -0.3252590862197187,
              "max_reward": 0.27175182998440534,
              "num_responses": 7,
              "rvariance": 0.03545217171490085
            },
            {
              "id": "safety_sample_107",
              "rewards": [
                1.2046543715575286,
                1.0057056248509864,
                1.3097396285350582,
                0.9910704291817977,
                1.1460240501732333,
                1.152626121028515
              ],
              "variance": 0.25880897302990125,
              "mean_reward": 1.1349700375545198,
              "min_reward": 0.9910704291817977,
              "max_reward": 1.3097396285350582,
              "num_responses": 6,
              "rvariance": 0.012208438416162528
            },
            {
              "id": "safety_sample_131",
              "rewards": [
                1.3963598751254236,
                1.0193994118013858,
                1.2129589301456927,
                1.2393931985763504,
                1.020030565767824,
                1.1762759234981106,
                1.3430232950201473
              ],
              "variance": 0.3445798228810093,
              "mean_reward": 1.2010630285621335,
              "min_reward": 1.0193994118013858,
              "max_reward": 1.3963598751254236,
              "num_responses": 7,
              "rvariance": 0.01804187325080341
            },
            {
              "id": "safety_sample_187",
              "rewards": [
                1.1545690483676594,
                0.80016639096811,
                1.1384968503641695,
                1.1772630407878821,
                1.0357950135981944,
                1.3303109900562478,
                1.1270872396732605
              ],
              "variance": 0.29693865594906776,
              "mean_reward": 1.1090983676879318,
              "min_reward": 0.80016639096811,
              "max_reward": 1.3303109900562478,
              "num_responses": 7,
              "rvariance": 0.02252132114502279
            },
            {
              "id": "safety_sample_177",
              "rewards": [
                1.3675362381075358,
                1.2222120981179379,
                1.0708991961124692,
                1.4434303110648963,
                1.2321825149677177,
                1.4930529132416726,
                1.3345656440264337
              ],
              "variance": 0.30159241461985653,
              "mean_reward": 1.309125559376952,
              "min_reward": 1.0708991961124692,
              "max_reward": 1.4930529132416726,
              "num_responses": 7,
              "rvariance": 0.018021717872511948
            },
            {
              "id": "safety_sample_72",
              "rewards": [
                0.40645091872748623,
                0.13016483528120246,
                0.5190802814238947,
                0.5126297376121429,
                0.6040180769152331,
                0.3625490885887678,
                0.42272473535914395
              ],
              "variance": 0.2834600123546885,
              "mean_reward": 0.42251681055826734,
              "min_reward": 0.13016483528120246,
              "max_reward": 0.6040180769152331,
              "num_responses": 7,
              "rvariance": 0.019958787779524312
            },
            {
              "id": "safety_sample_376",
              "rewards": [
                -0.16724893934815627,
                -0.4029173221735471,
                -0.19668525906064702,
                -0.36234313861680834,
                -0.4084242657596816,
                -0.2013337581150487
              ],
              "variance": 0.2237036947622127,
              "mean_reward": -0.2898254471789815,
              "min_reward": -0.4084242657596816,
              "max_reward": -0.16724893934815627,
              "num_responses": 6,
              "rvariance": 0.010607523579683831
            },
            {
              "id": "safety_sample_224",
              "rewards": [
                0.8318655980166202,
                0.8957026265516264,
                0.6403100561302352,
                0.7333864818356243,
                0.9019271320876996,
                0.7441856013387581
              ],
              "variance": 0.21196661033673325,
              "mean_reward": 0.7912295826600939,
              "min_reward": 0.6403100561302352,
              "max_reward": 0.9019271320876996,
              "num_responses": 6,
              "rvariance": 0.008859252345473965
            },
            {
              "id": "safety_sample_253",
              "rewards": [
                0.6740946384617039,
                0.07684610030295354,
                0.21476826944508248,
                0.20794955248624167,
                0.5262662323126126
              ],
              "variance": 0.4856757948257986,
              "mean_reward": 0.33998495860171885,
              "min_reward": 0.07684610030295354,
              "max_reward": 0.6740946384617039,
              "num_responses": 5,
              "rvariance": 0.0497369235139402
            },
            {
              "id": "safety_sample_307",
              "rewards": [
                0.09859524020794305,
                0.466881719507112,
                0.23632267831479195,
                0.407311554766047,
                -0.05040781360090819
              ],
              "variance": 0.4338602456880537,
              "mean_reward": 0.23174067583899713,
              "min_reward": -0.05040781360090819,
              "max_reward": 0.466881719507112,
              "num_responses": 5,
              "rvariance": 0.03669458316276777
            },
            {
              "id": "safety_sample_319",
              "rewards": [
                -2.584570509240726,
                -2.436199861687929,
                -2.3902358236241468,
                -2.3784736934063484,
                -2.2490940178794134,
                -2.4360896602017252
              ],
              "variance": 0.1966013298214464,
              "mean_reward": -2.4124439276733813,
              "min_reward": -2.584570509240726,
              "max_reward": -2.2490940178794134,
              "num_responses": 6,
              "rvariance": 0.009846899146846898
            },
            {
              "id": "safety_sample_205",
              "rewards": [
                0.7031170764561236,
                0.5291762403076734,
                0.502416689649273,
                0.33620780266209427,
                0.36316834580385443,
                0.5113686819688825,
                0.6258254482873642
              ],
              "variance": 0.3043579710077176,
              "mean_reward": 0.5101828978764665,
              "min_reward": 0.33620780266209427,
              "max_reward": 0.7031170764561236,
              "num_responses": 7,
              "rvariance": 0.014699982305222249
            },
            {
              "id": "safety_sample_348",
              "rewards": [
                0.7776276824602648,
                0.5196979732769614,
                0.7163515861898737,
                0.9195549868666018,
                0.4923135301002027,
                0.6628594090998159,
                0.8922851281897023
              ],
              "variance": 0.39444887565420406,
              "mean_reward": 0.7115271851690604,
              "min_reward": 0.4923135301002027,
              "max_reward": 0.9195549868666018,
              "num_responses": 7,
              "rvariance": 0.023937596623262485
            },
            {
              "id": "safety_sample_354",
              "rewards": [
                -0.456431414331884,
                -0.40970347960237324,
                -0.4021997602236085,
                -0.06954718194626056,
                -0.4641711903032551,
                -0.3046351285346591,
                -0.25136210212739235
              ],
              "variance": 0.2808911906654929,
              "mean_reward": -0.3368643224384904,
              "min_reward": -0.4641711903032551,
              "max_reward": -0.06954718194626056,
              "num_responses": 7,
              "rvariance": 0.0171264849335798
            },
            {
              "id": "safety_sample_11",
              "rewards": [
                0.19013823727860293,
                -0.19774469607573966,
                0.3133660400671895,
                0.35999253933780845,
                0.09404755046762525,
                0.30690798251774193,
                0.20826012031099694
              ],
              "variance": 0.35468598792515776,
              "mean_reward": 0.18213825341488935,
              "min_reward": -0.19774469607573966,
              "max_reward": 0.35999253933780845,
              "num_responses": 7,
              "rvariance": 0.03103396332037326
            },
            {
              "id": "safety_sample_341",
              "rewards": [
                -2.7716788576284728,
                -2.6962866397347036,
                -2.7223455343529808,
                -2.93089934241385,
                -2.6713122279238384,
                -2.581296398039828,
                -2.6783638707512454
              ],
              "variance": 0.20006115557238946,
              "mean_reward": -2.7217404101207023,
              "min_reward": -2.93089934241385,
              "max_reward": -2.581296398039828,
              "num_responses": 7,
              "rvariance": 0.010148373479488349
            },
            {
              "id": "safety_sample_196",
              "rewards": [
                -0.9629186972127305,
                -0.2130639549476404,
                -0.9434956852693658,
                -1.2072504196012546,
                -0.8714364361884441,
                -0.680445989991256,
                -0.5064841779917386
              ],
              "variance": 0.6715352973940409,
              "mean_reward": -0.7692993373146327,
              "min_reward": -1.2072504196012546,
              "max_reward": -0.2130639549476404,
              "num_responses": 7,
              "rvariance": 0.09377578392970551
            },
            {
              "id": "safety_sample_236",
              "rewards": [
                0.7173546701722486,
                0.7687567758932881,
                0.8339487817927509,
                0.8001347706553074,
                0.6284402290054651,
                0.7283929769920287,
                0.8330418110384
              ],
              "variance": 0.15161570563460514,
              "mean_reward": 0.7585814307927841,
              "min_reward": 0.6284402290054651,
              "max_reward": 0.8339487817927509,
              "num_responses": 7,
              "rvariance": 0.004657503494501368
            },
            {
              "id": "safety_sample_346",
              "rewards": [
                0.8853609058307178,
                0.6803366760524003,
                0.5586429280433509,
                0.6941153056242801,
                0.8732766241092166,
                0.7856420229299327,
                1.1334939533484543
              ],
              "variance": 0.35295494798903193,
              "mean_reward": 0.8015526308483361,
              "min_reward": 0.5586429280433509,
              "max_reward": 1.1334939533484543,
              "num_responses": 7,
              "rvariance": 0.02969250820820944
            },
            {
              "id": "safety_sample_267",
              "rewards": [
                -0.19346249173400298,
                0.4987769098805181,
                0.6459876241765427,
                0.6866360058930264,
                0.6139030249987244,
                0.6216521931422151,
                0.6582929350152589
              ],
              "variance": 0.4477490141316562,
              "mean_reward": 0.5045408859103261,
              "min_reward": -0.19346249173400298,
              "max_reward": 0.6866360058930264,
              "num_responses": 7,
              "rvariance": 0.08424608278024963
            },
            {
              "id": "safety_sample_279",
              "rewards": [
                -3.9309026923335457,
                -4.125358223898064,
                -4.381966141391733,
                -4.398656657393098,
                -4.386799979309296,
                -4.275185910419017,
                -4.355147106976576
              ],
              "variance": 0.34396663927056004,
              "mean_reward": -4.2648595302459045,
              "min_reward": -4.398656657393098,
              "max_reward": -3.9309026923335457,
              "num_responses": 7,
              "rvariance": 0.02653305248931945
            },
            {
              "id": "safety_sample_56",
              "rewards": [
                0.5741522218644719,
                0.40041832657505727,
                0.2773974646455062,
                0.5797058132388005,
                0.5596563434150574,
                0.5641952671280636,
                0.6387985425637851
              ],
              "variance": 0.2521329231655575,
              "mean_reward": 0.5134748542043917,
              "min_reward": 0.2773974646455062,
              "max_reward": 0.6387985425637851,
              "num_responses": 7,
              "rvariance": 0.013856273182597042
            },
            {
              "id": "safety_sample_257",
              "rewards": [
                0.3364961423461665,
                -0.00865084250190588,
                0.33496490521826516,
                0.24065246966193468,
                0.08393280723960739,
                0.2695647061701509,
                0.2559842514299949
              ],
              "variance": 0.2886780527264236,
              "mean_reward": 0.21613491993774478,
              "min_reward": -0.00865084250190588,
              "max_reward": 0.3364961423461665,
              "num_responses": 7,
              "rvariance": 0.014522464054363183
            },
            {
              "id": "safety_sample_256",
              "rewards": [
                0.12292847973544276,
                0.2397389243871001,
                0.5626640300001623,
                0.498705216300005,
                0.5854447434762896,
                0.5246629885317942,
                0.2980417720368249
              ],
              "variance": 0.3787615688641761,
              "mean_reward": 0.40459802206680273,
              "min_reward": 0.12292847973544276,
              "max_reward": 0.5854447434762896,
              "num_responses": 7,
              "rvariance": 0.02840466389608704
            },
            {
              "id": "safety_sample_202",
              "rewards": [
                1.0681951897592319,
                0.8484268151151381,
                1.052265126627152,
                1.0506199311441995,
                0.911589172619552,
                1.078185017098059,
                0.9736420015242353
              ],
              "variance": 0.1858668910769763,
              "mean_reward": 0.997560464841081,
              "min_reward": 0.8484268151151381,
              "max_reward": 1.078185017098059,
              "num_responses": 7,
              "rvariance": 0.006785927318665753
            },
            {
              "id": "safety_sample_356",
              "rewards": [
                -0.17076787316897218,
                -0.08263047770888488,
                -0.5268075861689705,
                -0.3911389121907413,
                -0.8737500412539094,
                -0.6439855778229088
              ],
              "variance": 0.6321686340994807,
              "mean_reward": -0.4481800780523979,
              "min_reward": -0.8737500412539094,
              "max_reward": -0.08263047770888488,
              "num_responses": 6,
              "rvariance": 0.07324493478079667
            },
            {
              "id": "safety_sample_272",
              "rewards": [
                -0.009308920695086936,
                0.20597876170314236,
                0.2860880415077864,
                0.33575666532794873,
                0.5045568526029294,
                0.38463540747285146,
                0.5218960546253555
              ],
              "variance": 0.39162884466804915,
              "mean_reward": 0.3185146946492753,
              "min_reward": -0.009308920695086936,
              "max_reward": 0.5218960546253555,
              "num_responses": 7,
              "rvariance": 0.028832720450631094
            },
            {
              "id": "safety_sample_268",
              "rewards": [
                0.41525701930683767,
                0.5296126632388315,
                0.7326654760892418,
                0.6753660254942958,
                0.6550673500369789,
                0.7895328867666854,
                0.7329193778088754
              ],
              "variance": 0.2716943757259655,
              "mean_reward": 0.6472029712488209,
              "min_reward": 0.41525701930683767,
              "max_reward": 0.7895328867666854,
              "num_responses": 7,
              "rvariance": 0.014770051168114877
            },
            {
              "id": "safety_sample_138",
              "rewards": [
                1.160684604707145,
                0.8776821789781242,
                0.9858289709942443,
                1.261383717304814,
                0.9558751425979627,
                1.1458214923278536,
                1.1255478626628557
              ],
              "variance": 0.2763662925961855,
              "mean_reward": 1.0732605670818571,
              "min_reward": 0.8776821789781242,
              "max_reward": 1.261383717304814,
              "num_responses": 7,
              "rvariance": 0.015815265560741813
            },
            {
              "id": "safety_sample_283",
              "rewards": [
                0.4960484838797698,
                0.7032394877660826,
                0.978631436426579,
                0.6596842287785779
              ],
              "variance": 0.35087464447901795,
              "mean_reward": 0.7094009092127523,
              "min_reward": 0.4960484838797698,
              "max_reward": 0.978631436426579,
              "num_responses": 4,
              "rvariance": 0.030128511401734562
            },
            {
              "id": "safety_sample_305",
              "rewards": [
                -0.691826798020998,
                -0.5830641925862352,
                -0.6044965032183897,
                -0.5665164376010887,
                -0.4665474098495178,
                -0.7177992846557746
              ],
              "variance": 0.18828111761308308,
              "mean_reward": -0.6050417709886674,
              "min_reward": -0.7177992846557746,
              "max_reward": -0.4665474098495178,
              "num_responses": 6,
              "rvariance": 0.006899016409121974
            },
            {
              "id": "safety_sample_334",
              "rewards": [
                -0.29297693835498445,
                -0.410980188865833,
                -0.4471488175536641,
                -0.5020135040628018,
                -0.4341356500095329,
                -0.4449454139744023,
                -0.43655006438908206
              ],
              "variance": 0.10531580349582559,
              "mean_reward": -0.4241072253157573,
              "min_reward": -0.5020135040628018,
              "max_reward": -0.29297693835498445,
              "num_responses": 7,
              "rvariance": 0.0035224854482941576
            },
            {
              "id": "safety_sample_363",
              "rewards": [
                -0.1334577824962038,
                0.24352710047534498,
                -0.07005874225437561,
                0.3731052639064075,
                0.16540426507399963,
                0.18226321402870937,
                0.009434097986817653
              ],
              "variance": 0.3907767241988769,
              "mean_reward": 0.11003105953152852,
              "min_reward": -0.1334577824962038,
              "max_reward": 0.3731052639064075,
              "num_responses": 7,
              "rvariance": 0.028164543937403193
            },
            {
              "id": "safety_sample_167",
              "rewards": [
                1.0237511182168075,
                0.9203655313205246,
                0.9311568240135588,
                1.0237063488630374,
                0.6775130760408399,
                0.9862907527901253,
                1.0148861600255066
              ],
              "variance": 0.20049970739589473,
              "mean_reward": 0.9396671158957715,
              "min_reward": 0.6775130760408399,
              "max_reward": 1.0237511182168075,
              "num_responses": 7,
              "rvariance": 0.013019156726913558
            },
            {
              "id": "safety_sample_1",
              "rewards": [
                -0.9250669912810643,
                -1.1281370231136938,
                -0.5707955112187855,
                -0.5861128916562623,
                -0.94930255221852,
                -1.193999317030093,
                -0.7114025892975085
              ],
              "variance": 0.5744960011989819,
              "mean_reward": -0.8664024108308467,
              "min_reward": -1.193999317030093,
              "max_reward": -0.5707955112187855,
              "num_responses": 7,
              "rvariance": 0.05372990071320115
            },
            {
              "id": "safety_sample_29",
              "rewards": [
                -0.1279308022762141,
                -0.0014082255080664215,
                0.18732434251156613,
                0.19394269313185517,
                0.31874211938845737,
                0.16329791393997387,
                0.030000450349543586
              ],
              "variance": 0.2958797198498216,
              "mean_reward": 0.10913835593387365,
              "min_reward": -0.1279308022762141,
              "max_reward": 0.31874211938845737,
              "num_responses": 7,
              "rvariance": 0.019265280003667246
            },
            {
              "id": "safety_sample_179",
              "rewards": [
                0.8970832758532099,
                0.823394171837131,
                1.044890080006426,
                0.3964266534242207,
                1.0443487778199323,
                1.2102236165520568,
                0.9831446882024582
              ],
              "variance": 0.45841633015271155,
              "mean_reward": 0.9142158948136335,
              "min_reward": 0.3964266534242207,
              "max_reward": 1.2102236165520568,
              "num_responses": 7,
              "rvariance": 0.05757569575680423
            },
            {
              "id": "safety_sample_160",
              "rewards": [
                1.0561534858846728,
                0.7628797807256407,
                0.7747555562260865,
                0.8103584630799128,
                0.9302044577606298,
                0.8843374721420837
              ],
              "variance": 0.22436130334678772,
              "mean_reward": 0.8697815359698379,
              "min_reward": 0.7628797807256407,
              "max_reward": 1.0561534858846728,
              "num_responses": 6,
              "rvariance": 0.010431055360479308
            },
            {
              "id": "safety_sample_23",
              "rewards": [
                -1.6963484088750371,
                -1.5329972467914532,
                -1.2076974869941484,
                -1.3136562159788019,
                -1.3064405232117053,
                -1.455920073219425,
                -0.96424800264006
              ],
              "variance": 0.48802001837237374,
              "mean_reward": -1.3539011368158043,
              "min_reward": -1.6963484088750371,
              "max_reward": -0.96424800264006,
              "num_responses": 7,
              "rvariance": 0.0481186642607363
            },
            {
              "id": "safety_sample_350",
              "rewards": [
                -0.4506220428034979,
                -0.1265019398244166,
                -0.026829078567017595,
                -0.3354915446716358,
                -0.10562251505770348,
                0.07349935630433058
              ],
              "variance": 0.41639193260622337,
              "mean_reward": -0.1619279607699901,
              "min_reward": -0.4506220428034979,
              "max_reward": 0.07349935630433058,
              "num_responses": 6,
              "rvariance": 0.03192860440535902
            },
            {
              "id": "safety_sample_367",
              "rewards": [
                -0.0584650449899223,
                -0.17894156749226953,
                -0.058030500493188086,
                -0.05940989750515561,
                -0.0041056573408199785,
                -0.06876387479148462,
                -0.20602733959562453
              ],
              "variance": 0.1533153131013707,
              "mean_reward": -0.09053484031549495,
              "min_reward": -0.20602733959562453,
              "max_reward": -0.0041056573408199785,
              "num_responses": 7,
              "rvariance": 0.00459314447915027
            },
            {
              "id": "safety_sample_303",
              "rewards": [
                -0.7062957522436696,
                -0.623610825771423,
                -0.20062308375799778,
                -0.37360247455380335
              ],
              "variance": 0.4289733733052562,
              "mean_reward": -0.4760330340817234,
              "min_reward": -0.7062957522436696,
              "max_reward": -0.20062308375799778,
              "num_responses": 4,
              "rvariance": 0.040285696059464
            },
            {
              "id": "safety_sample_18",
              "rewards": [
                0.924703775622575,
                0.6247863609785308,
                0.5262355512170218,
                0.6738388583076463,
                0.7460064304403475,
                0.5492291539278603,
                0.7780093177207252
              ],
              "variance": 0.2966553880379402,
              "mean_reward": 0.6889727783163867,
              "min_reward": 0.5262355512170218,
              "max_reward": 0.924703775622575,
              "num_responses": 7,
              "rvariance": 0.016730009037342803
            },
            {
              "id": "safety_sample_30",
              "rewards": [
                -0.6307351013965553,
                -0.4407176842309594,
                -0.47267235836112304,
                -0.2795167034179596,
                -0.6258511718943554,
                -0.692827377424141,
                -0.6904455225746066
              ],
              "variance": 0.3151609726086609,
              "mean_reward": -0.5475379884713857,
              "min_reward": -0.692827377424141,
              "max_reward": -0.2795167034179596,
              "num_responses": 7,
              "rvariance": 0.020491019050595024
            },
            {
              "id": "safety_sample_263",
              "rewards": [
                0.6207283164780489,
                0.43475861242360325,
                0.8533013524452184,
                0.7188129614300209,
                0.8562999599306077,
                0.6593179340659129
              ],
              "variance": 0.327057191737087,
              "mean_reward": 0.6905365227955688,
              "min_reward": 0.43475861242360325,
              "max_reward": 0.8562999599306077,
              "num_responses": 6,
              "rvariance": 0.02100659820488991
            },
            {
              "id": "safety_sample_295",
              "rewards": [
                0.8261980482872402,
                0.45082548819622537,
                0.6078122013791537,
                0.8478883305802801,
                0.6488976321716036,
                0.6697513850011897,
                0.7673285395862985
              ],
              "variance": 0.28985664509847375,
              "mean_reward": 0.6883859464574273,
              "min_reward": 0.45082548819622537,
              "max_reward": 0.8478883305802801,
              "num_responses": 7,
              "rvariance": 0.016499827504649785
            },
            {
              "id": "safety_sample_47",
              "rewards": [
                0.6795051557474103,
                0.37793878875156567,
                0.751269177551372,
                0.7453940608181486,
                0.8057027633602193,
                0.5338184779139953,
                0.8188925037401993
              ],
              "variance": 0.3395120572631878,
              "mean_reward": 0.6732172754118443,
              "min_reward": 0.37793878875156567,
              "max_reward": 0.8188925037401993,
              "num_responses": 7,
              "rvariance": 0.022390887330281224
            },
            {
              "id": "safety_sample_375",
              "rewards": [
                -2.3013395406567945,
                -2.101509182060624,
                -1.640393604255216,
                -2.077601721002547,
                -1.8842444474312159,
                -1.4551110941275223,
                -1.8309106849775756
              ],
              "variance": 0.6151607252949536,
              "mean_reward": -1.8987300392159283,
              "min_reward": -2.3013395406567945,
              "max_reward": -1.4551110941275223,
              "num_responses": 7,
              "rvariance": 0.07193623560238382
            },
            {
              "id": "safety_sample_28",
              "rewards": [
                0.09140835010201331,
                -0.7054341769878969,
                -0.22008429053464898,
                -0.20803413370518237,
                -0.27038751211769335,
                -0.49903618550088363,
                -0.42131721350068174
              ],
              "variance": 0.49333824191338493,
              "mean_reward": -0.3189835946064248,
              "min_reward": -0.7054341769878969,
              "max_reward": 0.09140835010201331,
              "num_responses": 7,
              "rvariance": 0.05501559148596636
            },
            {
              "id": "safety_sample_347",
              "rewards": [
                -0.007475568697338001,
                0.025914229332702893,
                0.12934145485871618,
                0.00322148920209602,
                0.09592348031231644,
                0.00041573431756289857,
                -0.0696461128259205
              ],
              "variance": 0.14163445647964734,
              "mean_reward": 0.02538495807144799,
              "min_reward": -0.0696461128259205,
              "max_reward": 0.12934145485871618,
              "num_responses": 7,
              "rvariance": 0.003858330944984554
            },
            {
              "id": "safety_sample_10",
              "rewards": [
                0.39188741663881055,
                0.5129509498986338,
                0.5551293164534028,
                0.5595877805585843,
                0.6443402371867621,
                0.2499970547761441,
                0.514629644128813
              ],
              "variance": 0.25835749131611147,
              "mean_reward": 0.4897889142344501,
              "min_reward": 0.2499970547761441,
              "max_reward": 0.6443402371867621,
              "num_responses": 7,
              "rvariance": 0.01446653459718762
            },
            {
              "id": "safety_sample_365",
              "rewards": [
                1.36176850520888,
                0.9568290742129116,
                1.2016864451677303,
                1.2894891662279553,
                1.1025329710285459,
                1.1600331010344478,
                1.2785219268438803
              ],
              "variance": 0.274149489518033,
              "mean_reward": 1.1929801699606217,
              "min_reward": 0.9568290742129116,
              "max_reward": 1.36176850520888,
              "num_responses": 7,
              "rvariance": 0.01574717500619882
            },
            {
              "id": "safety_sample_387",
              "rewards": [
                -0.3805088517857606,
                -0.38138169764807683,
                -0.32856012164735954,
                -0.37040037000582243,
                -0.4331638732675567,
                -0.3796854713632743,
                -0.1820635255048297
              ],
              "variance": 0.1321330847055212,
              "mean_reward": -0.3508234158889543,
              "min_reward": -0.4331638732675567,
              "max_reward": -0.1820635255048297,
              "num_responses": 7,
              "rvariance": 0.0055409735516310015
            },
            {
              "id": "safety_sample_170",
              "rewards": [
                1.2642132656920502,
                1.1357383694126384,
                1.1633056468733256,
                1.2618558304900267,
                1.0614919965174623,
                1.3108090838670783,
                1.2497211441114835
              ],
              "variance": 0.17681177270749338,
              "mean_reward": 1.206733619566295,
              "min_reward": 1.0614919965174623,
              "max_reward": 1.3108090838670783,
              "num_responses": 7,
              "rvariance": 0.006720491544895714
            },
            {
              "id": "safety_sample_82",
              "rewards": [
                1.3460954745204736,
                1.0411466732719514,
                1.2935681865795043,
                1.52261696649499,
                1.28380627595078,
                1.269639436597956
              ],
              "variance": 0.2789631655727782,
              "mean_reward": 1.292812168902609,
              "min_reward": 1.0411466732719514,
              "max_reward": 1.52261696649499,
              "num_responses": 6,
              "rvariance": 0.01993392175635286
            },
            {
              "id": "safety_sample_286",
              "rewards": [
                -0.24468426775034577,
                -0.8741764458681399,
                -0.29212475527133136,
                -0.6070893688682115,
                -0.7530211823939484,
                -0.5981524040239934
              ],
              "variance": 0.5451943026202056,
              "mean_reward": -0.5615414040293284,
              "min_reward": -0.8741764458681399,
              "max_reward": -0.24468426775034577,
              "num_responses": 6,
              "rvariance": 0.05180065546143344
            },
            {
              "id": "safety_sample_290",
              "rewards": [
                0.7346800970088992,
                0.8617298877053614,
                0.5246000609785928,
                0.7756650315596691,
                0.8389206846404713,
                0.8425466892234508,
                0.7139052384251179
              ],
              "variance": 0.21203680116970725,
              "mean_reward": 0.7560068127916519,
              "min_reward": 0.5246000609785928,
              "max_reward": 0.8617298877053614,
              "num_responses": 7,
              "rvariance": 0.011672018663860622
            },
            {
              "id": "safety_sample_296",
              "rewards": [
                0.39618777917997844,
                0.781190446417639,
                0.6142449000638783,
                0.6064954188479836,
                0.7435801193094469,
                0.6465342485939043,
                0.6852212316994083
              ],
              "variance": 0.23625188717194212,
              "mean_reward": 0.6390648777303198,
              "min_reward": 0.39618777917997844,
              "max_reward": 0.781190446417639,
              "num_responses": 7,
              "rvariance": 0.013425057064762545
            },
            {
              "id": "safety_sample_183",
              "rewards": [
                0.46435710364135935,
                0.3720220333886119,
                0.487935212530442,
                0.7032751780201372,
                0.6298139907141609,
                0.5327236637172521,
                0.7381890125127876
              ],
              "variance": 0.289817636276937,
              "mean_reward": 0.5611880277892501,
              "min_reward": 0.3720220333886119,
              "max_reward": 0.7381890125127876,
              "num_responses": 7,
              "rvariance": 0.01536626084506986
            },
            {
              "id": "safety_sample_304",
              "rewards": [
                -1.0176512671673854,
                -0.8579655567896837,
                -0.6753598157160803,
                -0.7319676893706185,
                -0.8036324672225162,
                -0.5659616733012234,
                -0.6592115411184214
              ],
              "variance": 0.29992824694922215,
              "mean_reward": -0.7588214300979897,
              "min_reward": -1.0176512671673854,
              "max_reward": -0.5659616733012234,
              "num_responses": 7,
              "rvariance": 0.019090635957645926
            },
            {
              "id": "safety_sample_353",
              "rewards": [
                -0.3957053862752984,
                -0.3525383370687378,
                -0.08167873760076384,
                -0.10796492278433557,
                -0.1165982073966861,
                -0.09344337239779414,
                -0.07390890667860997
              ],
              "variance": 0.2912343515194597,
              "mean_reward": -0.17454826717174657,
              "min_reward": -0.3957053862752984,
              "max_reward": -0.07390890667860997,
              "num_responses": 7,
              "rvariance": 0.016244788835623015
            },
            {
              "id": "safety_sample_141",
              "rewards": [
                1.09535422080512,
                1.2253465790266576,
                1.385745468340642,
                1.087710244989369,
                1.2629431309490742,
                1.4792332711848704
              ],
              "variance": 0.34095713686551177,
              "mean_reward": 1.256055485882622,
              "min_reward": 1.087710244989369,
              "max_reward": 1.4792332711848704,
              "num_responses": 6,
              "rvariance": 0.02029721812435745
            },
            {
              "id": "safety_sample_156",
              "rewards": [
                -1.380111469028353,
                -1.4068528614873221,
                -1.101000533280893,
                -1.571395577140481,
                -1.3849928939513212,
                -1.2782082799649492,
                -1.2235452120839794
              ],
              "variance": 0.29814260718584085,
              "mean_reward": -1.3351581181338996,
              "min_reward": -1.571395577140481,
              "max_reward": -1.101000533280893,
              "num_responses": 7,
              "rvariance": 0.019426154472626123
            },
            {
              "id": "safety_sample_372",
              "rewards": [
                -0.21879317994060585,
                -0.5579701871170466,
                -0.2104316421749162,
                -0.29663800704721055,
                -0.2926482123307979,
                -0.5151512744237198,
                -0.23384444883469357
              ],
              "variance": 0.31683027466672053,
              "mean_reward": -0.33221099312414154,
              "min_reward": -0.5579701871170466,
              "max_reward": -0.2104316421749162,
              "num_responses": 7,
              "rvariance": 0.017804971265317795
            },
            {
              "id": "safety_sample_85",
              "rewards": [
                0.381177522770813,
                0.2769582240627122,
                0.23509919136001006,
                0.3384318690200192,
                0.4435371626314038,
                0.38648785688724363,
                0.4423913176328107
              ],
              "variance": 0.18263504465061658,
              "mean_reward": 0.357726163480716,
              "min_reward": 0.23509919136001006,
              "max_reward": 0.4435371626314038,
              "num_responses": 7,
              "rvariance": 0.005406003041580059
            },
            {
              "id": "safety_sample_98",
              "rewards": [
                -0.2916088119495605,
                -0.09314532746919835,
                -0.2570293387843683,
                0.03225081478940345,
                -0.06364075797263838,
                -0.2433668590743677,
                -0.29092881868810033
              ],
              "variance": 0.26591668712486277,
              "mean_reward": -0.17249558559269002,
              "min_reward": -0.2916088119495605,
              "max_reward": 0.03225081478940345,
              "num_responses": 7,
              "rvariance": 0.014350001379720232
            },
            {
              "id": "safety_sample_382",
              "rewards": [
                -0.6364862414577999,
                0.05457350333849747,
                0.03636959533625881,
                -0.005092461558187575,
                0.003168893038226174,
                0.1031955261121307,
                0.15380493250627456
              ],
              "variance": 0.38108926218782074,
              "mean_reward": -0.04149517895494281,
              "min_reward": -0.6364862414577999,
              "max_reward": 0.15380493250627456,
              "num_responses": 7,
              "rvariance": 0.061672007154535184
            },
            {
              "id": "safety_sample_148",
              "rewards": [
                1.3750809699712228,
                1.236080266397358,
                1.0921715267461862,
                1.1576287049718261,
                1.0552076941522277,
                1.2707276762742155,
                1.0802077779002202
              ],
              "variance": 0.24226124935199533,
              "mean_reward": 1.1810149452018937,
              "min_reward": 1.0552076941522277,
              "max_reward": 1.3750809699712228,
              "num_responses": 7,
              "rvariance": 0.011881686330805694
            },
            {
              "id": "safety_sample_37",
              "rewards": [
                0.9938736794870989,
                0.7853439780013369,
                0.9423200467225297,
                0.7102585710634752,
                0.7863069887160015,
                0.983541977083118
              ],
              "variance": 0.24090655375270242,
              "mean_reward": 0.86694087351226,
              "min_reward": 0.7102585710634752,
              "max_reward": 0.9938736794870989,
              "num_responses": 6,
              "rvariance": 0.012183165829243526
            },
            {
              "id": "safety_sample_271",
              "rewards": [
                0.4702685367734453,
                0.5131801188983524,
                0.5592797173130608,
                0.6828522128184373,
                0.4148490859644424
              ],
              "variance": 0.1964063483282431,
              "mean_reward": 0.5280859343535476,
              "min_reward": 0.4148490859644424,
              "max_reward": 0.6828522128184373,
              "num_responses": 5,
              "rvariance": 0.00826265433512283
            },
            {
              "id": "safety_sample_111",
              "rewards": [
                0.970693485623484,
                1.1500492220712966,
                1.1407271781701742,
                1.1871072894588552,
                0.8035325454557802,
                0.9476814116408102,
                1.0325666109682787
              ],
              "variance": 0.27485058385952177,
              "mean_reward": 1.03319396334124,
              "min_reward": 0.8035325454557802,
              "max_reward": 1.1871072894588552,
              "num_responses": 7,
              "rvariance": 0.016124474627189654
            },
            {
              "id": "safety_sample_209",
              "rewards": [
                0.6106677347759208,
                0.8150482876916407,
                0.6313345833803267,
                0.7738805188569423,
                0.4806268503317652,
                0.8629984570863174,
                0.8508052261682286
              ],
              "variance": 0.29703113753720556,
              "mean_reward": 0.717908808327306,
              "min_reward": 0.4806268503317652,
              "max_reward": 0.8629984570863174,
              "num_responses": 7,
              "rvariance": 0.01808283525065302
            },
            {
              "id": "safety_sample_7",
              "rewards": [
                0.16745989847857948,
                -0.011434056173351925,
                0.21893088012849604,
                0.3758684409439984,
                0.22655356702077595,
                0.20598721465805,
                0.28347263464487743
              ],
              "variance": 0.22452864054671892,
              "mean_reward": 0.20954836852877506,
              "min_reward": -0.011434056173351925,
              "max_reward": 0.3758684409439984,
              "num_responses": 7,
              "rvariance": 0.012017389294852732
            },
            {
              "id": "safety_sample_49",
              "rewards": [
                -1.547729181833474,
                -1.3421771119820343,
                -1.4842230708294823,
                -1.4586400462652658,
                -1.7272787100993545,
                -1.5923232150574083
              ],
              "variance": 0.25939238345473137,
              "mean_reward": -1.5253952226778364,
              "min_reward": -1.7272787100993545,
              "max_reward": -1.3421771119820343,
              "num_responses": 6,
              "rvariance": 0.014242563356939422
            },
            {
              "id": "safety_sample_358",
              "rewards": [
                0.9317037615033243,
                0.6025691778295804,
                0.6956218100322665,
                0.8280445493259566,
                0.8384567113377622,
                0.9366318342144866
              ],
              "variance": 0.285072303927982,
              "mean_reward": 0.8055046407072295,
              "min_reward": 0.6025691778295804,
              "max_reward": 0.9366318342144866,
              "num_responses": 6,
              "rvariance": 0.01466191399611424
            },
            {
              "id": "safety_sample_335",
              "rewards": [
                0.057238375641236364,
                -0.23854992706662093,
                -0.21820397767630198,
                0.02181548541970271,
                -0.030140758456394,
                -0.11484813265839776,
                0.10244540463217741
              ],
              "variance": 0.30166354467004236,
              "mean_reward": -0.06003479002351402,
              "min_reward": -0.23854992706662093,
              "max_reward": 0.10244540463217741,
              "num_responses": 7,
              "rvariance": 0.015376511194417292
            },
            {
              "id": "safety_sample_132",
              "rewards": [
                1.0659169618754172,
                0.9072534328967334,
                1.0037564360637623,
                1.1113822755996476,
                0.9738849457097293,
                1.1076532701957562,
                1.2299424819171894
              ],
              "variance": 0.21157401754213334,
              "mean_reward": 1.0571128291797478,
              "min_reward": 0.9072534328967334,
              "max_reward": 1.2299424819171894,
              "num_responses": 7,
              "rvariance": 0.009668390648319815
            },
            {
              "id": "safety_sample_38",
              "rewards": [
                0.5110308768449804,
                0.289345246798869,
                0.6034166648271737,
                0.653748375998981,
                0.5820554216307243,
                0.5189569308967238,
                0.3095459305937379
              ],
              "variance": 0.3220836922201063,
              "mean_reward": 0.49544277822731286,
              "min_reward": 0.289345246798869,
              "max_reward": 0.653748375998981,
              "num_responses": 7,
              "rvariance": 0.01743578672656068
            },
            {
              "id": "safety_sample_53",
              "rewards": [
                0.45510831868277,
                0.46511693036583623,
                0.44953249916775834,
                0.48980425478224543,
                0.4767319165537607,
                0.35749860456764654,
                0.3590088658444807
              ],
              "variance": 0.12355609051140753,
              "mean_reward": 0.4361144842806426,
              "min_reward": 0.35749860456764654,
              "max_reward": 0.48980425478224543,
              "num_responses": 7,
              "rvariance": 0.0025771501351683187
            },
            {
              "id": "safety_sample_219",
              "rewards": [
                0.37937046885499903,
                0.5977751001073247,
                0.5799475051346786,
                0.6254247156102606,
                0.6492861550249517
              ],
              "variance": 0.18014029589220437,
              "mean_reward": 0.5663607889464429,
              "min_reward": 0.37937046885499903,
              "max_reward": 0.6492861550249517,
              "num_responses": 5,
              "rvariance": 0.009300400276519308
            },
            {
              "id": "safety_sample_270",
              "rewards": [
                0.8887921793784174,
                0.7815579934199199,
                0.8140164010480989,
                0.8882671569569308,
                0.7047885700210111,
                0.6402753050933926,
                0.7472487017393686
              ],
              "variance": 0.20949390187556172,
              "mean_reward": 0.7807066153795913,
              "min_reward": 0.6402753050933926,
              "max_reward": 0.8887921793784174,
              "num_responses": 7,
              "rvariance": 0.007280851488589576
            },
            {
              "id": "safety_sample_112",
              "rewards": [
                1.1813912135068572,
                1.1240307137931338,
                1.1589927614359983,
                0.9916226889024311,
                0.8907739276956562,
                1.1025520684451893
              ],
              "variance": 0.2289936791723841,
              "mean_reward": 1.0748938956298777,
              "min_reward": 0.8907739276956562,
              "max_reward": 1.1813912135068572,
              "num_responses": 6,
              "rvariance": 0.010404659304916786
            },
            {
              "id": "safety_sample_362",
              "rewards": [
                -0.04507431212658256,
                -0.10969746546800065,
                -0.10892041976130445,
                -0.0822585476929481,
                -0.10145739979505802,
                -0.22057268348486897,
                -0.11521881038471858
              ],
              "variance": 0.08997550615837686,
              "mean_reward": -0.11188566267335447,
              "min_reward": -0.22057268348486897,
              "max_reward": -0.04507431212658256,
              "num_responses": 7,
              "rvariance": 0.00246969005852715
            },
            {
              "id": "safety_sample_258",
              "rewards": [
                0.9237589231073416,
                0.8814916439898403,
                1.0943345439853336,
                1.023425522916661,
                0.9601858365284622,
                1.1117520141087565,
                1.0948774115338473
              ],
              "variance": 0.19477524110346978,
              "mean_reward": 1.0128322708814632,
              "min_reward": 0.8814916439898403,
              "max_reward": 1.1117520141087565,
              "num_responses": 7,
              "rvariance": 0.007318203831523024
            },
            {
              "id": "safety_sample_78",
              "rewards": [
                0.813184567670705,
                0.6533917865308395,
                0.6181404599866909,
                0.8312397662810498,
                0.7885219759742108,
                0.9750336083599583,
                0.9368685169519009
              ],
              "variance": 0.31284329760194385,
              "mean_reward": 0.8023400973936222,
              "min_reward": 0.6181404599866909,
              "max_reward": 0.9750336083599583,
              "num_responses": 7,
              "rvariance": 0.015025683429343501
            },
            {
              "id": "safety_sample_12",
              "rewards": [
                -0.47015963924672194,
                -0.48735294952888997,
                -0.3873551191161523,
                -0.4348394367736961,
                -0.6318333593897424,
                -0.48391165766426286,
                -0.4047231237997452
              ],
              "variance": 0.1473691915469229,
              "mean_reward": -0.47145361221703014,
              "min_reward": -0.6318333593897424,
              "max_reward": -0.3873551191161523,
              "num_responses": 7,
              "rvariance": 0.005571063137456522
            },
            {
              "id": "safety_sample_173",
              "rewards": [
                1.3888242223614522,
                1.0864244566261936,
                1.259818981429686,
                1.0719110461221557,
                1.0413332644247277,
                1.054295714239413
              ],
              "variance": 0.276507112563499,
              "mean_reward": 1.1504346142006046,
              "min_reward": 1.0413332644247277,
              "max_reward": 1.3888242223614522,
              "num_responses": 6,
              "rvariance": 0.01670059811638783
            },
            {
              "id": "safety_sample_67",
              "rewards": [
                0.08167868593089968,
                -0.0016524219831764231,
                -0.13028510675419772,
                0.16574363555992175,
                -0.04316957962072455,
                -0.16536361733134544,
                -0.11542731660577404
              ],
              "variance": 0.25962117676756535,
              "mean_reward": -0.029782245829199534,
              "min_reward": -0.16536361733134544,
              "max_reward": 0.16574363555992175,
              "num_responses": 7,
              "rvariance": 0.012491804114044729
            },
            {
              "id": "safety_sample_154",
              "rewards": [
                0.8234151476881981,
                0.5899623782658245,
                0.720325414213683,
                1.008966273938513,
                0.8262425045686064,
                0.8142944093428396,
                0.7830867259685893
              ],
              "variance": 0.23115181248202954,
              "mean_reward": 0.7951846934266077,
              "min_reward": 0.5899623782658245,
              "max_reward": 1.008966273938513,
              "num_responses": 7,
              "rvariance": 0.013670823247165837
            },
            {
              "id": "safety_sample_17",
              "rewards": [
                0.6841405057608446,
                0.7534271856320557,
                0.5533044174105615,
                0.8032360658892044,
                0.39360274034025633
              ],
              "variance": 0.32582910261796655,
              "mean_reward": 0.6375421830065845,
              "min_reward": 0.39360274034025633,
              "max_reward": 0.8032360658892044,
              "num_responses": 5,
              "rvariance": 0.02193153063654087
            },
            {
              "id": "safety_sample_249",
              "rewards": [
                0.6449861055561877,
                0.8779304453944861,
                0.7772260105659493,
                0.7447372349145835,
                0.9437579882740428,
                0.7256560980363728
              ],
              "variance": 0.22552311503798417,
              "mean_reward": 0.7857156471236038,
              "min_reward": 0.6449861055561877,
              "max_reward": 0.9437579882740428,
              "num_responses": 6,
              "rvariance": 0.009774034686473549
            },
            {
              "id": "safety_sample_266",
              "rewards": [
                0.6093274718144517,
                0.3745479015439805,
                0.31662574993750403,
                0.5825312916847848,
                0.45631239514850475,
                0.47132484306449807,
                0.5834852232997337
              ],
              "variance": 0.24244308180423102,
              "mean_reward": 0.484879268070494,
              "min_reward": 0.31662574993750403,
              "max_reward": 0.6093274718144517,
              "num_responses": 7,
              "rvariance": 0.01088977900103642
            },
            {
              "id": "safety_sample_133",
              "rewards": [
                1.0114404851472236,
                0.8335646419530586,
                0.8946666699668329,
                1.142829459362948,
                1.1116724937181437,
                0.8874857282365788
              ],
              "variance": 0.26672579144572717,
              "mean_reward": 0.9802765797307975,
              "min_reward": 0.8335646419530586,
              "max_reward": 1.142829459362948,
              "num_responses": 6,
              "rvariance": 0.013687184224565649
            },
            {
              "id": "safety_sample_125",
              "rewards": [
                1.4013396047832436,
                1.1771187144096442,
                1.22342932362464,
                1.2784236221090284,
                1.1226350370161589,
                1.0631522194758063
              ],
              "variance": 0.24698798520015353,
              "mean_reward": 1.2110164202364202,
              "min_reward": 1.0631522194758063,
              "max_reward": 1.4013396047832436,
              "num_responses": 6,
              "rvariance": 0.011957478472947416
            },
            {
              "id": "safety_sample_182",
              "rewards": [
                1.2935359401218935,
                1.1015233125256874,
                1.3985958382347,
                1.3504878803484137,
                1.1908184497357193,
                1.4669282734185582,
                1.3282256147732892
              ],
              "variance": 0.27082841745653674,
              "mean_reward": 1.3043021870226088,
              "min_reward": 1.1015233125256874,
              "max_reward": 1.4669282734185582,
              "num_responses": 7,
              "rvariance": 0.013165389705980395
            },
            {
              "id": "safety_sample_117",
              "rewards": [
                1.2692023875219898,
                0.9796893080796517,
                1.1569139606735235,
                1.2369146043539838,
                1.2675913169310717,
                1.281754086342644
              ],
              "variance": 0.20717660255572934,
              "mean_reward": 1.1986776106504775,
              "min_reward": 0.9796893080796517,
              "max_reward": 1.281754086342644,
              "num_responses": 6,
              "rvariance": 0.011297781781544466
            },
            {
              "id": "safety_sample_242",
              "rewards": [
                0.9910735599058376,
                0.9553241351669453,
                1.094812918618626,
                0.9865618734919783,
                0.7508418337199295,
                0.894538623353602
              ],
              "variance": 0.220253010725466,
              "mean_reward": 0.9455254907094867,
              "min_reward": 0.7508418337199295,
              "max_reward": 1.094812918618626,
              "num_responses": 6,
              "rvariance": 0.011107124637651837
            },
            {
              "id": "safety_sample_70",
              "rewards": [
                0.40543468570414387,
                0.2152535316712626,
                0.5632253688205113,
                0.5653727324394594,
                0.4493722060969169,
                0.4149761933604612,
                0.6353606944956018
              ],
              "variance": 0.26400569317092504,
              "mean_reward": 0.4641422017983367,
              "min_reward": 0.2152535316712626,
              "max_reward": 0.6353606944956018,
              "num_responses": 7,
              "rvariance": 0.01677263689783678
            },
            {
              "id": "safety_sample_31",
              "rewards": [
                0.5454566314598148,
                0.2654540655057992,
                0.3970196125573724,
                0.4847500138922764,
                0.4465313871031372,
                0.5798150755077921,
                0.4650233217170441
              ],
              "variance": 0.2148066153422627,
              "mean_reward": 0.4548643011061766,
              "min_reward": 0.2654540655057992,
              "max_reward": 0.5798150755077921,
              "num_responses": 7,
              "rvariance": 0.009158244381464587
            },
            {
              "id": "safety_sample_59",
              "rewards": [
                1.2133546536643325,
                1.2232514984991754,
                1.2836882476544769,
                1.1417293229353371,
                1.0864288396398494,
                1.3263687823452412
              ],
              "variance": 0.1909494337122657,
              "mean_reward": 1.212470224123069,
              "min_reward": 1.0864288396398494,
              "max_reward": 1.3263687823452412,
              "num_responses": 6,
              "rvariance": 0.00650876870614922
            },
            {
              "id": "safety_sample_149",
              "rewards": [
                1.3624372278637964,
                1.072730043530986,
                1.1636046310191335,
                1.4955274375227872,
                1.2869811431996139,
                1.3404060097228145,
                1.2976168389078664
              ],
              "variance": 0.2884185157035182,
              "mean_reward": 1.2884719045381428,
              "min_reward": 1.072730043530986,
              "max_reward": 1.4955274375227872,
              "num_responses": 7,
              "rvariance": 0.016180321836636223
            },
            {
              "id": "safety_sample_309",
              "rewards": [
                -0.08450327682953619,
                -0.2100678520414831,
                -0.17843251176338637,
                -0.06693427966258353,
                -0.09122995050160478,
                -0.175949847599768,
                -0.13938925226214494
              ],
              "variance": 0.11361096991186995,
              "mean_reward": -0.13521528152292955,
              "min_reward": -0.2100678520414831,
              "max_reward": -0.06693427966258353,
              "num_responses": 7,
              "rvariance": 0.0026165821697460958
            }
          ]
        }
      },
      "overall_stats": {
        "mean_variance_across_files": 0.6199368963180693,
        "mean_rvariance_across_files": 0.12119394383068885,
        "total_processed_files": 4
      }
    }
  },
  "summary": {
    "model_comparison": {
      "URM-LLaMa-3.1-8B": {
        "mean_variance": 0.6199368963180693,
        "mean_rvariance": 0.12119394383068885
      }
    }
  }
}