template_id,split,question_idx,prediction,label
llm_goals_449,test,0,0.0709419050406782,0.1336325872199141
llm_goals_449,test,1,0.1619335130741301,0.2356014848705813
llm_goals_449,test,2,0.0671017058835019,0.3977331353545913
llm_goals_449,test,3,0.9488206770095235,0.9671817093217177
llm_goals_449,test,4,0.7474684017469194,0.7857460873195503
llm_goals_449,test,5,0.039570109108474,0.5164481763709956
llm_goals_449,test,6,0.039570109108474,0.0370459810848937
llm_goals_449,test,7,0.0709419050406782,0.2618660511464079
llm_goals_449,test,8,0.5980664896900705,0.9771937256062914
llm_goals_449,test,9,0.0746925918900774,0.0204302625650166
llm_goals_449,test,10,0.3735109435546767,0.0731782442371117
llm_goals_449,test,11,0.13433174397591,0.0091003072940505
llm_goals_449,test,12,0.1619335130741301,0.1108627498844831
llm_goals_449,test,13,0.0746925918900774,0.054840421346723
llm_goals_449,test,14,0.5155207738559613,0.8313263696124994
llm_goals_449,test,15,0.7633050025194208,0.8253071431638606
llm_goals_449,test,16,0.5155207738559613,0.831142754565476
llm_goals_449,test,17,0.7334189184998696,0.3065891414116863
llm_goals_449,test,18,0.5155207738559613,0.4235929706341914
llm_goals_449,test,19,0.5081340888474455,0.2342867705548718
llm_goals_449,test,20,0.7633050025194208,0.5687148418873526
llm_goals_449,test,21,0.0746925918900774,0.4888083146033534
llm_goals_449,test,22,0.0989927027736901,0.0069036151286541
llm_goals_449,test,23,0.8805568764512753,0.0739780745569788
llm_goals_449,test,24,0.9175134960157624,0.9314584192860104
llm_goals_449,test,25,0.1223603196974264,0.1420477852561596
llm_goals_449,test,26,0.3228734861091518,0.7006375316273405
llm_goals_449,test,27,0.1239571676185442,0.0612984362789981
llm_goals_449,test,28,0.1615405844665852,0.9549750406111494
llm_goals_449,test,29,0.6043090045417064,0.2943014776892277
llm_goals_449,test,30,0.0420183307768579,0.0576629803259434
llm_goals_449,test,31,0.039570109108474,0.2255338162735628
llm_goals_449,test,32,0.3734133270383069,0.0217578202648259
llm_goals_449,test,33,0.9643933518799314,0.5881005329750926
llm_goals_449,test,34,0.0420183307768579,0.0656003360881953
llm_goals_449,test,35,0.2718782339144924,0.1899455989825758
llm_goals_449,test,36,0.0420183307768579,0.1356723510839239
llm_goals_449,test,37,0.5568350936477791,0.1724577552330986
llm_goals_449,test,38,0.9735765761950989,0.097576330461044
llm_goals_449,test,39,0.1221029646037177,0.0831443503045603
llm_goals_449,test,40,0.0141023713770453,0.0085659129540734
llm_goals_449,test,41,0.0746925918900774,0.0438119169092525
llm_goals_449,test,42,0.0794392016007004,0.4942733211865646
llm_goals_449,test,43,0.039570109108474,0.1247723307463423
llm_goals_449,test,44,0.7633050025194208,0.8400723355781036
llm_goals_449,test,45,0.9875265205127608,0.925208223971735
llm_goals_449,test,46,0.588011315723828,0.0740922882863047
llm_goals_449,test,47,0.9158646559071312,0.9373555404045412
llm_goals_449,test,48,0.073875751738136,0.3920310752556691
llm_goals_449,test,49,0.1619335130741301,0.0277662962683335
llm_goals_75,test,0,0.9103229346257946,0.8642124165137652
llm_goals_75,test,1,0.9679259185374958,0.910359703136258
llm_goals_75,test,2,0.9266010855857304,0.8128286324258283
llm_goals_75,test,3,0.9017204248594564,0.1661489886313124
llm_goals_75,test,4,0.0751215061790111,0.1236451678860016
llm_goals_75,test,5,0.961386183458567,0.6739037233559247
llm_goals_75,test,6,0.8932439033574047,0.1134434733777058
llm_goals_75,test,7,0.8844782056354616,0.6946055843235053
llm_goals_75,test,8,0.0751215061790111,0.1004496505890182
llm_goals_75,test,9,0.8275351203945236,0.1540130266900075
llm_goals_75,test,10,0.2998126101642177,0.3569515830662073
llm_goals_75,test,11,0.9212924366819822,0.4576154291835114
llm_goals_75,test,12,0.9646449569693856,0.1367346048355968
llm_goals_75,test,13,0.0442614142373688,0.0646890805500496
llm_goals_75,test,14,0.917606455440905,0.1675122689898172
llm_goals_75,test,15,0.6581725752768258,0.069582458224139
llm_goals_75,test,16,0.0572231707129205,0.2354277864496811
llm_goals_75,test,17,0.8495712447120932,0.9447837743973488
llm_goals_75,test,18,0.7797369080061485,0.0781001795812696
llm_goals_75,test,19,0.8338227723543179,0.4868721494751054
llm_goals_75,test,20,0.0751215061790111,0.1033036348939128
llm_goals_75,test,21,0.9017204248594564,0.1276999559430948
llm_goals_75,test,22,0.7243806698779564,0.8431325364742722
llm_goals_75,test,23,0.9444284716561824,0.7460283918906632
llm_goals_75,test,24,0.8922167250816467,0.192573320599938
llm_goals_75,test,25,0.2998126101642177,0.3801085776614793
llm_goals_75,test,26,0.0572231707129205,0.1267870145951939
llm_goals_75,test,27,0.9355080792876184,0.9607504432606712
llm_goals_75,test,28,0.6552419805408431,0.0423146645658729
llm_goals_75,test,29,0.9035463964418424,0.4777054812224888
llm_goals_75,test,30,0.1330396689126687,0.4822637810175876
llm_goals_75,test,31,0.0385065312397458,0.0805248550261055
llm_goals_75,test,32,0.8092890496680294,0.6890841093919252
llm_goals_75,test,33,0.2001129865013068,0.1145962248845397
llm_goals_75,test,34,0.2998126101642177,0.2921261463182895
llm_goals_75,test,35,0.9103229346257946,0.6530562837025381
llm_goals_75,test,36,0.2998126101642177,0.1183304077208745
llm_goals_75,test,37,0.981815752238907,0.868052766582826
llm_goals_75,test,38,0.7751191880297357,0.6535917953521371
llm_goals_75,test,39,0.8847889063051668,0.0644053193022136
llm_goals_75,test,40,0.7797369080061485,0.6019618834627347
llm_goals_75,test,41,0.7243806698779564,0.230389069862908
llm_goals_75,test,42,0.8963859047065235,0.7894553184375537
llm_goals_75,test,43,0.6450552234595432,0.2977582471382819
llm_goals_75,test,44,0.9319704901022596,0.2211815525008748
llm_goals_75,test,45,0.8415861589718261,0.0745441466493943
llm_goals_75,test,46,0.0989406303571733,0.7127955514788996
llm_goals_75,test,47,0.3001812287579745,0.0161223980025345
llm_goals_75,test,48,0.7797369080061485,0.1382513395050604
llm_goals_75,test,49,0.961386183458567,0.9815106661613362
llm_goals_305,test,0,0.1173653021320184,0.2062097726301097
llm_goals_305,test,1,0.2102059114429175,0.7603213407742078
llm_goals_305,test,2,0.1896247716253509,0.0406395612652842
llm_goals_305,test,3,0.7631245744429269,0.4422001539134155
llm_goals_305,test,4,0.1513247999265971,0.2689791708049951
llm_goals_305,test,5,0.0747358851031551,0.1412581238797707
llm_goals_305,test,6,0.0691963519045397,0.0992911357773575
llm_goals_305,test,7,0.1896247716253509,0.1984947738037692
llm_goals_305,test,8,0.2147961892592141,0.1577864619647619
llm_goals_305,test,9,0.1173653021320184,0.0621641107275182
llm_goals_305,test,10,0.9027346931898252,0.9879174023450592
llm_goals_305,test,11,0.280729650840792,0.5269669419962362
llm_goals_305,test,12,0.0586973799656297,0.2105593475656798
llm_goals_305,test,13,0.1759957614798339,0.2072161629845012
llm_goals_305,test,14,0.763315377311124,0.6545892217736428
llm_goals_305,test,15,0.2147961892592141,0.5104040428268571
llm_goals_305,test,16,0.5109898386795877,0.5524398163622298
llm_goals_305,test,17,0.3309544973113312,0.8665614751565875
llm_goals_305,test,18,0.3985168225753824,0.3175479682579358
llm_goals_305,test,19,0.7266758032873198,0.3701558259397783
llm_goals_305,test,20,0.0923041614406128,0.0528314061272507
llm_goals_305,test,21,0.3372607298969772,0.3148726989644924
llm_goals_305,test,22,0.1173653021320184,0.447303668549321
llm_goals_305,test,23,0.3364153293102218,0.1744797562558885
llm_goals_305,test,24,0.7495774070368321,0.8158235756439657
llm_goals_305,test,25,0.9027346931898252,0.9578316364476024
llm_goals_305,test,26,0.7495774070368321,0.5595920193399587
llm_goals_305,test,27,0.0271082455628235,0.5967193097172223
llm_goals_305,test,28,0.5510475728332331,0.9037929343333102
llm_goals_305,test,29,0.1325883576355438,0.278165145436113
llm_goals_305,test,30,0.0147056213023361,0.9532629887346658
llm_goals_305,test,31,0.3372607298969772,0.5121334481158791
llm_goals_305,test,32,0.2102059114429175,0.1605879890433021
llm_goals_305,test,33,0.3309544973113312,0.6222808213139804
llm_goals_305,test,34,0.9027346931898252,0.9709568242405192
llm_goals_305,test,35,0.1896247716253509,0.5513220475450542
llm_goals_305,test,36,0.9083626173635054,0.9876292784574268
llm_goals_305,test,37,0.7266758032873198,0.258566594074644
llm_goals_305,test,38,0.887345470451353,0.3940893870837836
llm_goals_305,test,39,0.261247679488323,0.6249683049434822
llm_goals_305,test,40,0.2772186334244859,0.036012250509986
llm_goals_305,test,41,0.0251284289052585,0.0238784684017155
llm_goals_305,test,42,0.015793951736561,0.1015334102504109
llm_goals_305,test,43,0.4718945287424333,0.0682627831684364
llm_goals_305,test,44,0.2147961892592141,0.0901285910304827
llm_goals_305,test,45,0.8469651440405966,0.8520020311890948
llm_goals_305,test,46,0.3505890920518906,0.512946133742762
llm_goals_305,test,47,0.2055821944442399,0.9460715758270588
llm_goals_305,test,48,0.7495774070368321,0.2634284981215168
llm_goals_305,test,49,0.2102059114429175,0.5226278491298435
llm_goals_263,test,0,0.9594930498231914,0.9722113849684072
llm_goals_263,test,1,0.3875621031969178,0.4308884142088059
llm_goals_263,test,2,0.1088305297021957,0.9112282637417588
llm_goals_263,test,3,0.1336864327516324,0.4678322072304764
llm_goals_263,test,4,0.6907479061589563,0.0681171790473069
llm_goals_263,test,5,0.548826940335909,0.3304750158657515
llm_goals_263,test,6,0.0248785940993689,0.1049596434028026
llm_goals_263,test,7,0.3754495992357841,0.868290478100796
llm_goals_263,test,8,0.0082239137496206,0.0107688258732955
llm_goals_263,test,9,0.7893808851589301,0.5335894362422906
llm_goals_263,test,10,0.9271837164297608,0.4571801332195204
llm_goals_263,test,11,0.3643416848091783,0.4017475232284387
llm_goals_263,test,12,0.0214694160174864,0.7410716651377723
llm_goals_263,test,13,0.4175659290365474,0.2222869461895513
llm_goals_263,test,14,0.1366321993426032,0.0236037417776026
llm_goals_263,test,15,0.4175659290365474,0.0998823008982278
llm_goals_263,test,16,0.2378839093738415,0.0090037236123257
llm_goals_263,test,17,0.0678695590283205,0.3371875979935536
llm_goals_263,test,18,0.1366321993426032,0.2095794100566156
llm_goals_263,test,19,0.1510315832367025,0.1483621477954244
llm_goals_263,test,20,0.0082239137496206,0.2829259876769517
llm_goals_263,test,21,0.0248785940993689,0.1128506991103582
llm_goals_263,test,22,0.7893808851589301,0.8918927085227047
llm_goals_263,test,23,0.293049384708822,0.1960590879366542
llm_goals_263,test,24,0.4348038410452636,0.0409316032122589
llm_goals_263,test,25,0.2226265308176087,0.1971178454456452
llm_goals_263,test,26,0.4717797495064882,0.290576284754869
llm_goals_263,test,27,0.4009981634773483,0.3914767323316075
llm_goals_263,test,28,0.2956045582386387,0.3629055172172753
llm_goals_263,test,29,0.0895774141696241,0.0312142081028261
llm_goals_263,test,30,0.8265092430187212,0.1928083275379132
llm_goals_263,test,31,0.0248785940993689,0.318621097342132
llm_goals_263,test,32,0.3791091232958771,0.1747653444762649
llm_goals_263,test,33,0.4686688762105362,0.0531218265570888
llm_goals_263,test,34,0.1674551433492084,0.1598154925951403
llm_goals_263,test,35,0.4175659290365474,0.94307484220015
llm_goals_263,test,36,0.1771447032062837,0.5041818847108344
llm_goals_263,test,37,0.1933949033709068,0.1111175217519077
llm_goals_263,test,38,0.0895774141696241,0.1867701836992809
llm_goals_263,test,39,0.4175659290365474,0.9513736387795227
llm_goals_263,test,40,0.4717797495064882,0.726601907835183
llm_goals_263,test,41,0.6581133491156186,0.2793940710071973
llm_goals_263,test,42,0.5484358801159307,0.7591325538288878
llm_goals_263,test,43,0.0678695590283205,0.0599255853483329
llm_goals_263,test,44,0.3328667942518803,0.0248060297565235
llm_goals_263,test,45,0.2208789358691529,0.4429293016127257
llm_goals_263,test,46,0.3695976859064504,0.3978895760863248
llm_goals_263,test,47,0.3103774149698418,0.9291514786865128
llm_goals_263,test,48,0.6581133491156186,0.2313178866490127
llm_goals_263,test,49,0.8568856654180469,0.3779293731936072
llm_goals_157,test,0,0.8371557433947188,0.7943095194508789
llm_goals_157,test,1,0.0336900755244193,0.0516624712053447
llm_goals_157,test,2,0.5969926233450199,0.8020233336204885
llm_goals_157,test,3,0.0388840696837866,0.5904722684734964
llm_goals_157,test,4,0.8054334230931457,0.9619353001797089
llm_goals_157,test,5,0.7150935615058345,0.6767415952202784
llm_goals_157,test,6,0.2424313561403037,0.7612977247981438
llm_goals_157,test,7,0.5969926233450199,0.6294506387377161
llm_goals_157,test,8,0.8054334230931457,0.8937361945430545
llm_goals_157,test,9,0.1753109589945453,0.9788153257749777
llm_goals_157,test,10,0.7187574459658809,0.8824125505492224
llm_goals_157,test,11,0.0255359509444069,0.199986733795525
llm_goals_157,test,12,0.8536639291851708,0.9284577144290443
llm_goals_157,test,13,0.977736348913886,0.9240516415338534
llm_goals_157,test,14,0.2321044598385402,0.2475658313194042
llm_goals_157,test,15,0.9706541812762836,0.976340679507306
llm_goals_157,test,16,0.0225960295261658,0.3126950781624377
llm_goals_157,test,17,0.0341549743160244,0.046177739393252
llm_goals_157,test,18,0.6413523430873771,0.4250899393616417
llm_goals_157,test,19,0.6550882275333912,0.6637557888114428
llm_goals_157,test,20,0.8054334230931457,0.9747431080575436
llm_goals_157,test,21,0.7150935615058345,0.566102644985123
llm_goals_157,test,22,0.0289859909616508,0.4645121573786108
llm_goals_157,test,23,0.0163418656639607,0.1429816093888423
llm_goals_157,test,24,0.1741231539841163,0.0397822616409018
llm_goals_157,test,25,0.3471591973106736,0.2832629442692311
llm_goals_157,test,26,0.1879039767426245,0.3005834296865567
llm_goals_157,test,27,0.3433644240079982,0.049069242775247
llm_goals_157,test,28,0.7601972530379655,0.2908678434467844
llm_goals_157,test,29,0.3433644240079982,0.1061660413895585
llm_goals_157,test,30,0.3471591973106736,0.5164500368467446
llm_goals_157,test,31,0.6221326038396446,0.9364517603204892
llm_goals_157,test,32,0.3983248762240459,0.0583368009018155
llm_goals_157,test,33,0.0225960295261658,0.102471328139649
llm_goals_157,test,34,0.8239039936941527,0.7754930766823708
llm_goals_157,test,35,0.9543082930796178,0.930098280704675
llm_goals_157,test,36,0.7187574459658809,0.8978537108401503
llm_goals_157,test,37,0.0152142017147236,0.185447729939923
llm_goals_157,test,38,0.6413523430873771,0.4989516423125952
llm_goals_157,test,39,0.938811907353553,0.8172337053734404
llm_goals_157,test,40,0.0289859909616508,0.3208967259617554
llm_goals_157,test,41,0.1231472113484556,0.9628746978064082
llm_goals_157,test,42,0.5969926233450199,0.9537549409903032
llm_goals_157,test,43,0.7150935615058345,0.9854372229811326
llm_goals_157,test,44,0.8054334230931457,0.9446223273489608
llm_goals_157,test,45,0.8233413435239318,0.917287033427004
llm_goals_157,test,46,0.6126619919877532,0.2958138118998824
llm_goals_157,test,47,0.7484148517205657,0.7644578181201236
llm_goals_157,test,48,0.1879039767426245,0.2919786437406029
llm_goals_157,test,49,0.5509008169248885,0.2435548949640933
llm_goals_358,test,0,0.8722666509854878,0.9710288332808288
llm_goals_358,test,1,0.9030788897147458,0.1090780967183576
llm_goals_358,test,2,0.9171645313495131,0.8957724929016077
llm_goals_358,test,3,0.2444353000057121,0.0314742636417454
llm_goals_358,test,4,0.837758281920007,0.9345866127648594
llm_goals_358,test,5,0.2963511569922055,0.3075908794558576
llm_goals_358,test,6,0.0853093080681576,0.1938894394639401
llm_goals_358,test,7,0.9171645313495131,0.9366675383938772
llm_goals_358,test,8,0.9753502976047737,0.9600018984290702
llm_goals_358,test,9,0.2125217163227303,0.0356972898371527
llm_goals_358,test,10,0.3046122784109649,0.7396882546703099
llm_goals_358,test,11,0.1268051972976895,0.0409023187764638
llm_goals_358,test,12,0.035541009048691,0.0976624021485058
llm_goals_358,test,13,0.0625935420378402,0.1216232236474993
llm_goals_358,test,14,0.7330212569577729,0.7864359180640846
llm_goals_358,test,15,0.9413167193138908,0.8556484582282166
llm_goals_358,test,16,0.936306577752406,0.7341230488107452
llm_goals_358,test,17,0.791742970892711,0.2726809060238253
llm_goals_358,test,18,0.0755278451431677,0.7566054280756713
llm_goals_358,test,19,0.6876182544777331,0.0434563732454263
llm_goals_358,test,20,0.8740166909749276,0.8243328886415383
llm_goals_358,test,21,0.0625935420378402,0.1112076480131408
llm_goals_358,test,22,0.0755278451431677,0.0845862458189736
llm_goals_358,test,23,0.7658007745053227,0.0375312043866978
llm_goals_358,test,24,0.7330212569577729,0.8172477900339192
llm_goals_358,test,25,0.6832605911411632,0.9764694049382328
llm_goals_358,test,26,0.7075640638718501,0.7040948478982805
llm_goals_358,test,27,0.2260192806051778,0.125707811898555
llm_goals_358,test,28,0.2444353000057121,0.1566378003751444
llm_goals_358,test,29,0.8607538989221549,0.1707030695577025
llm_goals_358,test,30,0.9422944886075704,0.7917262984233946
llm_goals_358,test,31,0.0625935420378402,0.0448402492326266
llm_goals_358,test,32,0.8809302017198033,0.0880149966006802
llm_goals_358,test,33,0.936306577752406,0.9036261072893176
llm_goals_358,test,34,0.119932767683189,0.6926631691100236
llm_goals_358,test,35,0.9171645313495131,0.772573980123232
llm_goals_358,test,36,0.0978612929306139,0.443962006250219
llm_goals_358,test,37,0.9467956485443186,0.5987374702917627
llm_goals_358,test,38,0.0727948594919855,0.0973650244988885
llm_goals_358,test,39,0.035541009048691,0.0374517082121219
llm_goals_358,test,40,0.0755278451431677,0.0459188553104236
llm_goals_358,test,41,0.0571003265822452,0.067381376462992
llm_goals_358,test,42,0.6735133295377659,0.9322344143419644
llm_goals_358,test,43,0.0625935420378402,0.0773258781385884
llm_goals_358,test,44,0.3198831347823997,0.9867304662942348
llm_goals_358,test,45,0.3198831347823997,0.0921047575496883
llm_goals_358,test,46,0.2171530278902441,0.0203810451816961
llm_goals_358,test,47,0.0480583261869559,0.0161558697095388
llm_goals_358,test,48,0.7330212569577729,0.7751475880899051
llm_goals_358,test,49,0.2260192806051778,0.4160470958249456
llm_goals_78,test,0,0.1348733469503043,0.2251708162334548
llm_goals_78,test,1,0.3127966417879114,0.0367340336052023
llm_goals_78,test,2,0.2120211457251434,0.0527379912395899
llm_goals_78,test,3,0.1626577842713076,0.0259505842905422
llm_goals_78,test,4,0.2739711160438865,0.0939178372549231
llm_goals_78,test,5,0.1381413249829573,0.6658069720444946
llm_goals_78,test,6,0.1720623669557213,0.0424593855688115
llm_goals_78,test,7,0.136204110235674,0.3068789421692927
llm_goals_78,test,8,0.2739711160438865,0.0254129292421898
llm_goals_78,test,9,0.0650963040180886,0.0407835069490974
llm_goals_78,test,10,0.9400504643797348,0.9375706694734316
llm_goals_78,test,11,0.959618688019492,0.7386383432572439
llm_goals_78,test,12,0.5602040927290391,0.3108688169890243
llm_goals_78,test,13,0.3355971707416643,0.0946944663222736
llm_goals_78,test,14,0.1279134972036333,0.1717796546359565
llm_goals_78,test,15,0.2739711160438865,0.1277153625141483
llm_goals_78,test,16,0.0762588248301841,0.0689165589110325
llm_goals_78,test,17,0.8503918552770308,0.0883911059243408
llm_goals_78,test,18,0.1175723917717473,0.0337617130750813
llm_goals_78,test,19,0.8294889804985837,0.7169547264343438
llm_goals_78,test,20,0.2753289028288226,0.1528222000997753
llm_goals_78,test,21,0.3355971707416643,0.0350685532944032
llm_goals_78,test,22,0.9119278534473942,0.0940461009061424
llm_goals_78,test,23,0.9815792758974532,0.9060885414573472
llm_goals_78,test,24,0.1128846067005182,0.0217941677583094
llm_goals_78,test,25,0.9400504643797348,0.9667879364041514
llm_goals_78,test,26,0.0762588248301841,0.0797221269088608
llm_goals_78,test,27,0.95309889520794,0.0603014558146647
llm_goals_78,test,28,0.0680819498474285,0.019185604671188
llm_goals_78,test,29,0.7398471723257246,0.181847707574815
llm_goals_78,test,30,0.9557894472246976,0.9576328540155246
llm_goals_78,test,31,0.1381413249829573,0.1600616173680257
llm_goals_78,test,32,0.959618688019492,0.8196381975442921
llm_goals_78,test,33,0.1175723917717473,0.0444875750236097
llm_goals_78,test,34,0.9236282775883368,0.9277514916547148
llm_goals_78,test,35,0.1348733469503043,0.1986446962511548
llm_goals_78,test,36,0.9236282775883368,0.9359311183925404
llm_goals_78,test,37,0.7635518421268939,0.8760354323987716
llm_goals_78,test,38,0.563561845199206,0.4610991071324792
llm_goals_78,test,39,0.4315754500000708,0.2972845381897555
llm_goals_78,test,40,0.8889531838698135,0.7716125042657197
llm_goals_78,test,41,0.1358434545113775,0.1328309068036672
llm_goals_78,test,42,0.2120211457251434,0.3354286767519867
llm_goals_78,test,43,0.1381413249829573,0.086342843675339
llm_goals_78,test,44,0.2042341898232444,0.0958279087075554
llm_goals_78,test,45,0.2649095563501317,0.1302156649936615
llm_goals_78,test,46,0.973914336757064,0.8983792614483327
llm_goals_78,test,47,0.103739204998502,0.1775307323333411
llm_goals_78,test,48,0.0762588248301841,0.0658487938814022
llm_goals_78,test,49,0.1639032575008981,0.079644576255816
llm_goals_420,test,0,0.1027703698392232,0.7165124795044365
llm_goals_420,test,1,0.0296877815248364,0.7608911842606508
llm_goals_420,test,2,0.9272085353227922,0.799936385630717
llm_goals_420,test,3,0.0191873930013649,0.2211062209422303
llm_goals_420,test,4,0.7068668472005154,0.2926466150380465
llm_goals_420,test,5,0.9739656414533578,0.9140651066289046
llm_goals_420,test,6,0.0326213321002556,0.4131756456187543
llm_goals_420,test,7,0.947921390998665,0.6643261466520904
llm_goals_420,test,8,0.8056008428862758,0.3578404079978603
llm_goals_420,test,9,0.9746221247167955,0.8413468212597344
llm_goals_420,test,10,0.1627859465535909,0.4981438990065536
llm_goals_420,test,11,0.8456218714221574,0.2468097596316683
llm_goals_420,test,12,0.174069759876894,0.1549754451331909
llm_goals_420,test,13,0.8386638511407195,0.8951478256933764
llm_goals_420,test,14,0.0460155271833315,0.0722168451540495
llm_goals_420,test,15,0.1209866882558583,0.7175548720080566
llm_goals_420,test,16,0.0422076538064917,0.0482770035552138
llm_goals_420,test,17,0.8795757926907944,0.9171404716362525
llm_goals_420,test,18,0.6701610414860973,0.2149325509708838
llm_goals_420,test,19,0.0516455740541564,0.9314370105190324
llm_goals_420,test,20,0.8248393203151128,0.6958358689335516
llm_goals_420,test,21,0.9739656414533578,0.6712961637420737
llm_goals_420,test,22,0.9746221247167955,0.9091188630862124
llm_goals_420,test,23,0.9632136271919428,0.080457132763502
llm_goals_420,test,24,0.0460155271833315,0.0910185464003223
llm_goals_420,test,25,0.9410940100056328,0.0266374948315803
llm_goals_420,test,26,0.0296877815248364,0.3477530565713536
llm_goals_420,test,27,0.0155047079485942,0.8201931514993901
llm_goals_420,test,28,0.9810942292243068,0.2425383031071764
llm_goals_420,test,29,0.9410940100056328,0.4181605367795475
llm_goals_420,test,30,0.0762130117851734,0.0299293846265948
llm_goals_420,test,31,0.0487080486946026,0.940670822547668
llm_goals_420,test,32,0.9680566638538792,0.0196824789824236
llm_goals_420,test,33,0.0460155271833315,0.1078959069076236
llm_goals_420,test,34,0.1361013640868144,0.2191371931392249
llm_goals_420,test,35,0.5308713635177714,0.9034152914594604
llm_goals_420,test,36,0.1250639758602871,0.548380428606202
llm_goals_420,test,37,0.5852546105422443,0.50388122703708
llm_goals_420,test,38,0.0296877815248364,0.4294891851736946
llm_goals_420,test,39,0.1209866882558583,0.4382416051683284
llm_goals_420,test,40,0.0715399682229241,0.141879820547579
llm_goals_420,test,41,0.0182261433015779,0.6151086701978562
llm_goals_420,test,42,0.0516455740541564,0.7490416767979864
llm_goals_420,test,43,0.9777976629352274,0.6273048386641107
llm_goals_420,test,44,0.6760094091282541,0.8162625944607043
llm_goals_420,test,45,0.02964392451172,0.3347655055973148
llm_goals_420,test,46,0.0912296409282047,0.2248938224655197
llm_goals_420,test,47,0.0296877815248364,0.7293239346358632
llm_goals_420,test,48,0.969159791272908,0.1530180333157787
llm_goals_420,test,49,0.7908942744817576,0.9588707841469084
llm_goals_53,test,0,0.7448861349519237,0.976097291167194
llm_goals_53,test,1,0.9665936595222716,0.2598265618814769
llm_goals_53,test,2,0.9679014771134362,0.9770793290161108
llm_goals_53,test,3,0.9665936595222716,0.4768547215758607
llm_goals_53,test,4,0.9665936595222716,0.2361872878274303
llm_goals_53,test,5,0.0656667940920021,0.0986317022184206
llm_goals_53,test,6,0.1278218108642054,0.0477100161960414
llm_goals_53,test,7,0.9872176205673084,0.937994454790112
llm_goals_53,test,8,0.9760934870365888,0.2701156822033339
llm_goals_53,test,9,0.1278218108642054,0.2989108711032385
llm_goals_53,test,10,0.4744826290633033,0.5544564065686126
llm_goals_53,test,11,0.10188773581826,0.3953618346843373
llm_goals_53,test,12,0.1431362250303733,0.1335346211746911
llm_goals_53,test,13,0.5288125403215103,0.0585116233918817
llm_goals_53,test,14,0.8158606210311431,0.1376328700771095
llm_goals_53,test,15,0.0638494318486866,0.4350138720043813
llm_goals_53,test,16,0.9706629155446485,0.0717024446401859
llm_goals_53,test,17,0.9894967462442044,0.6563471973646152
llm_goals_53,test,18,0.9887343587218084,0.2165785858914521
llm_goals_53,test,19,0.9760934870365888,0.3746358016952676
llm_goals_53,test,20,0.9894967462442044,0.5337460360023749
llm_goals_53,test,21,0.3765335607937951,0.0467709874601332
llm_goals_53,test,22,0.9962048591447612,0.7796763173252493
llm_goals_53,test,23,0.2171471779638178,0.3205915991497378
llm_goals_53,test,24,0.149669309523959,0.0640075835802484
llm_goals_53,test,25,0.149669309523959,0.833565084619613
llm_goals_53,test,26,0.0754981603691567,0.0854875283183964
llm_goals_53,test,27,0.2163091299336187,0.9078949534688217
llm_goals_53,test,28,0.9872176205673084,0.3980814368097108
llm_goals_53,test,29,0.149669309523959,0.0495337152571608
llm_goals_53,test,30,0.569882295986771,0.49697645864992
llm_goals_53,test,31,0.3765335607937951,0.4685591079414317
llm_goals_53,test,32,0.9872176205673084,0.0870796105685882
llm_goals_53,test,33,0.9773273247404586,0.0188204043218978
llm_goals_53,test,34,0.9805969583675788,0.5566033569957117
llm_goals_53,test,35,0.9917541681894212,0.9313365617424948
llm_goals_53,test,36,0.8158606210311431,0.9304982364910718
llm_goals_53,test,37,0.4744826290633033,0.1916887084340081
llm_goals_53,test,38,0.0638494318486866,0.0179322256288976
llm_goals_53,test,39,0.6379205068085301,0.042191597199028
llm_goals_53,test,40,0.0954293213091898,0.4480237505797492
llm_goals_53,test,41,0.7537526258692056,0.199711476764323
llm_goals_53,test,42,0.1257689808988572,0.984673662230153
llm_goals_53,test,43,0.0692929605445084,0.1015360353200591
llm_goals_53,test,44,0.8052595774943403,0.2398468184361071
llm_goals_53,test,45,0.8055542369384947,0.5147270663759912
llm_goals_53,test,46,0.35875831435166,0.6026394622908158
llm_goals_53,test,47,0.0638494318486866,0.7105197565308571
llm_goals_53,test,48,0.9872176205673084,0.1056143884471251
llm_goals_53,test,49,0.0656667940920021,0.2875693652635701
llm_goals_427,test,0,0.8891137012533223,0.9912377865392056
llm_goals_427,test,1,0.6321043688939182,0.1393504988400085
llm_goals_427,test,2,0.993959144684545,0.9826717605764466
llm_goals_427,test,3,0.9856286099866526,0.9914966630190112
llm_goals_427,test,4,0.419065256318945,0.0287440390481499
llm_goals_427,test,5,0.7840991372215356,0.1508234315553654
llm_goals_427,test,6,0.0888501448158868,0.0241177394276523
llm_goals_427,test,7,0.3805337688434007,0.9533421090109172
llm_goals_427,test,8,0.2178235140501479,0.1357554081265164
llm_goals_427,test,9,0.8803341660953263,0.0422408742214398
llm_goals_427,test,10,0.6321043688939182,0.3560677064830195
llm_goals_427,test,11,0.9904849525535764,0.2848587352361455
llm_goals_427,test,12,0.7134891581773088,0.0783011900572995
llm_goals_427,test,13,0.5127133293824118,0.053588048642731
llm_goals_427,test,14,0.9503446994493456,0.1755007793342038
llm_goals_427,test,15,0.6167416871053722,0.03905897487628
llm_goals_427,test,16,0.2623413832015914,0.0861236052612804
llm_goals_427,test,17,0.6321043688939182,0.2907015821684348
llm_goals_427,test,18,0.6321043688939182,0.0468453325440364
llm_goals_427,test,19,0.7859926096238357,0.7510010963524218
llm_goals_427,test,20,0.419065256318945,0.0467429391605962
llm_goals_427,test,21,0.8803341660953263,0.1304366461429133
llm_goals_427,test,22,0.6321043688939182,0.1246622694694481
llm_goals_427,test,23,0.7279095038254075,0.5644455097827197
llm_goals_427,test,24,0.2081818556883427,0.0414160339225927
llm_goals_427,test,25,0.8891137012533223,0.8926284254200217
llm_goals_427,test,26,0.6321043688939182,0.0591453922508401
llm_goals_427,test,27,0.7919311770006959,0.5016671352552752
llm_goals_427,test,28,0.98302234710588,0.9189449605602464
llm_goals_427,test,29,0.6264245164753564,0.5267252864404038
llm_goals_427,test,30,0.6321043688939182,0.3196802851986922
llm_goals_427,test,31,0.947730257127236,0.0622742618121558
llm_goals_427,test,32,0.9237100008388404,0.2393552597896355
llm_goals_427,test,33,0.2081818556883427,0.0317774218950805
llm_goals_427,test,34,0.6321043688939182,0.2969897604985466
llm_goals_427,test,35,0.8706838638718468,0.911826685378058
llm_goals_427,test,36,0.8164159826773449,0.5044385498946317
llm_goals_427,test,37,0.7859926096238357,0.961152239017662
llm_goals_427,test,38,0.5263616206192477,0.383885411527425
llm_goals_427,test,39,0.4121140464058971,0.0767754062509803
llm_goals_427,test,40,0.9904849525535764,0.3019915478879681
llm_goals_427,test,41,0.160026232871865,0.0597208539505394
llm_goals_427,test,42,0.9503446994493456,0.9798415326165176
llm_goals_427,test,43,0.419065256318945,0.0828234646890313
llm_goals_427,test,44,0.6167416871053722,0.1075404432723246
llm_goals_427,test,45,0.9395437750546628,0.9497563751433828
llm_goals_427,test,46,0.3040648667345251,0.2027056215184361
llm_goals_427,test,47,0.947730257127236,0.9493266919171398
llm_goals_427,test,48,0.599709284370368,0.0344289143960405
llm_goals_427,test,49,0.419065256318945,0.1952894749193552
llm_goals_186,test,0,0.9631457311756436,0.534925569771277
llm_goals_186,test,1,0.5983183791997791,0.0649953944046378
llm_goals_186,test,2,0.9692789996298776,0.91763923479236
llm_goals_186,test,3,0.6113671304199514,0.3425021516930106
llm_goals_186,test,4,0.5933211308238896,0.1153021531057396
llm_goals_186,test,5,0.8747787649369047,0.7928793741281699
llm_goals_186,test,6,0.9407853519117952,0.9038094070559602
llm_goals_186,test,7,0.9465907181485383,0.6367372560980368
llm_goals_186,test,8,0.1904957745583066,0.2126364849604726
llm_goals_186,test,9,0.8120936833432515,0.8694824597543704
llm_goals_186,test,10,0.0820855549975484,0.5802607311846129
llm_goals_186,test,11,0.9566045159731936,0.2225491999116792
llm_goals_186,test,12,0.3252361573674235,0.2300986684078339
llm_goals_186,test,13,0.8798052619609892,0.9257638147127129
llm_goals_186,test,14,0.1550075646007755,0.1695718974503099
llm_goals_186,test,15,0.0820855549975484,0.151038541979901
llm_goals_186,test,16,0.2134455998685991,0.0464142133590747
llm_goals_186,test,17,0.08351979250002,0.0732763222959853
llm_goals_186,test,18,0.3885488204046692,0.0482171595539919
llm_goals_186,test,19,0.3485125263587582,0.347547591319228
llm_goals_186,test,20,0.4776563573712507,0.1739822028354879
llm_goals_186,test,21,0.9663049104539188,0.9541198242132036
llm_goals_186,test,22,0.12471453034617,0.049497112506125
llm_goals_186,test,23,0.6113671304199514,0.1810016520865223
llm_goals_186,test,24,0.3385506583380203,0.1851077351512521
llm_goals_186,test,25,0.6807866956311596,0.6713192505556377
llm_goals_186,test,26,0.9921217093459382,0.0711032925420902
llm_goals_186,test,27,0.1762487838841639,0.4081627252904761
llm_goals_186,test,28,0.1762487838841639,0.2745405964802801
llm_goals_186,test,29,0.7082375907976941,0.1854855714896691
llm_goals_186,test,30,0.890376120770417,0.7354449882906446
llm_goals_186,test,31,0.8947122644376758,0.9912562823764032
llm_goals_186,test,32,0.6066531440659316,0.2618042375153737
llm_goals_186,test,33,0.2134455998685991,0.0337875336716617
llm_goals_186,test,34,0.890376120770417,0.6428971957222914
llm_goals_186,test,35,0.0820855549975484,0.7900459432200765
llm_goals_186,test,36,0.7697026904727476,0.8730032999439788
llm_goals_186,test,37,0.4214063421599405,0.0649927594327202
llm_goals_186,test,38,0.4366780107352097,0.0471132735562561
llm_goals_186,test,39,0.7408324961647307,0.2481877539812294
llm_goals_186,test,40,0.9956222363036892,0.2111860555781098
llm_goals_186,test,41,0.9819813749053732,0.8712882416841639
llm_goals_186,test,42,0.9465907181485383,0.6193248853412385
llm_goals_186,test,43,0.9954620956531488,0.8760979623283635
llm_goals_186,test,44,0.5933211308238896,0.0767958111106498
llm_goals_186,test,45,0.6113671304199514,0.0848440049881495
llm_goals_186,test,46,0.9559763361117734,0.6601266976660584
llm_goals_186,test,47,0.4908576527089256,0.4818652455075419
llm_goals_186,test,48,0.0690818587433053,0.1752603358335205
llm_goals_186,test,49,0.6113671304199514,0.027320507820661
llm_goals_133,test,0,0.4559093883834618,0.1030518399074919
llm_goals_133,test,1,0.969908155530912,0.1009270067527766
llm_goals_133,test,2,0.2139357723421015,0.4669147668825159
llm_goals_133,test,3,0.1357085126033054,0.9886211587587188
llm_goals_133,test,4,0.958188989661608,0.6589999206031925
llm_goals_133,test,5,0.9171310858405564,0.0478680529217008
llm_goals_133,test,6,0.0750534423160929,0.0213367665689539
llm_goals_133,test,7,0.0305362101698243,0.06300162626541
llm_goals_133,test,8,0.905613904942175,0.8613404237563876
llm_goals_133,test,9,0.3756828940033098,0.0502374017351794
llm_goals_133,test,10,0.9182632431193848,0.0728398857397339
llm_goals_133,test,11,0.5218790490511612,0.0886358546776828
llm_goals_133,test,12,0.7503719741196108,0.4714116383526195
llm_goals_133,test,13,0.01856803671873,0.0406440348343292
llm_goals_133,test,14,0.9734651574332298,0.8416674339341796
llm_goals_133,test,15,0.6600733369103863,0.5989281494815651
llm_goals_133,test,16,0.1357085126033054,0.9641061261695968
llm_goals_133,test,17,0.6756268837558906,0.0521719884710187
llm_goals_133,test,18,0.8679953553293617,0.9257678218156756
llm_goals_133,test,19,0.138961592024264,0.0409677417198195
llm_goals_133,test,20,0.0897975026805257,0.9201317528016504
llm_goals_133,test,21,0.0897975026805257,0.0611858046803647
llm_goals_133,test,22,0.0444151759650052,0.0749444450486417
llm_goals_133,test,23,0.9732529539242084,0.484676139228053
llm_goals_133,test,24,0.1083245795059067,0.8221724152075577
llm_goals_133,test,25,0.5089088647140888,0.2957602203771531
llm_goals_133,test,26,0.0544967071399587,0.8046360378637115
llm_goals_133,test,27,0.9182632431193848,0.0759761030516968
llm_goals_133,test,28,0.1805423061540022,0.9366340572155704
llm_goals_133,test,29,0.3999700936731424,0.1272708658186502
llm_goals_133,test,30,0.665659391421771,0.1227999985147976
llm_goals_133,test,31,0.6519497363936658,0.0136010194313778
llm_goals_133,test,32,0.0776500376849175,0.3597276462870885
llm_goals_133,test,33,0.1159296318103267,0.8726937465962196
llm_goals_133,test,34,0.3452190382512341,0.2894476365444396
llm_goals_133,test,35,0.0517110236990523,0.0165111879681815
llm_goals_133,test,36,0.7939503755144868,0.0576655273020702
llm_goals_133,test,37,0.138961592024264,0.2554780098122276
llm_goals_133,test,38,0.5604890736768211,0.032809734462924
llm_goals_133,test,39,0.6600733369103863,0.1481243946785008
llm_goals_133,test,40,0.0416826941994386,0.4462128198301662
llm_goals_133,test,41,0.3064147357983886,0.093264815138027
llm_goals_133,test,42,0.0540122353414662,0.2383228605626679
llm_goals_133,test,43,0.0897975026805257,0.196654087051587
llm_goals_133,test,44,0.623498813461612,0.9747002088111656
llm_goals_133,test,45,0.6109855984975063,0.9831163433792584
llm_goals_133,test,46,0.0403068832705345,0.1097011751248294
llm_goals_133,test,47,0.9182632431193848,0.8283354147237331
llm_goals_133,test,48,0.9721755233008385,0.8799294836893965
llm_goals_133,test,49,0.969908155530912,0.2364671831052382
llm_goals_81,test,0,0.0589077184235156,0.1758977435560022
llm_goals_81,test,1,0.1080996786872263,0.4421252700970533
llm_goals_81,test,2,0.420480119877041,0.5612444031805882
llm_goals_81,test,3,0.0777960215726907,0.3079533253993743
llm_goals_81,test,4,0.2453845477978662,0.1763212150593861
llm_goals_81,test,5,0.0971304727903281,0.9704465583106344
llm_goals_81,test,6,0.1274018308243188,0.9821312875358365
llm_goals_81,test,7,0.0616935257298143,0.3270685617728195
llm_goals_81,test,8,0.1934684660684231,0.4843756215736013
llm_goals_81,test,9,0.1099648716919228,0.9933654977534896
llm_goals_81,test,10,0.1704754987552471,0.4711097472541105
llm_goals_81,test,11,0.3369167543199748,0.1673212093996636
llm_goals_81,test,12,0.2453845477978662,0.2643530158966523
llm_goals_81,test,13,0.1732187973813612,0.9714035818561728
llm_goals_81,test,14,0.0394724154779062,0.9265405587707818
llm_goals_81,test,15,0.113129399193254,0.1723195082090535
llm_goals_81,test,16,0.0209726895260339,0.9360974516501586
llm_goals_81,test,17,0.1419335340595952,0.4363540220565442
llm_goals_81,test,18,0.0781809719432033,0.9611565911249424
llm_goals_81,test,19,0.0659901418058653,0.0324757314893466
llm_goals_81,test,20,0.2453845477978662,0.6006056520074408
llm_goals_81,test,21,0.0907225841662123,0.9971859123159944
llm_goals_81,test,22,0.420480119877041,0.0870371051461664
llm_goals_81,test,23,0.1001089207089741,0.2408633212672459
llm_goals_81,test,24,0.1099648716919228,0.9951702226622482
llm_goals_81,test,25,0.0659901418058653,0.6867633490140795
llm_goals_81,test,26,0.1274018308243188,0.9718244652881064
llm_goals_81,test,27,0.3322254624981693,0.4588186617124049
llm_goals_81,test,28,0.2240714746818266,0.5322330497164953
llm_goals_81,test,29,0.0659901418058653,0.2121016556019813
llm_goals_81,test,30,0.3863431232092621,0.6774810136296258
llm_goals_81,test,31,0.2875225511762614,0.9816113605758902
llm_goals_81,test,32,0.2667986815824979,0.2656694493977183
llm_goals_81,test,33,0.0781809719432033,0.942492448912156
llm_goals_81,test,34,0.1223903272838119,0.6429005762747164
llm_goals_81,test,35,0.1433904692341786,0.1528167702888629
llm_goals_81,test,36,0.1274018308243188,0.4512348514816248
llm_goals_81,test,37,0.3739498348987752,0.0605006450173409
llm_goals_81,test,38,0.1080996786872263,0.0274755323758623
llm_goals_81,test,39,0.1433904692341786,0.2279901766778581
llm_goals_81,test,40,0.420480119877041,0.2775541527352398
llm_goals_81,test,41,0.0781809719432033,0.9829489706314426
llm_goals_81,test,42,0.0781809719432033,0.2494339762077133
llm_goals_81,test,43,0.2453845477978662,0.9819424303599844
llm_goals_81,test,44,0.1080996786872263,0.632760349651464
llm_goals_81,test,45,0.2240714746818266,0.090990563553155
llm_goals_81,test,46,0.1730948343833815,0.0910438800719751
llm_goals_81,test,47,0.1080996786872263,0.1292081639058968
llm_goals_81,test,48,0.0781809719432033,0.974747372736112
llm_goals_81,test,49,0.2453845477978662,0.2645580764012665
llm_goals_93,test,0,0.169706854840785,0.5635269221536086
llm_goals_93,test,1,0.020151398397673,0.8801163792253427
llm_goals_93,test,2,0.0987736064069792,0.0696003588446044
llm_goals_93,test,3,0.7151712106556259,0.8186048531566104
llm_goals_93,test,4,0.0425330063448706,0.2222011584760154
llm_goals_93,test,5,0.0626991855260315,0.1268359519713418
llm_goals_93,test,6,0.2561414757385663,0.4582622566067956
llm_goals_93,test,7,0.626541610238238,0.429479690525812
llm_goals_93,test,8,0.0563954385908228,0.1536290973166499
llm_goals_93,test,9,0.0202227122263221,0.6112573193671209
llm_goals_93,test,10,0.7674066697577696,0.7998858649804967
llm_goals_93,test,11,0.0766147899752141,0.5454222135748753
llm_goals_93,test,12,0.6122648113230418,0.2508427619545539
llm_goals_93,test,13,0.0766147899752141,0.0884842413878226
llm_goals_93,test,14,0.1347943316363481,0.6768600290465995
llm_goals_93,test,15,0.026607640234176,0.0352718405868165
llm_goals_93,test,16,0.1347943316363481,0.8009568965617743
llm_goals_93,test,17,0.1109157047850289,0.8092096317591537
llm_goals_93,test,18,0.4325312994224439,0.963804174465268
llm_goals_93,test,19,0.6062245797660748,0.9058854167265824
llm_goals_93,test,20,0.0425330063448706,0.265390180652688
llm_goals_93,test,21,0.2561414757385663,0.1541113602215154
llm_goals_93,test,22,0.0362346800278078,0.9766790566784582
llm_goals_93,test,23,0.0720206010722747,0.7843335253318285
llm_goals_93,test,24,0.1347943316363481,0.548404369330273
llm_goals_93,test,25,0.8708495685377148,0.9813529135147334
llm_goals_93,test,26,0.3366039802055577,0.9397963116499958
llm_goals_93,test,27,0.2362404235303432,0.542547443300257
llm_goals_93,test,28,0.2362404235303432,0.8277938193324692
llm_goals_93,test,29,0.020151398397673,0.8549419878819347
llm_goals_93,test,30,0.6438464531979535,0.9761371695174176
llm_goals_93,test,31,0.0629959139812336,0.1774015734695253
llm_goals_93,test,32,0.1685990893728533,0.9590755456587298
llm_goals_93,test,33,0.0852618561899201,0.9496314531215296
llm_goals_93,test,34,0.0119674661063761,0.9112802317013324
llm_goals_93,test,35,0.0777768252220382,0.0646469314244137
llm_goals_93,test,36,0.7917928166051958,0.965643964207344
llm_goals_93,test,37,0.0394159552584301,0.963180821243277
llm_goals_93,test,38,0.1715176427909161,0.9411316422109696
llm_goals_93,test,39,0.5670877241996723,0.1075404372822008
llm_goals_93,test,40,0.1183135929288665,0.959466160286712
llm_goals_93,test,41,0.0220626729950221,0.3698215332403156
llm_goals_93,test,42,0.0210051630644776,0.1589404653011508
llm_goals_93,test,43,0.2561414757385663,0.2338719832936831
llm_goals_93,test,44,0.1347943316363481,0.1124984808029749
llm_goals_93,test,45,0.0534273204141915,0.866543330684459
llm_goals_93,test,46,0.232600312244377,0.8519759554788342
llm_goals_93,test,47,0.0362346800278078,0.8737971308795239
llm_goals_93,test,48,0.1347943316363481,0.8916334225039363
llm_goals_93,test,49,0.1147554096309258,0.8758339889840314
llm_goals_401,test,0,0.1025709385407213,0.1359674012107803
llm_goals_401,test,1,0.0862470273997913,0.939276601509621
llm_goals_401,test,2,0.2311649575007186,0.3090277756984529
llm_goals_401,test,3,0.1741771429629475,0.2822982814806737
llm_goals_401,test,4,0.5235185246789716,0.9227317209028506
llm_goals_401,test,5,0.0355442568776134,0.0683562610885711
llm_goals_401,test,6,0.1498846116619545,0.1529393504632372
llm_goals_401,test,7,0.1349332132227256,0.2291880493623187
llm_goals_401,test,8,0.9265417643305038,0.910221445630232
llm_goals_401,test,9,0.0279869383815441,0.0669374443869285
llm_goals_401,test,10,0.9454929215265458,0.2562041584734201
llm_goals_401,test,11,0.1096117498401532,0.1977345307962301
llm_goals_401,test,12,0.8932732209722387,0.9351182671047276
llm_goals_401,test,13,0.0279869383815441,0.084239780653768
llm_goals_401,test,14,0.1533634542032049,0.3803121877997557
llm_goals_401,test,15,0.9205633435034054,0.9255856152963072
llm_goals_401,test,16,0.0336319804238267,0.2187242193427731
llm_goals_401,test,17,0.0481813887418106,0.9062633304766484
llm_goals_401,test,18,0.1533634542032049,0.0989866685824555
llm_goals_401,test,19,0.242657477661261,0.0798642603957049
llm_goals_401,test,20,0.5235185246789716,0.7283447799445965
llm_goals_401,test,21,0.0279869383815441,0.3040102668224276
llm_goals_401,test,22,0.0959213297793621,0.8871123935548803
llm_goals_401,test,23,0.0503277563454289,0.6306703155992205
llm_goals_401,test,24,0.0224105039689347,0.342468541641041
llm_goals_401,test,25,0.2546060119315204,0.0306332962828717
llm_goals_401,test,26,0.1533634542032049,0.1178928014307589
llm_goals_401,test,27,0.1511989289419739,0.8247832937930811
llm_goals_401,test,28,0.1608605612544864,0.3694959007053917
llm_goals_401,test,29,0.5660345611551753,0.0798909574616735
llm_goals_401,test,30,0.0402692866659738,0.3951674202836078
llm_goals_401,test,31,0.0338658114168048,0.466307960095254
llm_goals_401,test,32,0.1349332132227256,0.1971577420397864
llm_goals_401,test,33,0.7825571764610231,0.1760928155683087
llm_goals_401,test,34,0.0402692866659738,0.2047678657851429
llm_goals_401,test,35,0.0771115665850084,0.2637872561841102
llm_goals_401,test,36,0.4747437189544288,0.4724849406439279
llm_goals_401,test,37,0.8669726160793032,0.0192510310263775
llm_goals_401,test,38,0.0179628678367229,0.1812826057265395
llm_goals_401,test,39,0.8932732209722387,0.905821781657468
llm_goals_401,test,40,0.0450964676982052,0.1146947001091413
llm_goals_401,test,41,0.0338658114168048,0.1032293515072512
llm_goals_401,test,42,0.0959213297793621,0.3834835806051595
llm_goals_401,test,43,0.1607403922750956,0.2508475125103526
llm_goals_401,test,44,0.9205567379687908,0.8248843542416243
llm_goals_401,test,45,0.643625021428926,0.5847666727108293
llm_goals_401,test,46,0.0939249649628366,0.4045147001032884
llm_goals_401,test,47,0.643625021428926,0.6278339401682421
llm_goals_401,test,48,0.0224105039689347,0.1361878043204594
llm_goals_401,test,49,0.8933252080235167,0.8435596200846341
