template_id,split,question_idx,prediction,label
llm_goals_449,test,0,0.2056360890473946,0.1336325872199141
llm_goals_449,test,1,0.2710079900598266,0.2356014848705813
llm_goals_449,test,2,0.1892592207369678,0.3977331353545913
llm_goals_449,test,3,0.9283257794592137,0.9671817093217177
llm_goals_449,test,4,0.7511209516909255,0.7857460873195503
llm_goals_449,test,5,0.05144787460396177,0.5164481763709956
llm_goals_449,test,6,0.05144787460396177,0.0370459810848937
llm_goals_449,test,7,0.25632737845074977,0.2618660511464079
llm_goals_449,test,8,0.8044653463597701,0.9771937256062914
llm_goals_449,test,9,0.06133346138546553,0.0204302625650166
llm_goals_449,test,10,0.20722184498982946,0.0731782442371117
llm_goals_449,test,11,0.14710273099451238,0.0091003072940505
llm_goals_449,test,12,0.11280219030870615,0.1108627498844831
llm_goals_449,test,13,0.14428128356815906,0.054840421346723
llm_goals_449,test,14,0.7429346699274001,0.8313263696124994
llm_goals_449,test,15,0.7246120573246716,0.8253071431638606
llm_goals_449,test,16,0.7039036009093845,0.831142754565476
llm_goals_449,test,17,0.5746587220990261,0.3065891414116863
llm_goals_449,test,18,0.6035883900340583,0.4235929706341914
llm_goals_449,test,19,0.522911251116226,0.2342867705548718
llm_goals_449,test,20,0.544802902774118,0.5687148418873526
llm_goals_449,test,21,0.3565426752699285,0.4888083146033534
llm_goals_449,test,22,0.06314091388556037,0.0069036151286541
llm_goals_449,test,23,0.89331803366876,0.0739780745569788
llm_goals_449,test,24,0.8895364415320229,0.9314584192860104
llm_goals_449,test,25,0.17929653134298698,0.1420477852561596
llm_goals_449,test,26,0.39609211138291406,0.7006375316273405
llm_goals_449,test,27,0.13994316535367982,0.0612984362789981
llm_goals_449,test,28,0.2553633303416622,0.9549750406111494
llm_goals_449,test,29,0.6840217666118091,0.2943014776892277
llm_goals_449,test,30,0.19638372998368694,0.0576629803259434
llm_goals_449,test,31,0.15417653531706496,0.2255338162735628
llm_goals_449,test,32,0.34779351509262296,0.0217578202648259
llm_goals_449,test,33,0.7901324546759616,0.5881005329750926
llm_goals_449,test,34,0.12827948991067617,0.0656003360881953
llm_goals_449,test,35,0.40531759182261506,0.1899455989825758
llm_goals_449,test,36,0.0447258889982074,0.1356723510839239
llm_goals_449,test,37,0.5037147077875584,0.1724577552330986
llm_goals_449,test,38,0.8910102855815912,0.097576330461044
llm_goals_449,test,39,0.14094725851399123,0.0831443503045603
llm_goals_449,test,40,0.14603595625454316,0.0085659129540734
llm_goals_449,test,41,0.05144787460396177,0.0438119169092525
llm_goals_449,test,42,0.18974685242827458,0.4942733211865646
llm_goals_449,test,43,0.09508318153989948,0.1247723307463423
llm_goals_449,test,44,0.4937276723296124,0.8400723355781036
llm_goals_449,test,45,0.97332718581906,0.925208223971735
llm_goals_449,test,46,0.7198564069719947,0.0740922882863047
llm_goals_449,test,47,0.6476537618427886,0.9373555404045412
llm_goals_449,test,48,0.29201098838510264,0.3920310752556691
llm_goals_449,test,49,0.23058263600219564,0.0277662962683335
llm_goals_75,test,0,0.9335511159346419,0.8642124165137652
llm_goals_75,test,1,0.9699749247777086,0.910359703136258
llm_goals_75,test,2,0.6556043242086942,0.8128286324258283
llm_goals_75,test,3,0.657792185628972,0.1661489886313124
llm_goals_75,test,4,0.20223591902394533,0.1236451678860016
llm_goals_75,test,5,0.8236495588930114,0.6739037233559247
llm_goals_75,test,6,0.8447204179848992,0.1134434733777058
llm_goals_75,test,7,0.8663800148396975,0.6946055843235053
llm_goals_75,test,8,0.07505504422864294,0.1004496505890182
llm_goals_75,test,9,0.6427959077769095,0.1540130266900075
llm_goals_75,test,10,0.4422081499273524,0.3569515830662073
llm_goals_75,test,11,0.8088733275469903,0.4576154291835114
llm_goals_75,test,12,0.6645010966898913,0.1367346048355968
llm_goals_75,test,13,0.3250113955456698,0.0646890805500496
llm_goals_75,test,14,0.9429117795640015,0.1675122689898172
llm_goals_75,test,15,0.5914174208485194,0.069582458224139
llm_goals_75,test,16,0.18040572473137953,0.2354277864496811
llm_goals_75,test,17,0.9038521931639254,0.9447837743973488
llm_goals_75,test,18,0.7772175660928761,0.0781001795812696
llm_goals_75,test,19,0.8504287278367823,0.4868721494751054
llm_goals_75,test,20,0.24888142079863385,0.1033036348939128
llm_goals_75,test,21,0.6762059293844711,0.1276999559430948
llm_goals_75,test,22,0.812656383846364,0.8431325364742722
llm_goals_75,test,23,0.5637701589885737,0.7460283918906632
llm_goals_75,test,24,0.9113982749939703,0.192573320599938
llm_goals_75,test,25,0.6713338387727005,0.3801085776614793
llm_goals_75,test,26,0.3841111029961057,0.1267870145951939
llm_goals_75,test,27,0.842812731517027,0.9607504432606712
llm_goals_75,test,28,0.29023786396964163,0.0423146645658729
llm_goals_75,test,29,0.8458133670152269,0.4777054812224888
llm_goals_75,test,30,0.6257744003303973,0.4822637810175876
llm_goals_75,test,31,0.09225163444890262,0.0805248550261055
llm_goals_75,test,32,0.696815172993302,0.6890841093919252
llm_goals_75,test,33,0.5828150923289322,0.1145962248845397
llm_goals_75,test,34,0.515951199625063,0.2921261463182895
llm_goals_75,test,35,0.8505773216376902,0.6530562837025381
llm_goals_75,test,36,0.6660119994936683,0.1183304077208745
llm_goals_75,test,37,0.7533806511622562,0.868052766582826
llm_goals_75,test,38,0.5210975811695298,0.6535917953521371
llm_goals_75,test,39,0.6283040555611275,0.0644053193022136
llm_goals_75,test,40,0.7772175660928763,0.6019618834627347
llm_goals_75,test,41,0.5395865178080234,0.230389069862908
llm_goals_75,test,42,0.9264775990231815,0.7894553184375537
llm_goals_75,test,43,0.7677729957068532,0.2977582471382819
llm_goals_75,test,44,0.9592029694051522,0.2211815525008748
llm_goals_75,test,45,0.824424996519113,0.0745441466493943
llm_goals_75,test,46,0.44518671479594846,0.7127955514788996
llm_goals_75,test,47,0.45568259255088117,0.0161223980025345
llm_goals_75,test,48,0.7772175660928763,0.1382513395050604
llm_goals_75,test,49,0.8949771907834251,0.9815106661613362
llm_goals_305,test,0,0.13642985228628013,0.2062097726301097
llm_goals_305,test,1,0.4902577190531124,0.7603213407742078
llm_goals_305,test,2,0.1755586595276372,0.0406395612652842
llm_goals_305,test,3,0.6504796394303275,0.4422001539134155
llm_goals_305,test,4,0.083598056280841,0.2689791708049951
llm_goals_305,test,5,0.06232309588400794,0.1412581238797707
llm_goals_305,test,6,0.09076678631573236,0.0992911357773575
llm_goals_305,test,7,0.187899677172219,0.1984947738037692
llm_goals_305,test,8,0.17328600442889394,0.1577864619647619
llm_goals_305,test,9,0.36038786836726283,0.0621641107275182
llm_goals_305,test,10,0.6848997750868882,0.9879174023450592
llm_goals_305,test,11,0.2483291808544392,0.5269669419962362
llm_goals_305,test,12,0.12001115934933519,0.2105593475656798
llm_goals_305,test,13,0.12047888208968993,0.2072161629845012
llm_goals_305,test,14,0.6746275410091812,0.6545892217736428
llm_goals_305,test,15,0.1544733320738488,0.5104040428268571
llm_goals_305,test,16,0.6708537918901234,0.5524398163622298
llm_goals_305,test,17,0.3849446942577021,0.8665614751565875
llm_goals_305,test,18,0.5877714098808315,0.3175479682579358
llm_goals_305,test,19,0.2985051422974985,0.3701558259397783
llm_goals_305,test,20,0.14974469783224498,0.0528314061272507
llm_goals_305,test,21,0.18550132351188073,0.3148726989644924
llm_goals_305,test,22,0.3933091508407534,0.447303668549321
llm_goals_305,test,23,0.3314373451796177,0.1744797562558885
llm_goals_305,test,24,0.6846798330595956,0.8158235756439657
llm_goals_305,test,25,0.8996911043687544,0.9578316364476024
llm_goals_305,test,26,0.7587523572464089,0.5595920193399587
llm_goals_305,test,27,0.5095599275178687,0.5967193097172223
llm_goals_305,test,28,0.6504796394303275,0.9037929343333102
llm_goals_305,test,29,0.35942548391535806,0.278165145436113
llm_goals_305,test,30,0.015375370696476633,0.9532629887346658
llm_goals_305,test,31,0.20381426230849295,0.5121334481158791
llm_goals_305,test,32,0.39581369756505874,0.1605879890433021
llm_goals_305,test,33,0.4482304399723312,0.6222808213139804
llm_goals_305,test,34,0.9052463320927017,0.9709568242405192
llm_goals_305,test,35,0.35229617626589893,0.5513220475450542
llm_goals_305,test,36,0.8656067187754702,0.9876292784574268
llm_goals_305,test,37,0.33566462761157156,0.258566594074644
llm_goals_305,test,38,0.39622718951124297,0.3940893870837836
llm_goals_305,test,39,0.19688815961842343,0.6249683049434822
llm_goals_305,test,40,0.19387439795151465,0.036012250509986
llm_goals_305,test,41,0.3025024468931072,0.0238784684017155
llm_goals_305,test,42,0.10642855627416936,0.1015334102504109
llm_goals_305,test,43,0.2510078675124326,0.0682627831684364
llm_goals_305,test,44,0.19797147809952634,0.0901285910304827
llm_goals_305,test,45,0.7491188298327821,0.8520020311890948
llm_goals_305,test,46,0.3790900520814587,0.512946133742762
llm_goals_305,test,47,0.5065847805734667,0.9460715758270588
llm_goals_305,test,48,0.6252624152488999,0.2634284981215168
llm_goals_305,test,49,0.3653637732442101,0.5226278491298435
llm_goals_263,test,0,0.68612282166003,0.9722113849684072
llm_goals_263,test,1,0.2855642845650543,0.4308884142088059
llm_goals_263,test,2,0.2502068578401951,0.9112282637417588
llm_goals_263,test,3,0.3752739564139513,0.4678322072304764
llm_goals_263,test,4,0.6820436096013777,0.0681171790473069
llm_goals_263,test,5,0.27052981460303976,0.3304750158657515
llm_goals_263,test,6,0.22515519777589976,0.1049596434028026
llm_goals_263,test,7,0.7647390806981545,0.868290478100796
llm_goals_263,test,8,0.01807281279728787,0.0107688258732955
llm_goals_263,test,9,0.7095233985334611,0.5335894362422906
llm_goals_263,test,10,0.5578462448612823,0.4571801332195204
llm_goals_263,test,11,0.33618746173549874,0.4017475232284387
llm_goals_263,test,12,0.2787570206687094,0.7410716651377723
llm_goals_263,test,13,0.312416962337458,0.2222869461895513
llm_goals_263,test,14,0.42806507176269903,0.0236037417776026
llm_goals_263,test,15,0.30871432419525613,0.0998823008982278
llm_goals_263,test,16,0.17754509793227657,0.0090037236123257
llm_goals_263,test,17,0.22543686603146373,0.3371875979935536
llm_goals_263,test,18,0.2986584726277091,0.2095794100566156
llm_goals_263,test,19,0.1509370713337069,0.1483621477954244
llm_goals_263,test,20,0.2967600885869455,0.2829259876769517
llm_goals_263,test,21,0.2797957626582912,0.1128506991103582
llm_goals_263,test,22,0.8155834639485003,0.8918927085227047
llm_goals_263,test,23,0.24751756969522312,0.1960590879366542
llm_goals_263,test,24,0.3714622020594562,0.0409316032122589
llm_goals_263,test,25,0.276576581371969,0.1971178454456452
llm_goals_263,test,26,0.3690834181909497,0.290576284754869
llm_goals_263,test,27,0.25001305790737255,0.3914767323316075
llm_goals_263,test,28,0.19021096007142846,0.3629055172172753
llm_goals_263,test,29,0.087359471141271,0.0312142081028261
llm_goals_263,test,30,0.5965872812830746,0.1928083275379132
llm_goals_263,test,31,0.432812459392039,0.318621097342132
llm_goals_263,test,32,0.4252151791084457,0.1747653444762649
llm_goals_263,test,33,0.4320163272373652,0.0531218265570888
llm_goals_263,test,34,0.2574782767589469,0.1598154925951403
llm_goals_263,test,35,0.33618746173549874,0.94307484220015
llm_goals_263,test,36,0.23657661732375249,0.5041818847108344
llm_goals_263,test,37,0.15127267177275872,0.1111175217519077
llm_goals_263,test,38,0.22316155454461384,0.1867701836992809
llm_goals_263,test,39,0.30871432419525613,0.9513736387795227
llm_goals_263,test,40,0.2652545923975936,0.726601907835183
llm_goals_263,test,41,0.4546893015136073,0.2793940710071973
llm_goals_263,test,42,0.4348344944914824,0.7591325538288878
llm_goals_263,test,43,0.21287342088468075,0.0599255853483329
llm_goals_263,test,44,0.11725338686719868,0.0248060297565235
llm_goals_263,test,45,0.30436884837187506,0.4429293016127257
llm_goals_263,test,46,0.2752105451223601,0.3978895760863248
llm_goals_263,test,47,0.5041456175585018,0.9291514786865128
llm_goals_263,test,48,0.5711219912189175,0.2313178866490127
llm_goals_263,test,49,0.6348032752425167,0.3779293731936072
llm_goals_157,test,0,0.7685672215674496,0.7943095194508789
llm_goals_157,test,1,0.02293025773672967,0.0516624712053447
llm_goals_157,test,2,0.7439934259767925,0.8020233336204885
llm_goals_157,test,3,0.40360002587697225,0.5904722684734964
llm_goals_157,test,4,0.863039184974661,0.9619353001797089
llm_goals_157,test,5,0.5660155878152956,0.6767415952202784
llm_goals_157,test,6,0.6320914226359365,0.7612977247981438
llm_goals_157,test,7,0.6993271909919417,0.6294506387377161
llm_goals_157,test,8,0.863039184974661,0.8937361945430545
llm_goals_157,test,9,0.31327017114345934,0.9788153257749777
llm_goals_157,test,10,0.6364843565246948,0.8824125505492224
llm_goals_157,test,11,0.2095906878699012,0.199986733795525
llm_goals_157,test,12,0.8819090996088711,0.9284577144290443
llm_goals_157,test,13,0.574926861175519,0.9240516415338534
llm_goals_157,test,14,0.2461248059144481,0.2475658313194042
llm_goals_157,test,15,0.9222309556445959,0.976340679507306
llm_goals_157,test,16,0.07601047318574854,0.3126950781624377
llm_goals_157,test,17,0.07087669607642867,0.046177739393252
llm_goals_157,test,18,0.4678354805112159,0.4250899393616417
llm_goals_157,test,19,0.629960941120263,0.6637557888114428
llm_goals_157,test,20,0.9222309556445959,0.9747431080575436
llm_goals_157,test,21,0.8747186633344226,0.566102644985123
llm_goals_157,test,22,0.2319580949978116,0.4645121573786108
llm_goals_157,test,23,0.026566411185268535,0.1429816093888423
llm_goals_157,test,24,0.19122373512328808,0.0397822616409018
llm_goals_157,test,25,0.6364843565246948,0.2832629442692311
llm_goals_157,test,26,0.3469667981577083,0.3005834296865567
llm_goals_157,test,27,0.16851339622954262,0.049069242775247
llm_goals_157,test,28,0.8036743214342893,0.2908678434467844
llm_goals_157,test,29,0.20877205370467591,0.1061660413895585
llm_goals_157,test,30,0.4371141435751908,0.5164500368467446
llm_goals_157,test,31,0.66410479762629,0.9364517603204892
llm_goals_157,test,32,0.15605550515612845,0.0583368009018155
llm_goals_157,test,33,0.07601047318574854,0.102471328139649
llm_goals_157,test,34,0.629940212323569,0.7754930766823708
llm_goals_157,test,35,0.8076180714624158,0.930098280704675
llm_goals_157,test,36,0.6364843565246948,0.8978537108401503
llm_goals_157,test,37,0.05502341222794784,0.185447729939923
llm_goals_157,test,38,0.27199627433678814,0.4989516423125952
llm_goals_157,test,39,0.9457512091580452,0.8172337053734404
llm_goals_157,test,40,0.026360413469477966,0.3208967259617554
llm_goals_157,test,41,0.26236192800500124,0.9628746978064082
llm_goals_157,test,42,0.7383780408869081,0.9537549409903032
llm_goals_157,test,43,0.25740202624242464,0.9854372229811326
llm_goals_157,test,44,0.863039184974661,0.9446223273489608
llm_goals_157,test,45,0.6401102865558986,0.917287033427004
llm_goals_157,test,46,0.4619846074583657,0.2958138118998824
llm_goals_157,test,47,0.7773178160941544,0.7644578181201236
llm_goals_157,test,48,0.23930467751597587,0.2919786437406029
llm_goals_157,test,49,0.48662085906134384,0.2435548949640933
llm_goals_358,test,0,0.7927648003142135,0.9710288332808288
llm_goals_358,test,1,0.9083410332229676,0.1090780967183576
llm_goals_358,test,2,0.765304717544109,0.8957724929016077
llm_goals_358,test,3,0.14391501617885674,0.0314742636417454
llm_goals_358,test,4,0.8695847230863584,0.9345866127648594
llm_goals_358,test,5,0.4867665835869821,0.3075908794558576
llm_goals_358,test,6,0.2878597362445903,0.1938894394639401
llm_goals_358,test,7,0.9057179453262494,0.9366675383938772
llm_goals_358,test,8,0.9563424377514261,0.9600018984290702
llm_goals_358,test,9,0.16445987493723105,0.0356972898371527
llm_goals_358,test,10,0.34717015722306654,0.7396882546703099
llm_goals_358,test,11,0.4679488574091037,0.0409023187764638
llm_goals_358,test,12,0.5344359170522962,0.0976624021485058
llm_goals_358,test,13,0.24091797308955532,0.1216232236474993
llm_goals_358,test,14,0.8262167238763699,0.7864359180640846
llm_goals_358,test,15,0.904972671680885,0.8556484582282166
llm_goals_358,test,16,0.8561013649518058,0.7341230488107452
llm_goals_358,test,17,0.629548514033787,0.2726809060238253
llm_goals_358,test,18,0.3759894473840755,0.7566054280756713
llm_goals_358,test,19,0.7650641389444779,0.0434563732454263
llm_goals_358,test,20,0.7610083958423278,0.8243328886415383
llm_goals_358,test,21,0.14003159914022387,0.1112076480131408
llm_goals_358,test,22,0.08837325955364093,0.0845862458189736
llm_goals_358,test,23,0.7761567296473063,0.0375312043866978
llm_goals_358,test,24,0.7857085156311046,0.8172477900339192
llm_goals_358,test,25,0.7800074905211648,0.9764694049382328
llm_goals_358,test,26,0.8056063277901065,0.7040948478982805
llm_goals_358,test,27,0.38578460207925397,0.125707811898555
llm_goals_358,test,28,0.25146411262928087,0.1566378003751444
llm_goals_358,test,29,0.6802776019485471,0.1707030695577025
llm_goals_358,test,30,0.8044556522065606,0.7917262984233946
llm_goals_358,test,31,0.6651350024556743,0.0448402492326266
llm_goals_358,test,32,0.9186259668241842,0.0880149966006802
llm_goals_358,test,33,0.9218265030962405,0.9036261072893176
llm_goals_358,test,34,0.14432228831899382,0.6926631691100236
llm_goals_358,test,35,0.755895335407892,0.772573980123232
llm_goals_358,test,36,0.16187028364288672,0.443962006250219
llm_goals_358,test,37,0.8317226006480688,0.5987374702917627
llm_goals_358,test,38,0.45832615519322245,0.0973650244988885
llm_goals_358,test,39,0.6129513779997086,0.0374517082121219
llm_goals_358,test,40,0.07349624080618056,0.0459188553104236
llm_goals_358,test,41,0.07367426215166403,0.067381376462992
llm_goals_358,test,42,0.765304717544109,0.9322344143419644
llm_goals_358,test,43,0.055757066516752274,0.0773258781385884
llm_goals_358,test,44,0.6856326164535372,0.9867304662942348
llm_goals_358,test,45,0.676858185079891,0.0921047575496883
llm_goals_358,test,46,0.18377450208562887,0.0203810451816961
llm_goals_358,test,47,0.3101573995027192,0.0161558697095388
llm_goals_358,test,48,0.6706917189657506,0.7751475880899051
llm_goals_358,test,49,0.6198332784945465,0.4160470958249456
llm_goals_78,test,0,0.24754224217588328,0.2251708162334548
llm_goals_78,test,1,0.3913637438002264,0.0367340336052023
llm_goals_78,test,2,0.18873004222949022,0.0527379912395899
llm_goals_78,test,3,0.2013843649907147,0.0259505842905422
llm_goals_78,test,4,0.22015402470259196,0.0939178372549231
llm_goals_78,test,5,0.12775093992546446,0.6658069720444946
llm_goals_78,test,6,0.19605094787369537,0.0424593855688115
llm_goals_78,test,7,0.18873004222949022,0.3068789421692927
llm_goals_78,test,8,0.2687563582470263,0.0254129292421898
llm_goals_78,test,9,0.0911980923725257,0.0407835069490974
llm_goals_78,test,10,0.9480522847024998,0.9375706694734316
llm_goals_78,test,11,0.7230314820518751,0.7386383432572439
llm_goals_78,test,12,0.41847287000876143,0.3108688169890243
llm_goals_78,test,13,0.2321512112767671,0.0946944663222736
llm_goals_78,test,14,0.14249255928281596,0.1717796546359565
llm_goals_78,test,15,0.23385375558361302,0.1277153625141483
llm_goals_78,test,16,0.10724823793518823,0.0689165589110325
llm_goals_78,test,17,0.8298576286031493,0.0883911059243408
llm_goals_78,test,18,0.0825884183916373,0.0337617130750813
llm_goals_78,test,19,0.633578159190023,0.7169547264343438
llm_goals_78,test,20,0.3097789098972572,0.1528222000997753
llm_goals_78,test,21,0.19091861390515805,0.0350685532944032
llm_goals_78,test,22,0.42936002973639437,0.0940461009061424
llm_goals_78,test,23,0.9658729722345805,0.9060885414573472
llm_goals_78,test,24,0.10568564291144521,0.0217941677583094
llm_goals_78,test,25,0.9543776318638875,0.9667879364041514
llm_goals_78,test,26,0.0636306845617639,0.0797221269088608
llm_goals_78,test,27,0.8750198809479343,0.0603014558146647
llm_goals_78,test,28,0.16521643015628926,0.019185604671188
llm_goals_78,test,29,0.7411573445254063,0.181847707574815
llm_goals_78,test,30,0.9297230233062234,0.9576328540155246
llm_goals_78,test,31,0.21526695422678097,0.1600616173680257
llm_goals_78,test,32,0.8479559742771196,0.8196381975442921
llm_goals_78,test,33,0.0825884183916373,0.0444875750236097
llm_goals_78,test,34,0.9255061237812735,0.9277514916547148
llm_goals_78,test,35,0.14592604425456657,0.1986446962511548
llm_goals_78,test,36,0.9272313781973492,0.9359311183925404
llm_goals_78,test,37,0.860389990595306,0.8760354323987716
llm_goals_78,test,38,0.6074223396334016,0.4610991071324792
llm_goals_78,test,39,0.41847287000876143,0.2972845381897555
llm_goals_78,test,40,0.6803725434155442,0.7716125042657197
llm_goals_78,test,41,0.18397797705891408,0.1328309068036672
llm_goals_78,test,42,0.18873004222949022,0.3354286767519867
llm_goals_78,test,43,0.21526695422678097,0.086342843675339
llm_goals_78,test,44,0.29421166166554297,0.0958279087075554
llm_goals_78,test,45,0.21947983729791964,0.1302156649936615
llm_goals_78,test,46,0.957041515415297,0.8983792614483327
llm_goals_78,test,47,0.1117420693088389,0.1775307323333411
llm_goals_78,test,48,0.08000980842654891,0.0658487938814022
llm_goals_78,test,49,0.3566345399178386,0.079644576255816
llm_goals_420,test,0,0.6533812751550817,0.7165124795044365
llm_goals_420,test,1,0.3698175402213897,0.7608911842606508
llm_goals_420,test,2,0.6968586322717197,0.799936385630717
llm_goals_420,test,3,0.18948344076947668,0.2211062209422303
llm_goals_420,test,4,0.5567842848623308,0.2926466150380465
llm_goals_420,test,5,0.6519830691965159,0.9140651066289046
llm_goals_420,test,6,0.543912620870392,0.4131756456187543
llm_goals_420,test,7,0.8888801608692506,0.6643261466520904
llm_goals_420,test,8,0.9101719259763672,0.3578404079978603
llm_goals_420,test,9,0.7376955088666669,0.8413468212597344
llm_goals_420,test,10,0.39226607833946076,0.4981438990065536
llm_goals_420,test,11,0.389451569219283,0.2468097596316683
llm_goals_420,test,12,0.15985186834647938,0.1549754451331909
llm_goals_420,test,13,0.8710226131340485,0.8951478256933764
llm_goals_420,test,14,0.3742505128253042,0.0722168451540495
llm_goals_420,test,15,0.29089743528756457,0.7175548720080566
llm_goals_420,test,16,0.0905174083142304,0.0482770035552138
llm_goals_420,test,17,0.3806404692876832,0.9171404716362525
llm_goals_420,test,18,0.5670935217089377,0.2149325509708838
llm_goals_420,test,19,0.6295627722541582,0.9314370105190324
llm_goals_420,test,20,0.654070742861124,0.6958358689335516
llm_goals_420,test,21,0.6848445580759361,0.6712961637420737
llm_goals_420,test,22,0.6476303207891396,0.9091188630862124
llm_goals_420,test,23,0.3465605301440328,0.080457132763502
llm_goals_420,test,24,0.03829797795297927,0.0910185464003223
llm_goals_420,test,25,0.6843130507757778,0.0266374948315803
llm_goals_420,test,26,0.6032043040357746,0.3477530565713536
llm_goals_420,test,27,0.08847376871046264,0.8201931514993901
llm_goals_420,test,28,0.6798946146540764,0.2425383031071764
llm_goals_420,test,29,0.9572975794783254,0.4181605367795475
llm_goals_420,test,30,0.0881731586852782,0.0299293846265948
llm_goals_420,test,31,0.37514801999572794,0.940670822547668
llm_goals_420,test,32,0.87239651122704,0.0196824789824236
llm_goals_420,test,33,0.0702387457798037,0.1078959069076236
llm_goals_420,test,34,0.08028035972327037,0.2191371931392249
llm_goals_420,test,35,0.6834743973953245,0.9034152914594604
llm_goals_420,test,36,0.08584070907478225,0.548380428606202
llm_goals_420,test,37,0.5877427539939674,0.50388122703708
llm_goals_420,test,38,0.2991337325435764,0.4294891851736946
llm_goals_420,test,39,0.07977981057641227,0.4382416051683284
llm_goals_420,test,40,0.3556588277141095,0.141879820547579
llm_goals_420,test,41,0.5631054158751615,0.6151086701978562
llm_goals_420,test,42,0.3324430700373492,0.7490416767979864
llm_goals_420,test,43,0.6922757600829574,0.6273048386641107
llm_goals_420,test,44,0.724737714677926,0.8162625944607043
llm_goals_420,test,45,0.03248376856202317,0.3347655055973148
llm_goals_420,test,46,0.09842901955800722,0.2248938224655197
llm_goals_420,test,47,0.03174593423432063,0.7293239346358632
llm_goals_420,test,48,0.6503505599733826,0.1530180333157787
llm_goals_420,test,49,0.8903064395089824,0.9588707841469084
llm_goals_53,test,0,0.31331602546509646,0.976097291167194
llm_goals_53,test,1,0.9812316194946832,0.2598265618814769
llm_goals_53,test,2,0.9029572411833167,0.9770793290161108
llm_goals_53,test,3,0.6788141934157231,0.4768547215758607
llm_goals_53,test,4,0.9855726126254333,0.2361872878274303
llm_goals_53,test,5,0.099003701181677,0.0986317022184206
llm_goals_53,test,6,0.13938966665656574,0.0477100161960414
llm_goals_53,test,7,0.9814755639663383,0.937994454790112
llm_goals_53,test,8,0.7304185686915542,0.2701156822033339
llm_goals_53,test,9,0.40802400617870455,0.2989108711032385
llm_goals_53,test,10,0.5606299117777341,0.5544564065686126
llm_goals_53,test,11,0.4399427250956056,0.3953618346843373
llm_goals_53,test,12,0.4235409091984185,0.1335346211746911
llm_goals_53,test,13,0.33325976374609606,0.0585116233918817
llm_goals_53,test,14,0.7272969760230475,0.1376328700771095
llm_goals_53,test,15,0.596124145939752,0.4350138720043813
llm_goals_53,test,16,0.470501641239925,0.0717024446401859
llm_goals_53,test,17,0.6437087827247349,0.6563471973646152
llm_goals_53,test,18,0.5324847114782504,0.2165785858914521
llm_goals_53,test,19,0.673360765833952,0.3746358016952676
llm_goals_53,test,20,0.7272969760230475,0.5337460360023749
llm_goals_53,test,21,0.41360856412724395,0.0467709874601332
llm_goals_53,test,22,0.9931437454791734,0.7796763173252493
llm_goals_53,test,23,0.49703113012500477,0.3205915991497378
llm_goals_53,test,24,0.3649808191434341,0.0640075835802484
llm_goals_53,test,25,0.6604552929453404,0.833565084619613
llm_goals_53,test,26,0.6226584528102684,0.0854875283183964
llm_goals_53,test,27,0.3847008807625962,0.9078949534688217
llm_goals_53,test,28,0.7286139721939978,0.3980814368097108
llm_goals_53,test,29,0.6472419372891787,0.0495337152571608
llm_goals_53,test,30,0.6831149956715749,0.49697645864992
llm_goals_53,test,31,0.6624644509561222,0.4685591079414317
llm_goals_53,test,32,0.5541452035803244,0.0870796105685882
llm_goals_53,test,33,0.46423270451547527,0.0188204043218978
llm_goals_53,test,34,0.7924131853994983,0.5566033569957117
llm_goals_53,test,35,0.5744329855593634,0.9313365617424948
llm_goals_53,test,36,0.9082069319171923,0.9304982364910718
llm_goals_53,test,37,0.5129448256254406,0.1916887084340081
llm_goals_53,test,38,0.6553658619489249,0.0179322256288976
llm_goals_53,test,39,0.61013002472184,0.042191597199028
llm_goals_53,test,40,0.2315685545915146,0.4480237505797492
llm_goals_53,test,41,0.37933306820664936,0.199711476764323
llm_goals_53,test,42,0.5621719122939747,0.984673662230153
llm_goals_53,test,43,0.5433465721758584,0.1015360353200591
llm_goals_53,test,44,0.5653063513825279,0.2398468184361071
llm_goals_53,test,45,0.6799970054356971,0.5147270663759912
llm_goals_53,test,46,0.7594624972907745,0.6026394622908158
llm_goals_53,test,47,0.4439166120125541,0.7105197565308571
llm_goals_53,test,48,0.9029572411833167,0.1056143884471251
llm_goals_53,test,49,0.6219037791373189,0.2875693652635701
llm_goals_427,test,0,0.8668697903230386,0.9912377865392056
llm_goals_427,test,1,0.6884206795588784,0.1393504988400085
llm_goals_427,test,2,0.9685247031166581,0.9826717605764466
llm_goals_427,test,3,0.9888774510658647,0.9914966630190112
llm_goals_427,test,4,0.20350582535915696,0.0287440390481499
llm_goals_427,test,5,0.6388845172392631,0.1508234315553654
llm_goals_427,test,6,0.23066672966919663,0.0241177394276523
llm_goals_427,test,7,0.7748785240122741,0.9533421090109172
llm_goals_427,test,8,0.38003500070864954,0.1357554081265164
llm_goals_427,test,9,0.9488132449023982,0.0422408742214398
llm_goals_427,test,10,0.7762848392221965,0.3560677064830195
llm_goals_427,test,11,0.8660699791685955,0.2848587352361455
llm_goals_427,test,12,0.6365674472682471,0.0783011900572995
llm_goals_427,test,13,0.6036135022216303,0.053588048642731
llm_goals_427,test,14,0.8576329171432823,0.1755007793342038
llm_goals_427,test,15,0.5559704374394118,0.03905897487628
llm_goals_427,test,16,0.1577634036611279,0.0861236052612804
llm_goals_427,test,17,0.7097267406982056,0.2907015821684348
llm_goals_427,test,18,0.48567597056254436,0.0468453325440364
llm_goals_427,test,19,0.8892301968198852,0.7510010963524218
llm_goals_427,test,20,0.3981405007858427,0.0467429391605962
llm_goals_427,test,21,0.9488132449023982,0.1304366461429133
llm_goals_427,test,22,0.7097267406982056,0.1246622694694481
llm_goals_427,test,23,0.7762859710629709,0.5644455097827197
llm_goals_427,test,24,0.29820350611544993,0.0414160339225927
llm_goals_427,test,25,0.9199776066340751,0.8926284254200217
llm_goals_427,test,26,0.48567597056254436,0.0591453922508401
llm_goals_427,test,27,0.6836647086170569,0.5016671352552752
llm_goals_427,test,28,0.9835105415470031,0.9189449605602464
llm_goals_427,test,29,0.6927615836449159,0.5267252864404038
llm_goals_427,test,30,0.6582939907301703,0.3196802851986922
llm_goals_427,test,31,0.9290628859433013,0.0622742618121558
llm_goals_427,test,32,0.6081541411355724,0.2393552597896355
llm_goals_427,test,33,0.13505215806946627,0.0317774218950805
llm_goals_427,test,34,0.639331316423157,0.2969897604985466
llm_goals_427,test,35,0.8365213144390401,0.911826685378058
llm_goals_427,test,36,0.7007685210176327,0.5044385498946317
llm_goals_427,test,37,0.8658525541420796,0.961152239017662
llm_goals_427,test,38,0.6912853565321749,0.383885411527425
llm_goals_427,test,39,0.36050440829936053,0.0767754062509803
llm_goals_427,test,40,0.9488132449023982,0.3019915478879681
llm_goals_427,test,41,0.13236412100838857,0.0597208539505394
llm_goals_427,test,42,0.8975381518399068,0.9798415326165176
llm_goals_427,test,43,0.7601933125162049,0.0828234646890313
llm_goals_427,test,44,0.37499269389817336,0.1075404432723246
llm_goals_427,test,45,0.7546096730234942,0.9497563751433828
llm_goals_427,test,46,0.2945447121606009,0.2027056215184361
llm_goals_427,test,47,0.9511476197750722,0.9493266919171398
llm_goals_427,test,48,0.3187023751320415,0.0344289143960405
llm_goals_427,test,49,0.19784285556758555,0.1952894749193552
llm_goals_186,test,0,0.9618733692783547,0.534925569771277
llm_goals_186,test,1,0.5345190267996206,0.0649953944046378
llm_goals_186,test,2,0.9017561009958323,0.91763923479236
llm_goals_186,test,3,0.2839138625813906,0.3425021516930106
llm_goals_186,test,4,0.6338125695297792,0.1153021531057396
llm_goals_186,test,5,0.945031294226479,0.7928793741281699
llm_goals_186,test,6,0.9320899218317825,0.9038094070559602
llm_goals_186,test,7,0.953530596262016,0.6367372560980368
llm_goals_186,test,8,0.3116733053429723,0.2126364849604726
llm_goals_186,test,9,0.923176680941554,0.8694824597543704
llm_goals_186,test,10,0.4476272455917318,0.5802607311846129
llm_goals_186,test,11,0.6312828925191178,0.2225491999116792
llm_goals_186,test,12,0.47584736977073866,0.2300986684078339
llm_goals_186,test,13,0.3488946787256006,0.9257638147127129
llm_goals_186,test,14,0.13280260197761454,0.1695718974503099
llm_goals_186,test,15,0.2500564717193607,0.151038541979901
llm_goals_186,test,16,0.23902643206927135,0.0464142133590747
llm_goals_186,test,17,0.3995120711099894,0.0732763222959853
llm_goals_186,test,18,0.3118634154645849,0.0482171595539919
llm_goals_186,test,19,0.1526436358053959,0.347547591319228
llm_goals_186,test,20,0.5952576450455663,0.1739822028354879
llm_goals_186,test,21,0.9418732373755306,0.9541198242132036
llm_goals_186,test,22,0.3463496328175435,0.049497112506125
llm_goals_186,test,23,0.5034075280351026,0.1810016520865223
llm_goals_186,test,24,0.2782057420418831,0.1851077351512521
llm_goals_186,test,25,0.7692600226465126,0.6713192505556377
llm_goals_186,test,26,0.6135724301521136,0.0711032925420902
llm_goals_186,test,27,0.3487629806477606,0.4081627252904761
llm_goals_186,test,28,0.3487629806477606,0.2745405964802801
llm_goals_186,test,29,0.28795690697269316,0.1854855714896691
llm_goals_186,test,30,0.5359659447764923,0.7354449882906446
llm_goals_186,test,31,0.9276571239710686,0.9912562823764032
llm_goals_186,test,32,0.45036456814082637,0.2618042375153737
llm_goals_186,test,33,0.34586229547965824,0.0337875336716617
llm_goals_186,test,34,0.4476272455917318,0.6428971957222914
llm_goals_186,test,35,0.08298810973778699,0.7900459432200765
llm_goals_186,test,36,0.7202655673742839,0.8730032999439788
llm_goals_186,test,37,0.3896079631672446,0.0649927594327202
llm_goals_186,test,38,0.6452170881062367,0.0471132735562561
llm_goals_186,test,39,0.41477479777407317,0.2481877539812294
llm_goals_186,test,40,0.6504133897229454,0.2111860555781098
llm_goals_186,test,41,0.909238208653833,0.8712882416841639
llm_goals_186,test,42,0.9618733692783547,0.6193248853412385
llm_goals_186,test,43,0.7338990829942859,0.8760979623283635
llm_goals_186,test,44,0.5097599544073182,0.0767958111106498
llm_goals_186,test,45,0.3866918416189627,0.0848440049881495
llm_goals_186,test,46,0.5735889092384472,0.6601266976660584
llm_goals_186,test,47,0.40711539011654785,0.4818652455075419
llm_goals_186,test,48,0.1139626074642347,0.1752603358335205
llm_goals_186,test,49,0.4507466605579428,0.027320507820661
llm_goals_133,test,0,0.6565403116177054,0.1030518399074919
llm_goals_133,test,1,0.39856233526734325,0.1009270067527766
llm_goals_133,test,2,0.3611376355165072,0.4669147668825159
llm_goals_133,test,3,0.34951689797786695,0.9886211587587188
llm_goals_133,test,4,0.6438701218453234,0.6589999206031925
llm_goals_133,test,5,0.5598444691970503,0.0478680529217008
llm_goals_133,test,6,0.24453242074270776,0.0213367665689539
llm_goals_133,test,7,0.38713694089440415,0.06300162626541
llm_goals_133,test,8,0.94909439587043,0.8613404237563876
llm_goals_133,test,9,0.6116804222590709,0.0502374017351794
llm_goals_133,test,10,0.36470226250260535,0.0728398857397339
llm_goals_133,test,11,0.6176281835531889,0.0886358546776828
llm_goals_133,test,12,0.2922824906758645,0.4714116383526195
llm_goals_133,test,13,0.12114025402132649,0.0406440348343292
llm_goals_133,test,14,0.6584922611229638,0.8416674339341796
llm_goals_133,test,15,0.6176281835531889,0.5989281494815651
llm_goals_133,test,16,0.30416320428029353,0.9641061261695968
llm_goals_133,test,17,0.6599708951932195,0.0521719884710187
llm_goals_133,test,18,0.5291462206502547,0.9257678218156756
llm_goals_133,test,19,0.16060952748600532,0.0409677417198195
llm_goals_133,test,20,0.5840101354486531,0.9201317528016504
llm_goals_133,test,21,0.3642356711623469,0.0611858046803647
llm_goals_133,test,22,0.4019844638474927,0.0749444450486417
llm_goals_133,test,23,0.9735635347536252,0.484676139228053
llm_goals_133,test,24,0.4637084290134674,0.8221724152075577
llm_goals_133,test,25,0.3177647114507455,0.2957602203771531
llm_goals_133,test,26,0.3989510079377245,0.8046360378637115
llm_goals_133,test,27,0.6412541534647381,0.0759761030516968
llm_goals_133,test,28,0.48877086667060227,0.9366340572155704
llm_goals_133,test,29,0.1978263921382696,0.1272708658186502
llm_goals_133,test,30,0.6885937425405816,0.1227999985147976
llm_goals_133,test,31,0.3834369028311772,0.0136010194313778
llm_goals_133,test,32,0.16651197667351247,0.3597276462870885
llm_goals_133,test,33,0.1873418687438444,0.8726937465962196
llm_goals_133,test,34,0.1619385026761647,0.2894476365444396
llm_goals_133,test,35,0.25486588128051163,0.0165111879681815
llm_goals_133,test,36,0.6354368790364712,0.0576655273020702
llm_goals_133,test,37,0.3535038879820656,0.2554780098122276
llm_goals_133,test,38,0.48464697173458887,0.032809734462924
llm_goals_133,test,39,0.6176281835531889,0.1481243946785008
llm_goals_133,test,40,0.348239528152784,0.4462128198301662
llm_goals_133,test,41,0.18331710924258834,0.093264815138027
llm_goals_133,test,42,0.522318118227936,0.2383228605626679
llm_goals_133,test,43,0.3586816859543313,0.196654087051587
llm_goals_133,test,44,0.5570250239570641,0.9747002088111656
llm_goals_133,test,45,0.3022103987585883,0.9831163433792584
llm_goals_133,test,46,0.1992948761033634,0.1097011751248294
llm_goals_133,test,47,0.3845319219674937,0.8283354147237331
llm_goals_133,test,48,0.6531838096195076,0.8799294836893965
llm_goals_133,test,49,0.5684010301793317,0.2364671831052382
llm_goals_81,test,0,0.17474301613159363,0.1758977435560022
llm_goals_81,test,1,0.25502737533567915,0.4421252700970533
llm_goals_81,test,2,0.19128093135768096,0.5612444031805882
llm_goals_81,test,3,0.07863398143858093,0.3079533253993743
llm_goals_81,test,4,0.13665279724247453,0.1763212150593861
llm_goals_81,test,5,0.3912981631739549,0.9704465583106344
llm_goals_81,test,6,0.20441048270358866,0.9821312875358365
llm_goals_81,test,7,0.0876077370311897,0.3270685617728195
llm_goals_81,test,8,0.1012306071214305,0.4843756215736013
llm_goals_81,test,9,0.22208726962397293,0.9933654977534896
llm_goals_81,test,10,0.16761896538916168,0.4711097472541105
llm_goals_81,test,11,0.3897566795589385,0.1673212093996636
llm_goals_81,test,12,0.17729638685168658,0.2643530158966523
llm_goals_81,test,13,0.125711584765227,0.9714035818561728
llm_goals_81,test,14,0.04214508226993513,0.9265405587707818
llm_goals_81,test,15,0.13304300305335004,0.1723195082090535
llm_goals_81,test,16,0.06486742052110153,0.9360974516501586
llm_goals_81,test,17,0.1947079560832291,0.4363540220565442
llm_goals_81,test,18,0.06968559631003611,0.9611565911249424
llm_goals_81,test,19,0.10041168548896429,0.0324757314893466
llm_goals_81,test,20,0.20221047412973717,0.6006056520074408
llm_goals_81,test,21,0.07817335776275176,0.9971859123159944
llm_goals_81,test,22,0.1847850688514502,0.0870371051461664
llm_goals_81,test,23,0.1079611003265369,0.2408633212672459
llm_goals_81,test,24,0.33747874292874686,0.9951702226622482
llm_goals_81,test,25,0.09516227389845688,0.6867633490140795
llm_goals_81,test,26,0.25502737533567915,0.9718244652881064
llm_goals_81,test,27,0.22208726962397293,0.4588186617124049
llm_goals_81,test,28,0.3755142772587147,0.5322330497164953
llm_goals_81,test,29,0.1318542817214519,0.2121016556019813
llm_goals_81,test,30,0.2258417707879333,0.6774810136296258
llm_goals_81,test,31,0.4155169781811381,0.9816113605758902
llm_goals_81,test,32,0.3897566795589385,0.2656694493977183
llm_goals_81,test,33,0.10456082715158278,0.942492448912156
llm_goals_81,test,34,0.13346639309078526,0.6429005762747164
llm_goals_81,test,35,0.09074702119921936,0.1528167702888629
llm_goals_81,test,36,0.11621030290159971,0.4512348514816248
llm_goals_81,test,37,0.37341277650911026,0.0605006450173409
llm_goals_81,test,38,0.25502737533567915,0.0274755323758623
llm_goals_81,test,39,0.09074702119921936,0.2279901766778581
llm_goals_81,test,40,0.183785312287982,0.2775541527352398
llm_goals_81,test,41,0.11424113291004023,0.9829489706314426
llm_goals_81,test,42,0.19128093135768096,0.2494339762077133
llm_goals_81,test,43,0.17729638685168658,0.9819424303599844
llm_goals_81,test,44,0.0969211100345671,0.632760349651464
llm_goals_81,test,45,0.2977378971666569,0.090990563553155
llm_goals_81,test,46,0.11715563994047036,0.0910438800719751
llm_goals_81,test,47,0.2154163262545972,0.1292081639058968
llm_goals_81,test,48,0.19128093135768096,0.974747372736112
llm_goals_81,test,49,0.1369241204701343,0.2645580764012665
llm_goals_93,test,0,0.2400849613530663,0.5635269221536086
llm_goals_93,test,1,0.11345936786036227,0.8801163792253427
llm_goals_93,test,2,0.14203767251433505,0.0696003588446044
llm_goals_93,test,3,0.4560085458713658,0.8186048531566104
llm_goals_93,test,4,0.023970818654257865,0.2222011584760154
llm_goals_93,test,5,0.3240283193599115,0.1268359519713418
llm_goals_93,test,6,0.127106624873323,0.4582622566067956
llm_goals_93,test,7,0.3133731017782991,0.429479690525812
llm_goals_93,test,8,0.0343848257408906,0.1536290973166499
llm_goals_93,test,9,0.10702475507442177,0.6112573193671209
llm_goals_93,test,10,0.823993083395217,0.7998858649804967
llm_goals_93,test,11,0.17273663926452978,0.5454222135748753
llm_goals_93,test,12,0.3203193341387822,0.2508427619545539
llm_goals_93,test,13,0.035771215990504736,0.0884842413878226
llm_goals_93,test,14,0.5167905854363958,0.6768600290465995
llm_goals_93,test,15,0.07189173259078394,0.0352718405868165
llm_goals_93,test,16,0.25661510741207855,0.8009568965617743
llm_goals_93,test,17,0.07796664905431383,0.8092096317591537
llm_goals_93,test,18,0.43633151233167977,0.963804174465268
llm_goals_93,test,19,0.2362121496685795,0.9058854167265824
llm_goals_93,test,20,0.030121444132616332,0.265390180652688
llm_goals_93,test,21,0.28490767410790624,0.1541113602215154
llm_goals_93,test,22,0.10796321757929832,0.9766790566784582
llm_goals_93,test,23,0.20339145333879807,0.7843335253318285
llm_goals_93,test,24,0.34333231835542294,0.548404369330273
llm_goals_93,test,25,0.7752819706326627,0.9813529135147334
llm_goals_93,test,26,0.22801746009847498,0.9397963116499958
llm_goals_93,test,27,0.20612895324621153,0.542547443300257
llm_goals_93,test,28,0.3722385780253328,0.8277938193324692
llm_goals_93,test,29,0.05734004040635493,0.8549419878819347
llm_goals_93,test,30,0.768829612780288,0.9761371695174176
llm_goals_93,test,31,0.08475067195669173,0.1774015734695253
llm_goals_93,test,32,0.11337184312055822,0.9590755456587298
llm_goals_93,test,33,0.156539591246752,0.9496314531215296
llm_goals_93,test,34,0.022087911451778602,0.9112802317013324
llm_goals_93,test,35,0.21665359827532363,0.0646469314244137
llm_goals_93,test,36,0.5662923550569061,0.965643964207344
llm_goals_93,test,37,0.27163776507184356,0.963180821243277
llm_goals_93,test,38,0.2841987826297161,0.9411316422109696
llm_goals_93,test,39,0.3520178560532981,0.1075404372822008
llm_goals_93,test,40,0.15525399767291123,0.959466160286712
llm_goals_93,test,41,0.1949122948155587,0.3698215332403156
llm_goals_93,test,42,0.2072389519867767,0.1589404653011508
llm_goals_93,test,43,0.11567142220972333,0.2338719832936831
llm_goals_93,test,44,0.17675967518619284,0.1124984808029749
llm_goals_93,test,45,0.09116116941348656,0.866543330684459
llm_goals_93,test,46,0.13818185559566484,0.8519759554788342
llm_goals_93,test,47,0.3537844908336089,0.8737971308795239
llm_goals_93,test,48,0.22023883528936453,0.8916334225039363
llm_goals_93,test,49,0.12262111139871346,0.8758339889840314
llm_goals_401,test,0,0.49956419102114724,0.1359674012107803
llm_goals_401,test,1,0.06053497584851569,0.939276601509621
llm_goals_401,test,2,0.2043174799392916,0.3090277756984529
llm_goals_401,test,3,0.14271210245073693,0.2822982814806737
llm_goals_401,test,4,0.5156561049045612,0.9227317209028506
llm_goals_401,test,5,0.03926034028204144,0.0683562610885711
llm_goals_401,test,6,0.14851940571992522,0.1529393504632372
llm_goals_401,test,7,0.09656648073978617,0.2291880493623187
llm_goals_401,test,8,0.790205675659422,0.910221445630232
llm_goals_401,test,9,0.027337995824112102,0.0669374443869285
llm_goals_401,test,10,0.34435942799817526,0.2562041584734201
llm_goals_401,test,11,0.08294402058631327,0.1977345307962301
llm_goals_401,test,12,0.8169244358279272,0.9351182671047276
llm_goals_401,test,13,0.026588275690009433,0.084239780653768
llm_goals_401,test,14,0.19224992849449474,0.3803121877997557
llm_goals_401,test,15,0.8328543313365131,0.9255856152963072
llm_goals_401,test,16,0.036870079037907934,0.2187242193427731
llm_goals_401,test,17,0.052000883157434535,0.9062633304766484
llm_goals_401,test,18,0.10203113148106407,0.0989866685824555
llm_goals_401,test,19,0.14747228530441328,0.0798642603957049
llm_goals_401,test,20,0.790205675659422,0.7283447799445965
llm_goals_401,test,21,0.0741977140244815,0.3040102668224276
llm_goals_401,test,22,0.05815865295911634,0.8871123935548803
llm_goals_401,test,23,0.13586199455229023,0.6306703155992205
llm_goals_401,test,24,0.16831736633546365,0.342468541641041
llm_goals_401,test,25,0.1154283744676302,0.0306332962828717
llm_goals_401,test,26,0.2585361633488943,0.1178928014307589
llm_goals_401,test,27,0.1435150917281677,0.8247832937930811
llm_goals_401,test,28,0.3003574217908697,0.3694959007053917
llm_goals_401,test,29,0.21131748884129076,0.0798909574616735
llm_goals_401,test,30,0.057944129955923795,0.3951674202836078
llm_goals_401,test,31,0.0741977140244815,0.466307960095254
llm_goals_401,test,32,0.09219515185105903,0.1971577420397864
llm_goals_401,test,33,0.2790144040209417,0.1760928155683087
llm_goals_401,test,34,0.0533101834724918,0.2047678657851429
llm_goals_401,test,35,0.13764347830575221,0.2637872561841102
llm_goals_401,test,36,0.22164063336592668,0.4724849406439279
llm_goals_401,test,37,0.8381951963350458,0.0192510310263775
llm_goals_401,test,38,0.20510711204544183,0.1812826057265395
llm_goals_401,test,39,0.7510884507797663,0.905821781657468
llm_goals_401,test,40,0.04315875905544281,0.1146947001091413
llm_goals_401,test,41,0.03321790213004457,0.1032293515072512
llm_goals_401,test,42,0.06836016740238583,0.3834835806051595
llm_goals_401,test,43,0.07172056886783602,0.2508475125103526
llm_goals_401,test,44,0.7201423864372464,0.8248843542416243
llm_goals_401,test,45,0.45684004794619587,0.5847666727108293
llm_goals_401,test,46,0.05912901933299356,0.4045147001032884
llm_goals_401,test,47,0.509165482542173,0.6278339401682421
llm_goals_401,test,48,0.07943661526014217,0.1361878043204594
llm_goals_401,test,49,0.3792220582934256,0.8435596200846341
