template_id,split,question_idx,prediction,label
llm_goals_449,test,0,0.451919087462046,0.1336325872199141
llm_goals_449,test,1,0.451919087462046,0.2356014848705813
llm_goals_449,test,2,0.451919087462046,0.3977331353545913
llm_goals_449,test,3,0.451919087462046,0.9671817093217177
llm_goals_449,test,4,0.451919087462046,0.7857460873195503
llm_goals_449,test,5,0.451919087462046,0.5164481763709956
llm_goals_449,test,6,0.451919087462046,0.0370459810848937
llm_goals_449,test,7,0.451919087462046,0.2618660511464079
llm_goals_449,test,8,0.451919087462046,0.9771937256062914
llm_goals_449,test,9,0.451919087462046,0.0204302625650166
llm_goals_449,test,10,0.451919087462046,0.0731782442371117
llm_goals_449,test,11,0.451919087462046,0.0091003072940505
llm_goals_449,test,12,0.451919087462046,0.1108627498844831
llm_goals_449,test,13,0.451919087462046,0.054840421346723
llm_goals_449,test,14,0.451919087462046,0.8313263696124994
llm_goals_449,test,15,0.451919087462046,0.8253071431638606
llm_goals_449,test,16,0.451919087462046,0.831142754565476
llm_goals_449,test,17,0.451919087462046,0.3065891414116863
llm_goals_449,test,18,0.451919087462046,0.4235929706341914
llm_goals_449,test,19,0.451919087462046,0.2342867705548718
llm_goals_449,test,20,0.451919087462046,0.5687148418873526
llm_goals_449,test,21,0.451919087462046,0.4888083146033534
llm_goals_449,test,22,0.451919087462046,0.0069036151286541
llm_goals_449,test,23,0.451919087462046,0.0739780745569788
llm_goals_449,test,24,0.451919087462046,0.9314584192860104
llm_goals_449,test,25,0.451919087462046,0.1420477852561596
llm_goals_449,test,26,0.451919087462046,0.7006375316273405
llm_goals_449,test,27,0.451919087462046,0.0612984362789981
llm_goals_449,test,28,0.451919087462046,0.9549750406111494
llm_goals_449,test,29,0.451919087462046,0.2943014776892277
llm_goals_449,test,30,0.451919087462046,0.0576629803259434
llm_goals_449,test,31,0.451919087462046,0.2255338162735628
llm_goals_449,test,32,0.451919087462046,0.0217578202648259
llm_goals_449,test,33,0.451919087462046,0.5881005329750926
llm_goals_449,test,34,0.451919087462046,0.0656003360881953
llm_goals_449,test,35,0.451919087462046,0.1899455989825758
llm_goals_449,test,36,0.451919087462046,0.1356723510839239
llm_goals_449,test,37,0.451919087462046,0.1724577552330986
llm_goals_449,test,38,0.451919087462046,0.097576330461044
llm_goals_449,test,39,0.451919087462046,0.0831443503045603
llm_goals_449,test,40,0.451919087462046,0.0085659129540734
llm_goals_449,test,41,0.451919087462046,0.0438119169092525
llm_goals_449,test,42,0.451919087462046,0.4942733211865646
llm_goals_449,test,43,0.451919087462046,0.1247723307463423
llm_goals_449,test,44,0.451919087462046,0.8400723355781036
llm_goals_449,test,45,0.451919087462046,0.925208223971735
llm_goals_449,test,46,0.451919087462046,0.0740922882863047
llm_goals_449,test,47,0.451919087462046,0.9373555404045412
llm_goals_449,test,48,0.451919087462046,0.3920310752556691
llm_goals_449,test,49,0.451919087462046,0.0277662962683335
llm_goals_75,test,0,0.6059667054166018,0.8642124165137652
llm_goals_75,test,1,0.6059667054166018,0.910359703136258
llm_goals_75,test,2,0.6059667054166018,0.8128286324258283
llm_goals_75,test,3,0.6059667054166018,0.1661489886313124
llm_goals_75,test,4,0.6059667054166018,0.1236451678860016
llm_goals_75,test,5,0.6059667054166018,0.6739037233559247
llm_goals_75,test,6,0.6059667054166018,0.1134434733777058
llm_goals_75,test,7,0.6059667054166018,0.6946055843235053
llm_goals_75,test,8,0.6059667054166018,0.1004496505890182
llm_goals_75,test,9,0.6059667054166018,0.1540130266900075
llm_goals_75,test,10,0.6059667054166018,0.3569515830662073
llm_goals_75,test,11,0.6059667054166018,0.4576154291835114
llm_goals_75,test,12,0.6059667054166018,0.1367346048355968
llm_goals_75,test,13,0.6059667054166018,0.0646890805500496
llm_goals_75,test,14,0.6059667054166018,0.1675122689898172
llm_goals_75,test,15,0.6059667054166018,0.069582458224139
llm_goals_75,test,16,0.6059667054166018,0.2354277864496811
llm_goals_75,test,17,0.6059667054166018,0.9447837743973488
llm_goals_75,test,18,0.6059667054166018,0.0781001795812696
llm_goals_75,test,19,0.6059667054166018,0.4868721494751054
llm_goals_75,test,20,0.6059667054166018,0.1033036348939128
llm_goals_75,test,21,0.6059667054166018,0.1276999559430948
llm_goals_75,test,22,0.6059667054166018,0.8431325364742722
llm_goals_75,test,23,0.6059667054166018,0.7460283918906632
llm_goals_75,test,24,0.6059667054166018,0.192573320599938
llm_goals_75,test,25,0.6059667054166018,0.3801085776614793
llm_goals_75,test,26,0.6059667054166018,0.1267870145951939
llm_goals_75,test,27,0.6059667054166018,0.9607504432606712
llm_goals_75,test,28,0.6059667054166018,0.0423146645658729
llm_goals_75,test,29,0.6059667054166018,0.4777054812224888
llm_goals_75,test,30,0.6059667054166018,0.4822637810175876
llm_goals_75,test,31,0.6059667054166018,0.0805248550261055
llm_goals_75,test,32,0.6059667054166018,0.6890841093919252
llm_goals_75,test,33,0.6059667054166018,0.1145962248845397
llm_goals_75,test,34,0.6059667054166018,0.2921261463182895
llm_goals_75,test,35,0.6059667054166018,0.6530562837025381
llm_goals_75,test,36,0.6059667054166018,0.1183304077208745
llm_goals_75,test,37,0.6059667054166018,0.868052766582826
llm_goals_75,test,38,0.6059667054166018,0.6535917953521371
llm_goals_75,test,39,0.6059667054166018,0.0644053193022136
llm_goals_75,test,40,0.6059667054166018,0.6019618834627347
llm_goals_75,test,41,0.6059667054166018,0.230389069862908
llm_goals_75,test,42,0.6059667054166018,0.7894553184375537
llm_goals_75,test,43,0.6059667054166018,0.2977582471382819
llm_goals_75,test,44,0.6059667054166018,0.2211815525008748
llm_goals_75,test,45,0.6059667054166018,0.0745441466493943
llm_goals_75,test,46,0.6059667054166018,0.7127955514788996
llm_goals_75,test,47,0.6059667054166018,0.0161223980025345
llm_goals_75,test,48,0.6059667054166018,0.1382513395050604
llm_goals_75,test,49,0.6059667054166018,0.9815106661613362
llm_goals_305,test,0,0.43604689176371075,0.2062097726301097
llm_goals_305,test,1,0.43604689176371075,0.7603213407742078
llm_goals_305,test,2,0.43604689176371075,0.0406395612652842
llm_goals_305,test,3,0.43604689176371075,0.4422001539134155
llm_goals_305,test,4,0.43604689176371075,0.2689791708049951
llm_goals_305,test,5,0.43604689176371075,0.1412581238797707
llm_goals_305,test,6,0.43604689176371075,0.0992911357773575
llm_goals_305,test,7,0.43604689176371075,0.1984947738037692
llm_goals_305,test,8,0.43604689176371075,0.1577864619647619
llm_goals_305,test,9,0.43604689176371075,0.0621641107275182
llm_goals_305,test,10,0.43604689176371075,0.9879174023450592
llm_goals_305,test,11,0.43604689176371075,0.5269669419962362
llm_goals_305,test,12,0.43604689176371075,0.2105593475656798
llm_goals_305,test,13,0.43604689176371075,0.2072161629845012
llm_goals_305,test,14,0.43604689176371075,0.6545892217736428
llm_goals_305,test,15,0.43604689176371075,0.5104040428268571
llm_goals_305,test,16,0.43604689176371075,0.5524398163622298
llm_goals_305,test,17,0.43604689176371075,0.8665614751565875
llm_goals_305,test,18,0.43604689176371075,0.3175479682579358
llm_goals_305,test,19,0.43604689176371075,0.3701558259397783
llm_goals_305,test,20,0.43604689176371075,0.0528314061272507
llm_goals_305,test,21,0.43604689176371075,0.3148726989644924
llm_goals_305,test,22,0.43604689176371075,0.447303668549321
llm_goals_305,test,23,0.43604689176371075,0.1744797562558885
llm_goals_305,test,24,0.43604689176371075,0.8158235756439657
llm_goals_305,test,25,0.43604689176371075,0.9578316364476024
llm_goals_305,test,26,0.43604689176371075,0.5595920193399587
llm_goals_305,test,27,0.43604689176371075,0.5967193097172223
llm_goals_305,test,28,0.43604689176371075,0.9037929343333102
llm_goals_305,test,29,0.43604689176371075,0.278165145436113
llm_goals_305,test,30,0.43604689176371075,0.9532629887346658
llm_goals_305,test,31,0.43604689176371075,0.5121334481158791
llm_goals_305,test,32,0.43604689176371075,0.1605879890433021
llm_goals_305,test,33,0.43604689176371075,0.6222808213139804
llm_goals_305,test,34,0.43604689176371075,0.9709568242405192
llm_goals_305,test,35,0.43604689176371075,0.5513220475450542
llm_goals_305,test,36,0.43604689176371075,0.9876292784574268
llm_goals_305,test,37,0.43604689176371075,0.258566594074644
llm_goals_305,test,38,0.43604689176371075,0.3940893870837836
llm_goals_305,test,39,0.43604689176371075,0.6249683049434822
llm_goals_305,test,40,0.43604689176371075,0.036012250509986
llm_goals_305,test,41,0.43604689176371075,0.0238784684017155
llm_goals_305,test,42,0.43604689176371075,0.1015334102504109
llm_goals_305,test,43,0.43604689176371075,0.0682627831684364
llm_goals_305,test,44,0.43604689176371075,0.0901285910304827
llm_goals_305,test,45,0.43604689176371075,0.8520020311890948
llm_goals_305,test,46,0.43604689176371075,0.512946133742762
llm_goals_305,test,47,0.43604689176371075,0.9460715758270588
llm_goals_305,test,48,0.43604689176371075,0.2634284981215168
llm_goals_305,test,49,0.43604689176371075,0.5226278491298435
llm_goals_263,test,0,0.41769153031366724,0.9722113849684072
llm_goals_263,test,1,0.41769153031366724,0.4308884142088059
llm_goals_263,test,2,0.41769153031366724,0.9112282637417588
llm_goals_263,test,3,0.41769153031366724,0.4678322072304764
llm_goals_263,test,4,0.41769153031366724,0.0681171790473069
llm_goals_263,test,5,0.41769153031366724,0.3304750158657515
llm_goals_263,test,6,0.41769153031366724,0.1049596434028026
llm_goals_263,test,7,0.41769153031366724,0.868290478100796
llm_goals_263,test,8,0.41769153031366724,0.0107688258732955
llm_goals_263,test,9,0.41769153031366724,0.5335894362422906
llm_goals_263,test,10,0.41769153031366724,0.4571801332195204
llm_goals_263,test,11,0.41769153031366724,0.4017475232284387
llm_goals_263,test,12,0.41769153031366724,0.7410716651377723
llm_goals_263,test,13,0.41769153031366724,0.2222869461895513
llm_goals_263,test,14,0.41769153031366724,0.0236037417776026
llm_goals_263,test,15,0.41769153031366724,0.0998823008982278
llm_goals_263,test,16,0.41769153031366724,0.0090037236123257
llm_goals_263,test,17,0.41769153031366724,0.3371875979935536
llm_goals_263,test,18,0.41769153031366724,0.2095794100566156
llm_goals_263,test,19,0.41769153031366724,0.1483621477954244
llm_goals_263,test,20,0.41769153031366724,0.2829259876769517
llm_goals_263,test,21,0.41769153031366724,0.1128506991103582
llm_goals_263,test,22,0.41769153031366724,0.8918927085227047
llm_goals_263,test,23,0.41769153031366724,0.1960590879366542
llm_goals_263,test,24,0.41769153031366724,0.0409316032122589
llm_goals_263,test,25,0.41769153031366724,0.1971178454456452
llm_goals_263,test,26,0.41769153031366724,0.290576284754869
llm_goals_263,test,27,0.41769153031366724,0.3914767323316075
llm_goals_263,test,28,0.41769153031366724,0.3629055172172753
llm_goals_263,test,29,0.41769153031366724,0.0312142081028261
llm_goals_263,test,30,0.41769153031366724,0.1928083275379132
llm_goals_263,test,31,0.41769153031366724,0.318621097342132
llm_goals_263,test,32,0.41769153031366724,0.1747653444762649
llm_goals_263,test,33,0.41769153031366724,0.0531218265570888
llm_goals_263,test,34,0.41769153031366724,0.1598154925951403
llm_goals_263,test,35,0.41769153031366724,0.94307484220015
llm_goals_263,test,36,0.41769153031366724,0.5041818847108344
llm_goals_263,test,37,0.41769153031366724,0.1111175217519077
llm_goals_263,test,38,0.41769153031366724,0.1867701836992809
llm_goals_263,test,39,0.41769153031366724,0.9513736387795227
llm_goals_263,test,40,0.41769153031366724,0.726601907835183
llm_goals_263,test,41,0.41769153031366724,0.2793940710071973
llm_goals_263,test,42,0.41769153031366724,0.7591325538288878
llm_goals_263,test,43,0.41769153031366724,0.0599255853483329
llm_goals_263,test,44,0.41769153031366724,0.0248060297565235
llm_goals_263,test,45,0.41769153031366724,0.4429293016127257
llm_goals_263,test,46,0.41769153031366724,0.3978895760863248
llm_goals_263,test,47,0.41769153031366724,0.9291514786865128
llm_goals_263,test,48,0.41769153031366724,0.2313178866490127
llm_goals_263,test,49,0.41769153031366724,0.3779293731936072
llm_goals_157,test,0,0.3550183973285731,0.7943095194508789
llm_goals_157,test,1,0.3550183973285731,0.0516624712053447
llm_goals_157,test,2,0.3550183973285731,0.8020233336204885
llm_goals_157,test,3,0.3550183973285731,0.5904722684734964
llm_goals_157,test,4,0.3550183973285731,0.9619353001797089
llm_goals_157,test,5,0.3550183973285731,0.6767415952202784
llm_goals_157,test,6,0.3550183973285731,0.7612977247981438
llm_goals_157,test,7,0.3550183973285731,0.6294506387377161
llm_goals_157,test,8,0.3550183973285731,0.8937361945430545
llm_goals_157,test,9,0.3550183973285731,0.9788153257749777
llm_goals_157,test,10,0.3550183973285731,0.8824125505492224
llm_goals_157,test,11,0.3550183973285731,0.199986733795525
llm_goals_157,test,12,0.3550183973285731,0.9284577144290443
llm_goals_157,test,13,0.3550183973285731,0.9240516415338534
llm_goals_157,test,14,0.3550183973285731,0.2475658313194042
llm_goals_157,test,15,0.3550183973285731,0.976340679507306
llm_goals_157,test,16,0.3550183973285731,0.3126950781624377
llm_goals_157,test,17,0.3550183973285731,0.046177739393252
llm_goals_157,test,18,0.3550183973285731,0.4250899393616417
llm_goals_157,test,19,0.3550183973285731,0.6637557888114428
llm_goals_157,test,20,0.3550183973285731,0.9747431080575436
llm_goals_157,test,21,0.3550183973285731,0.566102644985123
llm_goals_157,test,22,0.3550183973285731,0.4645121573786108
llm_goals_157,test,23,0.3550183973285731,0.1429816093888423
llm_goals_157,test,24,0.3550183973285731,0.0397822616409018
llm_goals_157,test,25,0.3550183973285731,0.2832629442692311
llm_goals_157,test,26,0.3550183973285731,0.3005834296865567
llm_goals_157,test,27,0.3550183973285731,0.049069242775247
llm_goals_157,test,28,0.3550183973285731,0.2908678434467844
llm_goals_157,test,29,0.3550183973285731,0.1061660413895585
llm_goals_157,test,30,0.3550183973285731,0.5164500368467446
llm_goals_157,test,31,0.3550183973285731,0.9364517603204892
llm_goals_157,test,32,0.3550183973285731,0.0583368009018155
llm_goals_157,test,33,0.3550183973285731,0.102471328139649
llm_goals_157,test,34,0.3550183973285731,0.7754930766823708
llm_goals_157,test,35,0.3550183973285731,0.930098280704675
llm_goals_157,test,36,0.3550183973285731,0.8978537108401503
llm_goals_157,test,37,0.3550183973285731,0.185447729939923
llm_goals_157,test,38,0.3550183973285731,0.4989516423125952
llm_goals_157,test,39,0.3550183973285731,0.8172337053734404
llm_goals_157,test,40,0.3550183973285731,0.3208967259617554
llm_goals_157,test,41,0.3550183973285731,0.9628746978064082
llm_goals_157,test,42,0.3550183973285731,0.9537549409903032
llm_goals_157,test,43,0.3550183973285731,0.9854372229811326
llm_goals_157,test,44,0.3550183973285731,0.9446223273489608
llm_goals_157,test,45,0.3550183973285731,0.917287033427004
llm_goals_157,test,46,0.3550183973285731,0.2958138118998824
llm_goals_157,test,47,0.3550183973285731,0.7644578181201236
llm_goals_157,test,48,0.3550183973285731,0.2919786437406029
llm_goals_157,test,49,0.3550183973285731,0.2435548949640933
llm_goals_358,test,0,0.4877666150488641,0.9710288332808288
llm_goals_358,test,1,0.4877666150488641,0.1090780967183576
llm_goals_358,test,2,0.4877666150488641,0.8957724929016077
llm_goals_358,test,3,0.4877666150488641,0.0314742636417454
llm_goals_358,test,4,0.4877666150488641,0.9345866127648594
llm_goals_358,test,5,0.4877666150488641,0.3075908794558576
llm_goals_358,test,6,0.4877666150488641,0.1938894394639401
llm_goals_358,test,7,0.4877666150488641,0.9366675383938772
llm_goals_358,test,8,0.4877666150488641,0.9600018984290702
llm_goals_358,test,9,0.4877666150488641,0.0356972898371527
llm_goals_358,test,10,0.4877666150488641,0.7396882546703099
llm_goals_358,test,11,0.4877666150488641,0.0409023187764638
llm_goals_358,test,12,0.4877666150488641,0.0976624021485058
llm_goals_358,test,13,0.4877666150488641,0.1216232236474993
llm_goals_358,test,14,0.4877666150488641,0.7864359180640846
llm_goals_358,test,15,0.4877666150488641,0.8556484582282166
llm_goals_358,test,16,0.4877666150488641,0.7341230488107452
llm_goals_358,test,17,0.4877666150488641,0.2726809060238253
llm_goals_358,test,18,0.4877666150488641,0.7566054280756713
llm_goals_358,test,19,0.4877666150488641,0.0434563732454263
llm_goals_358,test,20,0.4877666150488641,0.8243328886415383
llm_goals_358,test,21,0.4877666150488641,0.1112076480131408
llm_goals_358,test,22,0.4877666150488641,0.0845862458189736
llm_goals_358,test,23,0.4877666150488641,0.0375312043866978
llm_goals_358,test,24,0.4877666150488641,0.8172477900339192
llm_goals_358,test,25,0.4877666150488641,0.9764694049382328
llm_goals_358,test,26,0.4877666150488641,0.7040948478982805
llm_goals_358,test,27,0.4877666150488641,0.125707811898555
llm_goals_358,test,28,0.4877666150488641,0.1566378003751444
llm_goals_358,test,29,0.4877666150488641,0.1707030695577025
llm_goals_358,test,30,0.4877666150488641,0.7917262984233946
llm_goals_358,test,31,0.4877666150488641,0.0448402492326266
llm_goals_358,test,32,0.4877666150488641,0.0880149966006802
llm_goals_358,test,33,0.4877666150488641,0.9036261072893176
llm_goals_358,test,34,0.4877666150488641,0.6926631691100236
llm_goals_358,test,35,0.4877666150488641,0.772573980123232
llm_goals_358,test,36,0.4877666150488641,0.443962006250219
llm_goals_358,test,37,0.4877666150488641,0.5987374702917627
llm_goals_358,test,38,0.4877666150488641,0.0973650244988885
llm_goals_358,test,39,0.4877666150488641,0.0374517082121219
llm_goals_358,test,40,0.4877666150488641,0.0459188553104236
llm_goals_358,test,41,0.4877666150488641,0.067381376462992
llm_goals_358,test,42,0.4877666150488641,0.9322344143419644
llm_goals_358,test,43,0.4877666150488641,0.0773258781385884
llm_goals_358,test,44,0.4877666150488641,0.9867304662942348
llm_goals_358,test,45,0.4877666150488641,0.0921047575496883
llm_goals_358,test,46,0.4877666150488641,0.0203810451816961
llm_goals_358,test,47,0.4877666150488641,0.0161558697095388
llm_goals_358,test,48,0.4877666150488641,0.7751475880899051
llm_goals_358,test,49,0.4877666150488641,0.4160470958249456
llm_goals_78,test,0,0.6024050836885196,0.2251708162334548
llm_goals_78,test,1,0.6024050836885196,0.0367340336052023
llm_goals_78,test,2,0.6024050836885196,0.0527379912395899
llm_goals_78,test,3,0.6024050836885196,0.0259505842905422
llm_goals_78,test,4,0.6024050836885196,0.0939178372549231
llm_goals_78,test,5,0.6024050836885196,0.6658069720444946
llm_goals_78,test,6,0.6024050836885196,0.0424593855688115
llm_goals_78,test,7,0.6024050836885196,0.3068789421692927
llm_goals_78,test,8,0.6024050836885196,0.0254129292421898
llm_goals_78,test,9,0.6024050836885196,0.0407835069490974
llm_goals_78,test,10,0.6024050836885196,0.9375706694734316
llm_goals_78,test,11,0.6024050836885196,0.7386383432572439
llm_goals_78,test,12,0.6024050836885196,0.3108688169890243
llm_goals_78,test,13,0.6024050836885196,0.0946944663222736
llm_goals_78,test,14,0.6024050836885196,0.1717796546359565
llm_goals_78,test,15,0.6024050836885196,0.1277153625141483
llm_goals_78,test,16,0.6024050836885196,0.0689165589110325
llm_goals_78,test,17,0.6024050836885196,0.0883911059243408
llm_goals_78,test,18,0.6024050836885196,0.0337617130750813
llm_goals_78,test,19,0.6024050836885196,0.7169547264343438
llm_goals_78,test,20,0.6024050836885196,0.1528222000997753
llm_goals_78,test,21,0.6024050836885196,0.0350685532944032
llm_goals_78,test,22,0.6024050836885196,0.0940461009061424
llm_goals_78,test,23,0.6024050836885196,0.9060885414573472
llm_goals_78,test,24,0.6024050836885196,0.0217941677583094
llm_goals_78,test,25,0.6024050836885196,0.9667879364041514
llm_goals_78,test,26,0.6024050836885196,0.0797221269088608
llm_goals_78,test,27,0.6024050836885196,0.0603014558146647
llm_goals_78,test,28,0.6024050836885196,0.019185604671188
llm_goals_78,test,29,0.6024050836885196,0.181847707574815
llm_goals_78,test,30,0.6024050836885196,0.9576328540155246
llm_goals_78,test,31,0.6024050836885196,0.1600616173680257
llm_goals_78,test,32,0.6024050836885196,0.8196381975442921
llm_goals_78,test,33,0.6024050836885196,0.0444875750236097
llm_goals_78,test,34,0.6024050836885196,0.9277514916547148
llm_goals_78,test,35,0.6024050836885196,0.1986446962511548
llm_goals_78,test,36,0.6024050836885196,0.9359311183925404
llm_goals_78,test,37,0.6024050836885196,0.8760354323987716
llm_goals_78,test,38,0.6024050836885196,0.4610991071324792
llm_goals_78,test,39,0.6024050836885196,0.2972845381897555
llm_goals_78,test,40,0.6024050836885196,0.7716125042657197
llm_goals_78,test,41,0.6024050836885196,0.1328309068036672
llm_goals_78,test,42,0.6024050836885196,0.3354286767519867
llm_goals_78,test,43,0.6024050836885196,0.086342843675339
llm_goals_78,test,44,0.6024050836885196,0.0958279087075554
llm_goals_78,test,45,0.6024050836885196,0.1302156649936615
llm_goals_78,test,46,0.6024050836885196,0.8983792614483327
llm_goals_78,test,47,0.6024050836885196,0.1775307323333411
llm_goals_78,test,48,0.6024050836885196,0.0658487938814022
llm_goals_78,test,49,0.6024050836885196,0.079644576255816
llm_goals_420,test,0,0.5044244438850161,0.7165124795044365
llm_goals_420,test,1,0.5044244438850161,0.7608911842606508
llm_goals_420,test,2,0.5044244438850161,0.799936385630717
llm_goals_420,test,3,0.5044244438850161,0.2211062209422303
llm_goals_420,test,4,0.5044244438850161,0.2926466150380465
llm_goals_420,test,5,0.5044244438850161,0.9140651066289046
llm_goals_420,test,6,0.5044244438850161,0.4131756456187543
llm_goals_420,test,7,0.5044244438850161,0.6643261466520904
llm_goals_420,test,8,0.5044244438850161,0.3578404079978603
llm_goals_420,test,9,0.5044244438850161,0.8413468212597344
llm_goals_420,test,10,0.5044244438850161,0.4981438990065536
llm_goals_420,test,11,0.5044244438850161,0.2468097596316683
llm_goals_420,test,12,0.5044244438850161,0.1549754451331909
llm_goals_420,test,13,0.5044244438850161,0.8951478256933764
llm_goals_420,test,14,0.5044244438850161,0.0722168451540495
llm_goals_420,test,15,0.5044244438850161,0.7175548720080566
llm_goals_420,test,16,0.5044244438850161,0.0482770035552138
llm_goals_420,test,17,0.5044244438850161,0.9171404716362525
llm_goals_420,test,18,0.5044244438850161,0.2149325509708838
llm_goals_420,test,19,0.5044244438850161,0.9314370105190324
llm_goals_420,test,20,0.5044244438850161,0.6958358689335516
llm_goals_420,test,21,0.5044244438850161,0.6712961637420737
llm_goals_420,test,22,0.5044244438850161,0.9091188630862124
llm_goals_420,test,23,0.5044244438850161,0.080457132763502
llm_goals_420,test,24,0.5044244438850161,0.0910185464003223
llm_goals_420,test,25,0.5044244438850161,0.0266374948315803
llm_goals_420,test,26,0.5044244438850161,0.3477530565713536
llm_goals_420,test,27,0.5044244438850161,0.8201931514993901
llm_goals_420,test,28,0.5044244438850161,0.2425383031071764
llm_goals_420,test,29,0.5044244438850161,0.4181605367795475
llm_goals_420,test,30,0.5044244438850161,0.0299293846265948
llm_goals_420,test,31,0.5044244438850161,0.940670822547668
llm_goals_420,test,32,0.5044244438850161,0.0196824789824236
llm_goals_420,test,33,0.5044244438850161,0.1078959069076236
llm_goals_420,test,34,0.5044244438850161,0.2191371931392249
llm_goals_420,test,35,0.5044244438850161,0.9034152914594604
llm_goals_420,test,36,0.5044244438850161,0.548380428606202
llm_goals_420,test,37,0.5044244438850161,0.50388122703708
llm_goals_420,test,38,0.5044244438850161,0.4294891851736946
llm_goals_420,test,39,0.5044244438850161,0.4382416051683284
llm_goals_420,test,40,0.5044244438850161,0.141879820547579
llm_goals_420,test,41,0.5044244438850161,0.6151086701978562
llm_goals_420,test,42,0.5044244438850161,0.7490416767979864
llm_goals_420,test,43,0.5044244438850161,0.6273048386641107
llm_goals_420,test,44,0.5044244438850161,0.8162625944607043
llm_goals_420,test,45,0.5044244438850161,0.3347655055973148
llm_goals_420,test,46,0.5044244438850161,0.2248938224655197
llm_goals_420,test,47,0.5044244438850161,0.7293239346358632
llm_goals_420,test,48,0.5044244438850161,0.1530180333157787
llm_goals_420,test,49,0.5044244438850161,0.9588707841469084
llm_goals_53,test,0,0.6085262128142178,0.976097291167194
llm_goals_53,test,1,0.6085262128142178,0.2598265618814769
llm_goals_53,test,2,0.6085262128142178,0.9770793290161108
llm_goals_53,test,3,0.6085262128142178,0.4768547215758607
llm_goals_53,test,4,0.6085262128142178,0.2361872878274303
llm_goals_53,test,5,0.6085262128142178,0.0986317022184206
llm_goals_53,test,6,0.6085262128142178,0.0477100161960414
llm_goals_53,test,7,0.6085262128142178,0.937994454790112
llm_goals_53,test,8,0.6085262128142178,0.2701156822033339
llm_goals_53,test,9,0.6085262128142178,0.2989108711032385
llm_goals_53,test,10,0.6085262128142178,0.5544564065686126
llm_goals_53,test,11,0.6085262128142178,0.3953618346843373
llm_goals_53,test,12,0.6085262128142178,0.1335346211746911
llm_goals_53,test,13,0.6085262128142178,0.0585116233918817
llm_goals_53,test,14,0.6085262128142178,0.1376328700771095
llm_goals_53,test,15,0.6085262128142178,0.4350138720043813
llm_goals_53,test,16,0.6085262128142178,0.0717024446401859
llm_goals_53,test,17,0.6085262128142178,0.6563471973646152
llm_goals_53,test,18,0.6085262128142178,0.2165785858914521
llm_goals_53,test,19,0.6085262128142178,0.3746358016952676
llm_goals_53,test,20,0.6085262128142178,0.5337460360023749
llm_goals_53,test,21,0.6085262128142178,0.0467709874601332
llm_goals_53,test,22,0.6085262128142178,0.7796763173252493
llm_goals_53,test,23,0.6085262128142178,0.3205915991497378
llm_goals_53,test,24,0.6085262128142178,0.0640075835802484
llm_goals_53,test,25,0.6085262128142178,0.833565084619613
llm_goals_53,test,26,0.6085262128142178,0.0854875283183964
llm_goals_53,test,27,0.6085262128142178,0.9078949534688217
llm_goals_53,test,28,0.6085262128142178,0.3980814368097108
llm_goals_53,test,29,0.6085262128142178,0.0495337152571608
llm_goals_53,test,30,0.6085262128142178,0.49697645864992
llm_goals_53,test,31,0.6085262128142178,0.4685591079414317
llm_goals_53,test,32,0.6085262128142178,0.0870796105685882
llm_goals_53,test,33,0.6085262128142178,0.0188204043218978
llm_goals_53,test,34,0.6085262128142178,0.5566033569957117
llm_goals_53,test,35,0.6085262128142178,0.9313365617424948
llm_goals_53,test,36,0.6085262128142178,0.9304982364910718
llm_goals_53,test,37,0.6085262128142178,0.1916887084340081
llm_goals_53,test,38,0.6085262128142178,0.0179322256288976
llm_goals_53,test,39,0.6085262128142178,0.042191597199028
llm_goals_53,test,40,0.6085262128142178,0.4480237505797492
llm_goals_53,test,41,0.6085262128142178,0.199711476764323
llm_goals_53,test,42,0.6085262128142178,0.984673662230153
llm_goals_53,test,43,0.6085262128142178,0.1015360353200591
llm_goals_53,test,44,0.6085262128142178,0.2398468184361071
llm_goals_53,test,45,0.6085262128142178,0.5147270663759912
llm_goals_53,test,46,0.6085262128142178,0.6026394622908158
llm_goals_53,test,47,0.6085262128142178,0.7105197565308571
llm_goals_53,test,48,0.6085262128142178,0.1056143884471251
llm_goals_53,test,49,0.6085262128142178,0.2875693652635701
llm_goals_427,test,0,0.6756249878022381,0.9912377865392056
llm_goals_427,test,1,0.6756249878022381,0.1393504988400085
llm_goals_427,test,2,0.6756249878022381,0.9826717605764466
llm_goals_427,test,3,0.6756249878022381,0.9914966630190112
llm_goals_427,test,4,0.6756249878022381,0.0287440390481499
llm_goals_427,test,5,0.6756249878022381,0.1508234315553654
llm_goals_427,test,6,0.6756249878022381,0.0241177394276523
llm_goals_427,test,7,0.6756249878022381,0.9533421090109172
llm_goals_427,test,8,0.6756249878022381,0.1357554081265164
llm_goals_427,test,9,0.6756249878022381,0.0422408742214398
llm_goals_427,test,10,0.6756249878022381,0.3560677064830195
llm_goals_427,test,11,0.6756249878022381,0.2848587352361455
llm_goals_427,test,12,0.6756249878022381,0.0783011900572995
llm_goals_427,test,13,0.6756249878022381,0.053588048642731
llm_goals_427,test,14,0.6756249878022381,0.1755007793342038
llm_goals_427,test,15,0.6756249878022381,0.03905897487628
llm_goals_427,test,16,0.6756249878022381,0.0861236052612804
llm_goals_427,test,17,0.6756249878022381,0.2907015821684348
llm_goals_427,test,18,0.6756249878022381,0.0468453325440364
llm_goals_427,test,19,0.6756249878022381,0.7510010963524218
llm_goals_427,test,20,0.6756249878022381,0.0467429391605962
llm_goals_427,test,21,0.6756249878022381,0.1304366461429133
llm_goals_427,test,22,0.6756249878022381,0.1246622694694481
llm_goals_427,test,23,0.6756249878022381,0.5644455097827197
llm_goals_427,test,24,0.6756249878022381,0.0414160339225927
llm_goals_427,test,25,0.6756249878022381,0.8926284254200217
llm_goals_427,test,26,0.6756249878022381,0.0591453922508401
llm_goals_427,test,27,0.6756249878022381,0.5016671352552752
llm_goals_427,test,28,0.6756249878022381,0.9189449605602464
llm_goals_427,test,29,0.6756249878022381,0.5267252864404038
llm_goals_427,test,30,0.6756249878022381,0.3196802851986922
llm_goals_427,test,31,0.6756249878022381,0.0622742618121558
llm_goals_427,test,32,0.6756249878022381,0.2393552597896355
llm_goals_427,test,33,0.6756249878022381,0.0317774218950805
llm_goals_427,test,34,0.6756249878022381,0.2969897604985466
llm_goals_427,test,35,0.6756249878022381,0.911826685378058
llm_goals_427,test,36,0.6756249878022381,0.5044385498946317
llm_goals_427,test,37,0.6756249878022381,0.961152239017662
llm_goals_427,test,38,0.6756249878022381,0.383885411527425
llm_goals_427,test,39,0.6756249878022381,0.0767754062509803
llm_goals_427,test,40,0.6756249878022381,0.3019915478879681
llm_goals_427,test,41,0.6756249878022381,0.0597208539505394
llm_goals_427,test,42,0.6756249878022381,0.9798415326165176
llm_goals_427,test,43,0.6756249878022381,0.0828234646890313
llm_goals_427,test,44,0.6756249878022381,0.1075404432723246
llm_goals_427,test,45,0.6756249878022381,0.9497563751433828
llm_goals_427,test,46,0.6756249878022381,0.2027056215184361
llm_goals_427,test,47,0.6756249878022381,0.9493266919171398
llm_goals_427,test,48,0.6756249878022381,0.0344289143960405
llm_goals_427,test,49,0.6756249878022381,0.1952894749193552
llm_goals_186,test,0,0.6717568347874354,0.534925569771277
llm_goals_186,test,1,0.6717568347874354,0.0649953944046378
llm_goals_186,test,2,0.6717568347874354,0.91763923479236
llm_goals_186,test,3,0.6717568347874354,0.3425021516930106
llm_goals_186,test,4,0.6717568347874354,0.1153021531057396
llm_goals_186,test,5,0.6717568347874354,0.7928793741281699
llm_goals_186,test,6,0.6717568347874354,0.9038094070559602
llm_goals_186,test,7,0.6717568347874354,0.6367372560980368
llm_goals_186,test,8,0.6717568347874354,0.2126364849604726
llm_goals_186,test,9,0.6717568347874354,0.8694824597543704
llm_goals_186,test,10,0.6717568347874354,0.5802607311846129
llm_goals_186,test,11,0.6717568347874354,0.2225491999116792
llm_goals_186,test,12,0.6717568347874354,0.2300986684078339
llm_goals_186,test,13,0.6717568347874354,0.9257638147127129
llm_goals_186,test,14,0.6717568347874354,0.1695718974503099
llm_goals_186,test,15,0.6717568347874354,0.151038541979901
llm_goals_186,test,16,0.6717568347874354,0.0464142133590747
llm_goals_186,test,17,0.6717568347874354,0.0732763222959853
llm_goals_186,test,18,0.6717568347874354,0.0482171595539919
llm_goals_186,test,19,0.6717568347874354,0.347547591319228
llm_goals_186,test,20,0.6717568347874354,0.1739822028354879
llm_goals_186,test,21,0.6717568347874354,0.9541198242132036
llm_goals_186,test,22,0.6717568347874354,0.049497112506125
llm_goals_186,test,23,0.6717568347874354,0.1810016520865223
llm_goals_186,test,24,0.6717568347874354,0.1851077351512521
llm_goals_186,test,25,0.6717568347874354,0.6713192505556377
llm_goals_186,test,26,0.6717568347874354,0.0711032925420902
llm_goals_186,test,27,0.6717568347874354,0.4081627252904761
llm_goals_186,test,28,0.6717568347874354,0.2745405964802801
llm_goals_186,test,29,0.6717568347874354,0.1854855714896691
llm_goals_186,test,30,0.6717568347874354,0.7354449882906446
llm_goals_186,test,31,0.6717568347874354,0.9912562823764032
llm_goals_186,test,32,0.6717568347874354,0.2618042375153737
llm_goals_186,test,33,0.6717568347874354,0.0337875336716617
llm_goals_186,test,34,0.6717568347874354,0.6428971957222914
llm_goals_186,test,35,0.6717568347874354,0.7900459432200765
llm_goals_186,test,36,0.6717568347874354,0.8730032999439788
llm_goals_186,test,37,0.6717568347874354,0.0649927594327202
llm_goals_186,test,38,0.6717568347874354,0.0471132735562561
llm_goals_186,test,39,0.6717568347874354,0.2481877539812294
llm_goals_186,test,40,0.6717568347874354,0.2111860555781098
llm_goals_186,test,41,0.6717568347874354,0.8712882416841639
llm_goals_186,test,42,0.6717568347874354,0.6193248853412385
llm_goals_186,test,43,0.6717568347874354,0.8760979623283635
llm_goals_186,test,44,0.6717568347874354,0.0767958111106498
llm_goals_186,test,45,0.6717568347874354,0.0848440049881495
llm_goals_186,test,46,0.6717568347874354,0.6601266976660584
llm_goals_186,test,47,0.6717568347874354,0.4818652455075419
llm_goals_186,test,48,0.6717568347874354,0.1752603358335205
llm_goals_186,test,49,0.6717568347874354,0.027320507820661
llm_goals_133,test,0,0.47283645143861486,0.1030518399074919
llm_goals_133,test,1,0.47283645143861486,0.1009270067527766
llm_goals_133,test,2,0.47283645143861486,0.4669147668825159
llm_goals_133,test,3,0.47283645143861486,0.9886211587587188
llm_goals_133,test,4,0.47283645143861486,0.6589999206031925
llm_goals_133,test,5,0.47283645143861486,0.0478680529217008
llm_goals_133,test,6,0.47283645143861486,0.0213367665689539
llm_goals_133,test,7,0.47283645143861486,0.06300162626541
llm_goals_133,test,8,0.47283645143861486,0.8613404237563876
llm_goals_133,test,9,0.47283645143861486,0.0502374017351794
llm_goals_133,test,10,0.47283645143861486,0.0728398857397339
llm_goals_133,test,11,0.47283645143861486,0.0886358546776828
llm_goals_133,test,12,0.47283645143861486,0.4714116383526195
llm_goals_133,test,13,0.47283645143861486,0.0406440348343292
llm_goals_133,test,14,0.47283645143861486,0.8416674339341796
llm_goals_133,test,15,0.47283645143861486,0.5989281494815651
llm_goals_133,test,16,0.47283645143861486,0.9641061261695968
llm_goals_133,test,17,0.47283645143861486,0.0521719884710187
llm_goals_133,test,18,0.47283645143861486,0.9257678218156756
llm_goals_133,test,19,0.47283645143861486,0.0409677417198195
llm_goals_133,test,20,0.47283645143861486,0.9201317528016504
llm_goals_133,test,21,0.47283645143861486,0.0611858046803647
llm_goals_133,test,22,0.47283645143861486,0.0749444450486417
llm_goals_133,test,23,0.47283645143861486,0.484676139228053
llm_goals_133,test,24,0.47283645143861486,0.8221724152075577
llm_goals_133,test,25,0.47283645143861486,0.2957602203771531
llm_goals_133,test,26,0.47283645143861486,0.8046360378637115
llm_goals_133,test,27,0.47283645143861486,0.0759761030516968
llm_goals_133,test,28,0.47283645143861486,0.9366340572155704
llm_goals_133,test,29,0.47283645143861486,0.1272708658186502
llm_goals_133,test,30,0.47283645143861486,0.1227999985147976
llm_goals_133,test,31,0.47283645143861486,0.0136010194313778
llm_goals_133,test,32,0.47283645143861486,0.3597276462870885
llm_goals_133,test,33,0.47283645143861486,0.8726937465962196
llm_goals_133,test,34,0.47283645143861486,0.2894476365444396
llm_goals_133,test,35,0.47283645143861486,0.0165111879681815
llm_goals_133,test,36,0.47283645143861486,0.0576655273020702
llm_goals_133,test,37,0.47283645143861486,0.2554780098122276
llm_goals_133,test,38,0.47283645143861486,0.032809734462924
llm_goals_133,test,39,0.47283645143861486,0.1481243946785008
llm_goals_133,test,40,0.47283645143861486,0.4462128198301662
llm_goals_133,test,41,0.47283645143861486,0.093264815138027
llm_goals_133,test,42,0.47283645143861486,0.2383228605626679
llm_goals_133,test,43,0.47283645143861486,0.196654087051587
llm_goals_133,test,44,0.47283645143861486,0.9747002088111656
llm_goals_133,test,45,0.47283645143861486,0.9831163433792584
llm_goals_133,test,46,0.47283645143861486,0.1097011751248294
llm_goals_133,test,47,0.47283645143861486,0.8283354147237331
llm_goals_133,test,48,0.47283645143861486,0.8799294836893965
llm_goals_133,test,49,0.47283645143861486,0.2364671831052382
llm_goals_81,test,0,0.2806913635026799,0.1758977435560022
llm_goals_81,test,1,0.2806913635026799,0.4421252700970533
llm_goals_81,test,2,0.2806913635026799,0.5612444031805882
llm_goals_81,test,3,0.2806913635026799,0.3079533253993743
llm_goals_81,test,4,0.2806913635026799,0.1763212150593861
llm_goals_81,test,5,0.2806913635026799,0.9704465583106344
llm_goals_81,test,6,0.2806913635026799,0.9821312875358365
llm_goals_81,test,7,0.2806913635026799,0.3270685617728195
llm_goals_81,test,8,0.2806913635026799,0.4843756215736013
llm_goals_81,test,9,0.2806913635026799,0.9933654977534896
llm_goals_81,test,10,0.2806913635026799,0.4711097472541105
llm_goals_81,test,11,0.2806913635026799,0.1673212093996636
llm_goals_81,test,12,0.2806913635026799,0.2643530158966523
llm_goals_81,test,13,0.2806913635026799,0.9714035818561728
llm_goals_81,test,14,0.2806913635026799,0.9265405587707818
llm_goals_81,test,15,0.2806913635026799,0.1723195082090535
llm_goals_81,test,16,0.2806913635026799,0.9360974516501586
llm_goals_81,test,17,0.2806913635026799,0.4363540220565442
llm_goals_81,test,18,0.2806913635026799,0.9611565911249424
llm_goals_81,test,19,0.2806913635026799,0.0324757314893466
llm_goals_81,test,20,0.2806913635026799,0.6006056520074408
llm_goals_81,test,21,0.2806913635026799,0.9971859123159944
llm_goals_81,test,22,0.2806913635026799,0.0870371051461664
llm_goals_81,test,23,0.2806913635026799,0.2408633212672459
llm_goals_81,test,24,0.2806913635026799,0.9951702226622482
llm_goals_81,test,25,0.2806913635026799,0.6867633490140795
llm_goals_81,test,26,0.2806913635026799,0.9718244652881064
llm_goals_81,test,27,0.2806913635026799,0.4588186617124049
llm_goals_81,test,28,0.2806913635026799,0.5322330497164953
llm_goals_81,test,29,0.2806913635026799,0.2121016556019813
llm_goals_81,test,30,0.2806913635026799,0.6774810136296258
llm_goals_81,test,31,0.2806913635026799,0.9816113605758902
llm_goals_81,test,32,0.2806913635026799,0.2656694493977183
llm_goals_81,test,33,0.2806913635026799,0.942492448912156
llm_goals_81,test,34,0.2806913635026799,0.6429005762747164
llm_goals_81,test,35,0.2806913635026799,0.1528167702888629
llm_goals_81,test,36,0.2806913635026799,0.4512348514816248
llm_goals_81,test,37,0.2806913635026799,0.0605006450173409
llm_goals_81,test,38,0.2806913635026799,0.0274755323758623
llm_goals_81,test,39,0.2806913635026799,0.2279901766778581
llm_goals_81,test,40,0.2806913635026799,0.2775541527352398
llm_goals_81,test,41,0.2806913635026799,0.9829489706314426
llm_goals_81,test,42,0.2806913635026799,0.2494339762077133
llm_goals_81,test,43,0.2806913635026799,0.9819424303599844
llm_goals_81,test,44,0.2806913635026799,0.632760349651464
llm_goals_81,test,45,0.2806913635026799,0.090990563553155
llm_goals_81,test,46,0.2806913635026799,0.0910438800719751
llm_goals_81,test,47,0.2806913635026799,0.1292081639058968
llm_goals_81,test,48,0.2806913635026799,0.974747372736112
llm_goals_81,test,49,0.2806913635026799,0.2645580764012665
llm_goals_93,test,0,0.2532637969245347,0.5635269221536086
llm_goals_93,test,1,0.2532637969245347,0.8801163792253427
llm_goals_93,test,2,0.2532637969245347,0.0696003588446044
llm_goals_93,test,3,0.2532637969245347,0.8186048531566104
llm_goals_93,test,4,0.2532637969245347,0.2222011584760154
llm_goals_93,test,5,0.2532637969245347,0.1268359519713418
llm_goals_93,test,6,0.2532637969245347,0.4582622566067956
llm_goals_93,test,7,0.2532637969245347,0.429479690525812
llm_goals_93,test,8,0.2532637969245347,0.1536290973166499
llm_goals_93,test,9,0.2532637969245347,0.6112573193671209
llm_goals_93,test,10,0.2532637969245347,0.7998858649804967
llm_goals_93,test,11,0.2532637969245347,0.5454222135748753
llm_goals_93,test,12,0.2532637969245347,0.2508427619545539
llm_goals_93,test,13,0.2532637969245347,0.0884842413878226
llm_goals_93,test,14,0.2532637969245347,0.6768600290465995
llm_goals_93,test,15,0.2532637969245347,0.0352718405868165
llm_goals_93,test,16,0.2532637969245347,0.8009568965617743
llm_goals_93,test,17,0.2532637969245347,0.8092096317591537
llm_goals_93,test,18,0.2532637969245347,0.963804174465268
llm_goals_93,test,19,0.2532637969245347,0.9058854167265824
llm_goals_93,test,20,0.2532637969245347,0.265390180652688
llm_goals_93,test,21,0.2532637969245347,0.1541113602215154
llm_goals_93,test,22,0.2532637969245347,0.9766790566784582
llm_goals_93,test,23,0.2532637969245347,0.7843335253318285
llm_goals_93,test,24,0.2532637969245347,0.548404369330273
llm_goals_93,test,25,0.2532637969245347,0.9813529135147334
llm_goals_93,test,26,0.2532637969245347,0.9397963116499958
llm_goals_93,test,27,0.2532637969245347,0.542547443300257
llm_goals_93,test,28,0.2532637969245347,0.8277938193324692
llm_goals_93,test,29,0.2532637969245347,0.8549419878819347
llm_goals_93,test,30,0.2532637969245347,0.9761371695174176
llm_goals_93,test,31,0.2532637969245347,0.1774015734695253
llm_goals_93,test,32,0.2532637969245347,0.9590755456587298
llm_goals_93,test,33,0.2532637969245347,0.9496314531215296
llm_goals_93,test,34,0.2532637969245347,0.9112802317013324
llm_goals_93,test,35,0.2532637969245347,0.0646469314244137
llm_goals_93,test,36,0.2532637969245347,0.965643964207344
llm_goals_93,test,37,0.2532637969245347,0.963180821243277
llm_goals_93,test,38,0.2532637969245347,0.9411316422109696
llm_goals_93,test,39,0.2532637969245347,0.1075404372822008
llm_goals_93,test,40,0.2532637969245347,0.959466160286712
llm_goals_93,test,41,0.2532637969245347,0.3698215332403156
llm_goals_93,test,42,0.2532637969245347,0.1589404653011508
llm_goals_93,test,43,0.2532637969245347,0.2338719832936831
llm_goals_93,test,44,0.2532637969245347,0.1124984808029749
llm_goals_93,test,45,0.2532637969245347,0.866543330684459
llm_goals_93,test,46,0.2532637969245347,0.8519759554788342
llm_goals_93,test,47,0.2532637969245347,0.8737971308795239
llm_goals_93,test,48,0.2532637969245347,0.8916334225039363
llm_goals_93,test,49,0.2532637969245347,0.8758339889840314
llm_goals_401,test,0,0.24063528708817308,0.1359674012107803
llm_goals_401,test,1,0.24063528708817308,0.939276601509621
llm_goals_401,test,2,0.24063528708817308,0.3090277756984529
llm_goals_401,test,3,0.24063528708817308,0.2822982814806737
llm_goals_401,test,4,0.24063528708817308,0.9227317209028506
llm_goals_401,test,5,0.24063528708817308,0.0683562610885711
llm_goals_401,test,6,0.24063528708817308,0.1529393504632372
llm_goals_401,test,7,0.24063528708817308,0.2291880493623187
llm_goals_401,test,8,0.24063528708817308,0.910221445630232
llm_goals_401,test,9,0.24063528708817308,0.0669374443869285
llm_goals_401,test,10,0.24063528708817308,0.2562041584734201
llm_goals_401,test,11,0.24063528708817308,0.1977345307962301
llm_goals_401,test,12,0.24063528708817308,0.9351182671047276
llm_goals_401,test,13,0.24063528708817308,0.084239780653768
llm_goals_401,test,14,0.24063528708817308,0.3803121877997557
llm_goals_401,test,15,0.24063528708817308,0.9255856152963072
llm_goals_401,test,16,0.24063528708817308,0.2187242193427731
llm_goals_401,test,17,0.24063528708817308,0.9062633304766484
llm_goals_401,test,18,0.24063528708817308,0.0989866685824555
llm_goals_401,test,19,0.24063528708817308,0.0798642603957049
llm_goals_401,test,20,0.24063528708817308,0.7283447799445965
llm_goals_401,test,21,0.24063528708817308,0.3040102668224276
llm_goals_401,test,22,0.24063528708817308,0.8871123935548803
llm_goals_401,test,23,0.24063528708817308,0.6306703155992205
llm_goals_401,test,24,0.24063528708817308,0.342468541641041
llm_goals_401,test,25,0.24063528708817308,0.0306332962828717
llm_goals_401,test,26,0.24063528708817308,0.1178928014307589
llm_goals_401,test,27,0.24063528708817308,0.8247832937930811
llm_goals_401,test,28,0.24063528708817308,0.3694959007053917
llm_goals_401,test,29,0.24063528708817308,0.0798909574616735
llm_goals_401,test,30,0.24063528708817308,0.3951674202836078
llm_goals_401,test,31,0.24063528708817308,0.466307960095254
llm_goals_401,test,32,0.24063528708817308,0.1971577420397864
llm_goals_401,test,33,0.24063528708817308,0.1760928155683087
llm_goals_401,test,34,0.24063528708817308,0.2047678657851429
llm_goals_401,test,35,0.24063528708817308,0.2637872561841102
llm_goals_401,test,36,0.24063528708817308,0.4724849406439279
llm_goals_401,test,37,0.24063528708817308,0.0192510310263775
llm_goals_401,test,38,0.24063528708817308,0.1812826057265395
llm_goals_401,test,39,0.24063528708817308,0.905821781657468
llm_goals_401,test,40,0.24063528708817308,0.1146947001091413
llm_goals_401,test,41,0.24063528708817308,0.1032293515072512
llm_goals_401,test,42,0.24063528708817308,0.3834835806051595
llm_goals_401,test,43,0.24063528708817308,0.2508475125103526
llm_goals_401,test,44,0.24063528708817308,0.8248843542416243
llm_goals_401,test,45,0.24063528708817308,0.5847666727108293
llm_goals_401,test,46,0.24063528708817308,0.4045147001032884
llm_goals_401,test,47,0.24063528708817308,0.6278339401682421
llm_goals_401,test,48,0.24063528708817308,0.1361878043204594
llm_goals_401,test,49,0.24063528708817308,0.8435596200846341
