template_id,split,question_idx,prediction,label
llm_goals_401,test,0,0.8578925947324344,0.9578712581802692
llm_goals_401,test,1,0.8578925947324344,0.9541386350517288
llm_goals_401,test,2,0.8578925947324344,0.957633375223842
llm_goals_401,test,3,0.8578925947324344,0.939051149330178
llm_goals_401,test,4,0.8578925947324344,0.977310418686652
llm_goals_401,test,5,0.8578925947324344,0.9809432028055692
llm_goals_401,test,6,0.8578925947324344,0.9755462400413056
llm_goals_401,test,7,0.8578925947324344,0.9511837371803112
llm_goals_401,test,8,0.8578925947324344,0.9766189453717342
llm_goals_401,test,9,0.8578925947324344,0.980273604068012
llm_goals_401,test,10,0.8578925947324344,0.9337562348751304
llm_goals_401,test,11,0.8578925947324344,0.9722627409957164
llm_goals_401,test,12,0.8578925947324344,0.9492781746196448
llm_goals_401,test,13,0.8578925947324344,0.9655717616666432
llm_goals_401,test,14,0.8578925947324344,0.9574255360215488
llm_goals_401,test,15,0.8578925947324344,0.981384516529317
llm_goals_401,test,16,0.8578925947324344,0.9222335225671268
llm_goals_401,test,17,0.8578925947324344,0.9532549975325786
llm_goals_401,test,18,0.8578925947324344,0.9602041260526504
llm_goals_401,test,19,0.8578925947324344,0.6478757906857974
llm_goals_401,test,20,0.8578925947324344,0.9756843455136628
llm_goals_401,test,21,0.8578925947324344,0.990806877474314
llm_goals_401,test,22,0.8578925947324344,0.9781303405092489
llm_goals_401,test,23,0.8578925947324344,0.9417706148309914
llm_goals_401,test,24,0.8578925947324344,0.956336258298358
llm_goals_401,test,25,0.8578925947324344,0.9313769351906296
llm_goals_401,test,26,0.8578925947324344,0.979961037598938
llm_goals_401,test,27,0.8578925947324344,0.9393076331919324
llm_goals_401,test,28,0.8578925947324344,0.8926497724419561
llm_goals_401,test,29,0.8578925947324344,0.9039012216839892
llm_goals_401,test,30,0.8578925947324344,0.95604890766277
llm_goals_401,test,31,0.8578925947324344,0.9892266395215328
llm_goals_401,test,32,0.8578925947324344,0.9539506448444212
llm_goals_401,test,33,0.8578925947324344,0.96642041239244
llm_goals_401,test,34,0.8578925947324344,0.9213858238598618
llm_goals_401,test,35,0.8578925947324344,0.9778974644047042
llm_goals_401,test,36,0.8578925947324344,0.9268431675812392
llm_goals_401,test,37,0.8578925947324344,0.8127340038962743
llm_goals_401,test,38,0.8578925947324344,0.9302681059523448
llm_goals_401,test,39,0.8578925947324344,0.965603948473316
llm_goals_401,test,40,0.8578925947324344,0.9546924251425224
llm_goals_401,test,41,0.8578925947324344,0.9801422355796748
llm_goals_401,test,42,0.8578925947324344,0.942841528380264
llm_goals_401,test,43,0.8578925947324344,0.9624654057275208
llm_goals_401,test,44,0.8578925947324344,0.966766237132969
llm_goals_401,test,45,0.8578925947324344,0.9166605495286292
llm_goals_401,test,46,0.8578925947324344,0.9735371475107132
llm_goals_401,test,47,0.8578925947324344,0.9170851722665576
llm_goals_401,test,48,0.8578925947324344,0.9537843477184356
llm_goals_401,test,49,0.8578925947324344,0.9543297303993916
llm_goals_438,test,0,0.9430683191467101,0.7747630551513792
llm_goals_438,test,1,0.9430683191467101,0.935855152767207
llm_goals_438,test,2,0.9430683191467101,0.7147502234092127
llm_goals_438,test,3,0.9430683191467101,0.8761475031821572
llm_goals_438,test,4,0.9430683191467101,0.8370855426053896
llm_goals_438,test,5,0.9430683191467101,0.9507074946857058
llm_goals_438,test,6,0.9430683191467101,0.9429353481406656
llm_goals_438,test,7,0.9430683191467101,0.7990903812700391
llm_goals_438,test,8,0.9430683191467101,0.8538515570307835
llm_goals_438,test,9,0.9430683191467101,0.9386380912818448
llm_goals_438,test,10,0.9430683191467101,0.6740432265841833
llm_goals_438,test,11,0.9430683191467101,0.923251629590114
llm_goals_438,test,12,0.9430683191467101,0.9507690082509844
llm_goals_438,test,13,0.9430683191467101,0.9289195559017176
llm_goals_438,test,14,0.9430683191467101,0.9291442660965707
llm_goals_438,test,15,0.9430683191467101,0.7999125079987789
llm_goals_438,test,16,0.9430683191467101,0.88095736898606
llm_goals_438,test,17,0.9430683191467101,0.9601117963812904
llm_goals_438,test,18,0.9430683191467101,0.9583113794533262
llm_goals_438,test,19,0.9430683191467101,0.95757842004367
llm_goals_438,test,20,0.9430683191467101,0.8569924879179522
llm_goals_438,test,21,0.9430683191467101,0.925142229626847
llm_goals_438,test,22,0.9430683191467101,0.969126404096814
llm_goals_438,test,23,0.9430683191467101,0.9270654345691632
llm_goals_438,test,24,0.9430683191467101,0.9447244425458496
llm_goals_438,test,25,0.9430683191467101,0.8921203628029744
llm_goals_438,test,26,0.9430683191467101,0.8840255122167773
llm_goals_438,test,27,0.9430683191467101,0.9518933904854712
llm_goals_438,test,28,0.9430683191467101,0.9239946006518056
llm_goals_438,test,29,0.9430683191467101,0.967243014785835
llm_goals_438,test,30,0.9430683191467101,0.6513131257391838
llm_goals_438,test,31,0.9430683191467101,0.9452766773393708
llm_goals_438,test,32,0.9430683191467101,0.8986559507515572
llm_goals_438,test,33,0.9430683191467101,0.9178363106363248
llm_goals_438,test,34,0.9430683191467101,0.58431126605279
llm_goals_438,test,35,0.9430683191467101,0.8549510299218779
llm_goals_438,test,36,0.9430683191467101,0.7795077576161488
llm_goals_438,test,37,0.9430683191467101,0.942087231678633
llm_goals_438,test,38,0.9430683191467101,0.9569196102046018
llm_goals_438,test,39,0.9430683191467101,0.6285572658291573
llm_goals_438,test,40,0.9430683191467101,0.9166060095399312
llm_goals_438,test,41,0.9430683191467101,0.9583812359561668
llm_goals_438,test,42,0.9430683191467101,0.7214403769582053
llm_goals_438,test,43,0.9430683191467101,0.953284323393524
llm_goals_438,test,44,0.9430683191467101,0.8806080817389553
llm_goals_438,test,45,0.9430683191467101,0.92897343737164
llm_goals_438,test,46,0.9430683191467101,0.9584044214292112
llm_goals_438,test,47,0.9430683191467101,0.8794537151734262
llm_goals_438,test,48,0.9430683191467101,0.9488244649817108
llm_goals_438,test,49,0.9430683191467101,0.96985775201818
llm_goals_293,test,0,0.889525429821455,0.8120835453586716
llm_goals_293,test,1,0.889525429821455,0.6480853571933485
llm_goals_293,test,2,0.889525429821455,0.6079345474456403
llm_goals_293,test,3,0.889525429821455,0.6129396608114358
llm_goals_293,test,4,0.889525429821455,0.98210900952278
llm_goals_293,test,5,0.889525429821455,0.8658899081858322
llm_goals_293,test,6,0.889525429821455,0.8882423636795116
llm_goals_293,test,7,0.889525429821455,0.8509290855710241
llm_goals_293,test,8,0.889525429821455,0.9446962492710368
llm_goals_293,test,9,0.889525429821455,0.7513049230182386
llm_goals_293,test,10,0.889525429821455,0.9177243110970909
llm_goals_293,test,11,0.889525429821455,0.745101023404262
llm_goals_293,test,12,0.889525429821455,0.938155530986403
llm_goals_293,test,13,0.889525429821455,0.93102258486241
llm_goals_293,test,14,0.889525429821455,0.9835613372030028
llm_goals_293,test,15,0.889525429821455,0.9863449336337948
llm_goals_293,test,16,0.889525429821455,0.9708489179126024
llm_goals_293,test,17,0.889525429821455,0.6973515732177806
llm_goals_293,test,18,0.889525429821455,0.9506214255847638
llm_goals_293,test,19,0.889525429821455,0.8167264479797811
llm_goals_293,test,20,0.889525429821455,0.9863548279811404
llm_goals_293,test,21,0.889525429821455,0.7980274506980439
llm_goals_293,test,22,0.889525429821455,0.6721615182655347
llm_goals_293,test,23,0.889525429821455,0.3710465401115394
llm_goals_293,test,24,0.889525429821455,0.9595301158883638
llm_goals_293,test,25,0.889525429821455,0.958163618329278
llm_goals_293,test,26,0.889525429821455,0.966849388190172
llm_goals_293,test,27,0.889525429821455,0.8260024784538619
llm_goals_293,test,28,0.889525429821455,0.8388491865678236
llm_goals_293,test,29,0.889525429821455,0.8884818588260758
llm_goals_293,test,30,0.889525429821455,0.918233934226988
llm_goals_293,test,31,0.889525429821455,0.7707225792789547
llm_goals_293,test,32,0.889525429821455,0.8156692405787661
llm_goals_293,test,33,0.889525429821455,0.9365220048324068
llm_goals_293,test,34,0.889525429821455,0.9379748130481748
llm_goals_293,test,35,0.889525429821455,0.8901683114693926
llm_goals_293,test,36,0.889525429821455,0.8493608200921786
llm_goals_293,test,37,0.889525429821455,0.861633780857663
llm_goals_293,test,38,0.889525429821455,0.9021887179891658
llm_goals_293,test,39,0.889525429821455,0.9140409207490428
llm_goals_293,test,40,0.889525429821455,0.7293724502897094
llm_goals_293,test,41,0.889525429821455,0.9162639417701852
llm_goals_293,test,42,0.889525429821455,0.8334788131423683
llm_goals_293,test,43,0.889525429821455,0.7597774188725597
llm_goals_293,test,44,0.889525429821455,0.9659911986912778
llm_goals_293,test,45,0.889525429821455,0.931854425798201
llm_goals_293,test,46,0.889525429821455,0.5591331662726297
llm_goals_293,test,47,0.889525429821455,0.8162434715058863
llm_goals_293,test,48,0.889525429821455,0.9539650091821064
llm_goals_293,test,49,0.889525429821455,0.7483454415724036
llm_goals_397,test,0,0.3774379807031319,0.6336495795213035
llm_goals_397,test,1,0.3774379807031319,0.5588590528022535
llm_goals_397,test,2,0.3774379807031319,0.8967757860893129
llm_goals_397,test,3,0.3774379807031319,0.5944806240686361
llm_goals_397,test,4,0.3774379807031319,0.2252168546192252
llm_goals_397,test,5,0.3774379807031319,0.4122469495302511
llm_goals_397,test,6,0.3774379807031319,0.6366335121435647
llm_goals_397,test,7,0.3774379807031319,0.8096849879343126
llm_goals_397,test,8,0.3774379807031319,0.2219286497366863
llm_goals_397,test,9,0.3774379807031319,0.3790244200754085
llm_goals_397,test,10,0.3774379807031319,0.5739754985147579
llm_goals_397,test,11,0.3774379807031319,0.5146662099973958
llm_goals_397,test,12,0.3774379807031319,0.7724721370318186
llm_goals_397,test,13,0.3774379807031319,0.5128249643851043
llm_goals_397,test,14,0.3774379807031319,0.7029672903171433
llm_goals_397,test,15,0.3774379807031319,0.1755089749954058
llm_goals_397,test,16,0.3774379807031319,0.5780643909290929
llm_goals_397,test,17,0.3774379807031319,0.5651405953323156
llm_goals_397,test,18,0.3774379807031319,0.6692897169839361
llm_goals_397,test,19,0.3774379807031319,0.3010834864311782
llm_goals_397,test,20,0.3774379807031319,0.1723383376025849
llm_goals_397,test,21,0.3774379807031319,0.5552848455448852
llm_goals_397,test,22,0.3774379807031319,0.6247249816867365
llm_goals_397,test,23,0.3774379807031319,0.6892307964539947
llm_goals_397,test,24,0.3774379807031319,0.707193144679384
llm_goals_397,test,25,0.3774379807031319,0.4728503384141321
llm_goals_397,test,26,0.3774379807031319,0.6125340479102231
llm_goals_397,test,27,0.3774379807031319,0.638109206443543
llm_goals_397,test,28,0.3774379807031319,0.6131846340287811
llm_goals_397,test,29,0.3774379807031319,0.3070471542438216
llm_goals_397,test,30,0.3774379807031319,0.5305219388850028
llm_goals_397,test,31,0.3774379807031319,0.5467284805801325
llm_goals_397,test,32,0.3774379807031319,0.6052179554793606
llm_goals_397,test,33,0.3774379807031319,0.6898052709387655
llm_goals_397,test,34,0.3774379807031319,0.4488721547034506
llm_goals_397,test,35,0.3774379807031319,0.8279244269125856
llm_goals_397,test,36,0.3774379807031319,0.4830040624014946
llm_goals_397,test,37,0.3774379807031319,0.25459376065388
llm_goals_397,test,38,0.3774379807031319,0.2830348916920439
llm_goals_397,test,39,0.3774379807031319,0.6957841399255769
llm_goals_397,test,40,0.3774379807031319,0.4595589778278475
llm_goals_397,test,41,0.3774379807031319,0.5333267612417034
llm_goals_397,test,42,0.3774379807031319,0.8577821893356561
llm_goals_397,test,43,0.3774379807031319,0.5300958828918404
llm_goals_397,test,44,0.3774379807031319,0.2841438783476365
llm_goals_397,test,45,0.3774379807031319,0.5478091730108666
llm_goals_397,test,46,0.3774379807031319,0.623584984691235
llm_goals_397,test,47,0.3774379807031319,0.5396113255522375
llm_goals_397,test,48,0.3774379807031319,0.6615871853452404
llm_goals_397,test,49,0.3774379807031319,0.4776676395182983
llm_goals_281,test,0,0.9303895898221647,0.7595571331426817
llm_goals_281,test,1,0.9303895898221647,0.9579733612090848
llm_goals_281,test,2,0.9303895898221647,0.7309832638356816
llm_goals_281,test,3,0.9303895898221647,0.909583748095366
llm_goals_281,test,4,0.9303895898221647,0.8390255026542476
llm_goals_281,test,5,0.9303895898221647,0.9811318521618418
llm_goals_281,test,6,0.9303895898221647,0.9764572976382064
llm_goals_281,test,7,0.9303895898221647,0.7324330753461098
llm_goals_281,test,8,0.9303895898221647,0.7994783462392235
llm_goals_281,test,9,0.9303895898221647,0.9815838934803736
llm_goals_281,test,10,0.9303895898221647,0.9535347237148352
llm_goals_281,test,11,0.9303895898221647,0.9162909963751452
llm_goals_281,test,12,0.9303895898221647,0.3257945040794002
llm_goals_281,test,13,0.9303895898221647,0.9844478965422564
llm_goals_281,test,14,0.9303895898221647,0.927134453638218
llm_goals_281,test,15,0.9303895898221647,0.8836817175051781
llm_goals_281,test,16,0.9303895898221647,0.9699068666000064
llm_goals_281,test,17,0.9303895898221647,0.9397605064907452
llm_goals_281,test,18,0.9303895898221647,0.9597848062242011
llm_goals_281,test,19,0.9303895898221647,0.0774181964240286
llm_goals_281,test,20,0.9303895898221647,0.7915892634199072
llm_goals_281,test,21,0.9303895898221647,0.971953988882578
llm_goals_281,test,22,0.9303895898221647,0.9602834573260726
llm_goals_281,test,23,0.9303895898221647,0.9122855662185028
llm_goals_281,test,24,0.9303895898221647,0.8979990468804274
llm_goals_281,test,25,0.9303895898221647,0.9241587506219392
llm_goals_281,test,26,0.9303895898221647,0.9170165050266824
llm_goals_281,test,27,0.9303895898221647,0.9611372957336312
llm_goals_281,test,28,0.9303895898221647,0.87756150859893
llm_goals_281,test,29,0.9303895898221647,0.0434288112667957
llm_goals_281,test,30,0.9303895898221647,0.9342891559515047
llm_goals_281,test,31,0.9303895898221647,0.9743182057709278
llm_goals_281,test,32,0.9303895898221647,0.9397307039659378
llm_goals_281,test,33,0.9303895898221647,0.9512294521408392
llm_goals_281,test,34,0.9303895898221647,0.9536682955508284
llm_goals_281,test,35,0.9303895898221647,0.7535714456504239
llm_goals_281,test,36,0.9303895898221647,0.923856973167726
llm_goals_281,test,37,0.9303895898221647,0.0418935402602879
llm_goals_281,test,38,0.9303895898221647,0.7059133681203931
llm_goals_281,test,39,0.9303895898221647,0.3500755803223985
llm_goals_281,test,40,0.9303895898221647,0.9247009790185582
llm_goals_281,test,41,0.9303895898221647,0.9782058597610022
llm_goals_281,test,42,0.9303895898221647,0.7983229743904063
llm_goals_281,test,43,0.9303895898221647,0.975883662329788
llm_goals_281,test,44,0.9303895898221647,0.8750632399664175
llm_goals_281,test,45,0.9303895898221647,0.8910572538163689
llm_goals_281,test,46,0.9303895898221647,0.8908228852175125
llm_goals_281,test,47,0.9303895898221647,0.9549922359097318
llm_goals_281,test,48,0.9303895898221647,0.953490375608375
llm_goals_281,test,49,0.9303895898221647,0.9719706773426644
llm_goals_415,test,0,0.8220192566414418,0.8577433203043316
llm_goals_415,test,1,0.8220192566414418,0.9021974832977488
llm_goals_415,test,2,0.8220192566414418,0.8694165318475334
llm_goals_415,test,3,0.8220192566414418,0.82278495857052
llm_goals_415,test,4,0.8220192566414418,0.9068547493871278
llm_goals_415,test,5,0.8220192566414418,0.4606612308159887
llm_goals_415,test,6,0.8220192566414418,0.5138990722916633
llm_goals_415,test,7,0.8220192566414418,0.7904330429356278
llm_goals_415,test,8,0.8220192566414418,0.8709577911266214
llm_goals_415,test,9,0.8220192566414418,0.4953228711784456
llm_goals_415,test,10,0.8220192566414418,0.8458883220009739
llm_goals_415,test,11,0.8220192566414418,0.7530689318495781
llm_goals_415,test,12,0.8220192566414418,0.5374074070351774
llm_goals_415,test,13,0.8220192566414418,0.4543814478672013
llm_goals_415,test,14,0.8220192566414418,0.895305392435367
llm_goals_415,test,15,0.8220192566414418,0.8949400812124582
llm_goals_415,test,16,0.8220192566414418,0.8238564098543186
llm_goals_415,test,17,0.8220192566414418,0.7003946285795368
llm_goals_415,test,18,0.8220192566414418,0.8541047516491939
llm_goals_415,test,19,0.8220192566414418,0.4356960950136901
llm_goals_415,test,20,0.8220192566414418,0.8781125499856784
llm_goals_415,test,21,0.8220192566414418,0.4662951793594435
llm_goals_415,test,22,0.8220192566414418,0.9133476600123868
llm_goals_415,test,23,0.8220192566414418,0.729661283414631
llm_goals_415,test,24,0.8220192566414418,0.8203684726547874
llm_goals_415,test,25,0.8220192566414418,0.8415742531339464
llm_goals_415,test,26,0.8220192566414418,0.9206447035427088
llm_goals_415,test,27,0.8220192566414418,0.8224443724423657
llm_goals_415,test,28,0.8220192566414418,0.7688508117653093
llm_goals_415,test,29,0.8220192566414418,0.4040278781550455
llm_goals_415,test,30,0.8220192566414418,0.8326128082774296
llm_goals_415,test,31,0.8220192566414418,0.5181213462550505
llm_goals_415,test,32,0.8220192566414418,0.7754768797937415
llm_goals_415,test,33,0.8220192566414418,0.8137893713459559
llm_goals_415,test,34,0.8220192566414418,0.8569270432280164
llm_goals_415,test,35,0.8220192566414418,0.7699967690808278
llm_goals_415,test,36,0.8220192566414418,0.921674433414038
llm_goals_415,test,37,0.8220192566414418,0.4660833031516516
llm_goals_415,test,38,0.8220192566414418,0.65152560988785
llm_goals_415,test,39,0.8220192566414418,0.5898309243469293
llm_goals_415,test,40,0.8220192566414418,0.8091818666854369
llm_goals_415,test,41,0.8220192566414418,0.6069718569678856
llm_goals_415,test,42,0.8220192566414418,0.801905695679187
llm_goals_415,test,43,0.8220192566414418,0.7026985943405766
llm_goals_415,test,44,0.8220192566414418,0.8893336073229712
llm_goals_415,test,45,0.8220192566414418,0.7374717538757577
llm_goals_415,test,46,0.8220192566414418,0.7627238714563013
llm_goals_415,test,47,0.8220192566414418,0.8843601962700689
llm_goals_415,test,48,0.8220192566414418,0.8760370596393947
llm_goals_415,test,49,0.8220192566414418,0.934119643218544
llm_goals_228,test,0,0.49505747658080396,0.5536142490727757
llm_goals_228,test,1,0.49505747658080396,0.5970781946787781
llm_goals_228,test,2,0.49505747658080396,0.6661069439112477
llm_goals_228,test,3,0.49505747658080396,0.1621815926046939
llm_goals_228,test,4,0.49505747658080396,0.576352949396635
llm_goals_228,test,5,0.49505747658080396,0.3840882428737504
llm_goals_228,test,6,0.49505747658080396,0.3586276503372383
llm_goals_228,test,7,0.49505747658080396,0.6176623614140859
llm_goals_228,test,8,0.49505747658080396,0.6954425570040618
llm_goals_228,test,9,0.49505747658080396,0.259004657946923
llm_goals_228,test,10,0.49505747658080396,0.7034691604166908
llm_goals_228,test,11,0.49505747658080396,0.3667773177860855
llm_goals_228,test,12,0.49505747658080396,0.5441412387152404
llm_goals_228,test,13,0.49505747658080396,0.1798966425933617
llm_goals_228,test,14,0.49505747658080396,0.6634600123551451
llm_goals_228,test,15,0.49505747658080396,0.5674040322938352
llm_goals_228,test,16,0.49505747658080396,0.7765365728525085
llm_goals_228,test,17,0.49505747658080396,0.4222217460157005
llm_goals_228,test,18,0.49505747658080396,0.7662538791291613
llm_goals_228,test,19,0.49505747658080396,0.551409534979895
llm_goals_228,test,20,0.49505747658080396,0.6118689802554753
llm_goals_228,test,21,0.49505747658080396,0.4397631653224428
llm_goals_228,test,22,0.49505747658080396,0.4973987580331913
llm_goals_228,test,23,0.49505747658080396,0.4235300043058759
llm_goals_228,test,24,0.49505747658080396,0.7459660834986607
llm_goals_228,test,25,0.49505747658080396,0.7296489537631492
llm_goals_228,test,26,0.49505747658080396,0.7553963575905828
llm_goals_228,test,27,0.49505747658080396,0.4245395914745872
llm_goals_228,test,28,0.49505747658080396,0.2113718455283501
llm_goals_228,test,29,0.49505747658080396,0.5839822372879856
llm_goals_228,test,30,0.49505747658080396,0.7882484823843936
llm_goals_228,test,31,0.49505747658080396,0.3978078935012989
llm_goals_228,test,32,0.49505747658080396,0.2741357451446661
llm_goals_228,test,33,0.49505747658080396,0.7841096477395639
llm_goals_228,test,34,0.49505747658080396,0.7149417896157899
llm_goals_228,test,35,0.49505747658080396,0.4510400759046654
llm_goals_228,test,36,0.49505747658080396,0.5606685093118066
llm_goals_228,test,37,0.49505747658080396,0.4949700429354497
llm_goals_228,test,38,0.49505747658080396,0.5294251416140277
llm_goals_228,test,39,0.49505747658080396,0.5303236770643239
llm_goals_228,test,40,0.49505747658080396,0.3614923254884982
llm_goals_228,test,41,0.49505747658080396,0.5566797369456766
llm_goals_228,test,42,0.49505747658080396,0.5874469302943671
llm_goals_228,test,43,0.49505747658080396,0.4047568932904402
llm_goals_228,test,44,0.49505747658080396,0.5769778999083791
llm_goals_228,test,45,0.49505747658080396,0.381513250802113
llm_goals_228,test,46,0.49505747658080396,0.3717434970639749
llm_goals_228,test,47,0.49505747658080396,0.1147154724199779
llm_goals_228,test,48,0.49505747658080396,0.8181026530840192
llm_goals_228,test,49,0.49505747658080396,0.3646229970196732
llm_goals_236,test,0,0.8635663976714065,0.7150391262778099
llm_goals_236,test,1,0.8635663976714065,0.6861406620593683
llm_goals_236,test,2,0.8635663976714065,0.871267676778662
llm_goals_236,test,3,0.8635663976714065,0.8072499568065914
llm_goals_236,test,4,0.8635663976714065,0.7988170942289826
llm_goals_236,test,5,0.8635663976714065,0.9525319342810132
llm_goals_236,test,6,0.8635663976714065,0.922369719315248
llm_goals_236,test,7,0.8635663976714065,0.8816325671024458
llm_goals_236,test,8,0.8635663976714065,0.850525379453481
llm_goals_236,test,9,0.8635663976714065,0.8905094280701752
llm_goals_236,test,10,0.8635663976714065,0.8517140753999074
llm_goals_236,test,11,0.8635663976714065,0.568158988781905
llm_goals_236,test,12,0.8635663976714065,0.81539887388713
llm_goals_236,test,13,0.8635663976714065,0.9457094685792072
llm_goals_236,test,14,0.8635663976714065,0.926884118217816
llm_goals_236,test,15,0.8635663976714065,0.6732607492268958
llm_goals_236,test,16,0.8635663976714065,0.9227134615696562
llm_goals_236,test,17,0.8635663976714065,0.6862386995801422
llm_goals_236,test,18,0.8635663976714065,0.9588107473600692
llm_goals_236,test,19,0.8635663976714065,0.4410424607670248
llm_goals_236,test,20,0.8635663976714065,0.7869937367368668
llm_goals_236,test,21,0.8635663976714065,0.9367554776085516
llm_goals_236,test,22,0.8635663976714065,0.6817940522161587
llm_goals_236,test,23,0.8635663976714065,0.6579733541579077
llm_goals_236,test,24,0.8635663976714065,0.9454425582899262
llm_goals_236,test,25,0.8635663976714065,0.8055338192842599
llm_goals_236,test,26,0.8635663976714065,0.9246634247941125
llm_goals_236,test,27,0.8635663976714065,0.5396068227032322
llm_goals_236,test,28,0.8635663976714065,0.7982258737433797
llm_goals_236,test,29,0.8635663976714065,0.3578559150563034
llm_goals_236,test,30,0.8635663976714065,0.831663663699925
llm_goals_236,test,31,0.8635663976714065,0.8995406617766696
llm_goals_236,test,32,0.8635663976714065,0.7293236306375612
llm_goals_236,test,33,0.8635663976714065,0.9457866545397724
llm_goals_236,test,34,0.8635663976714065,0.8364083160174887
llm_goals_236,test,35,0.8635663976714065,0.7920782594120231
llm_goals_236,test,36,0.8635663976714065,0.8063141051706565
llm_goals_236,test,37,0.8635663976714065,0.5136290105021059
llm_goals_236,test,38,0.8635663976714065,0.4514706416931497
llm_goals_236,test,39,0.8635663976714065,0.8644759660227708
llm_goals_236,test,40,0.8635663976714065,0.6572924853656194
llm_goals_236,test,41,0.8635663976714065,0.9311078819261616
llm_goals_236,test,42,0.8635663976714065,0.7421276499016344
llm_goals_236,test,43,0.8635663976714065,0.9182581940665174
llm_goals_236,test,44,0.8635663976714065,0.78992920712052
llm_goals_236,test,45,0.8635663976714065,0.7690354024834042
llm_goals_236,test,46,0.8635663976714065,0.7972039589337531
llm_goals_236,test,47,0.8635663976714065,0.7979662948734613
llm_goals_236,test,48,0.8635663976714065,0.9401202207915952
llm_goals_236,test,49,0.8635663976714065,0.6403300609260552
llm_goals_86,test,0,0.7898772061377882,0.848978225488033
llm_goals_86,test,1,0.7898772061377882,0.5667421908216284
llm_goals_86,test,2,0.7898772061377882,0.9666773097569414
llm_goals_86,test,3,0.7898772061377882,0.6816530119880609
llm_goals_86,test,4,0.7898772061377882,0.7288792743080739
llm_goals_86,test,5,0.7898772061377882,0.5964895998637825
llm_goals_86,test,6,0.7898772061377882,0.8656080931523872
llm_goals_86,test,7,0.7898772061377882,0.847071824665876
llm_goals_86,test,8,0.7898772061377882,0.8023766851830423
llm_goals_86,test,9,0.7898772061377882,0.8243871920658875
llm_goals_86,test,10,0.7898772061377882,0.8687054464050711
llm_goals_86,test,11,0.7898772061377882,0.8881319769937132
llm_goals_86,test,12,0.7898772061377882,0.6590020093828339
llm_goals_86,test,13,0.7898772061377882,0.6733084849210463
llm_goals_86,test,14,0.7898772061377882,0.3116476330682434
llm_goals_86,test,15,0.7898772061377882,0.663392413111642
llm_goals_86,test,16,0.7898772061377882,0.6387773046544254
llm_goals_86,test,17,0.7898772061377882,0.8044010404371023
llm_goals_86,test,18,0.7898772061377882,0.8337891051244346
llm_goals_86,test,19,0.7898772061377882,0.6396502923711483
llm_goals_86,test,20,0.7898772061377882,0.788879332405017
llm_goals_86,test,21,0.7898772061377882,0.6394004244150501
llm_goals_86,test,22,0.7898772061377882,0.8626416934726503
llm_goals_86,test,23,0.7898772061377882,0.7951470614108611
llm_goals_86,test,24,0.7898772061377882,0.7989944850297322
llm_goals_86,test,25,0.7898772061377882,0.5568233615310513
llm_goals_86,test,26,0.7898772061377882,0.7084484057432834
llm_goals_86,test,27,0.7898772061377882,0.752342212713773
llm_goals_86,test,28,0.7898772061377882,0.7815325258308541
llm_goals_86,test,29,0.7898772061377882,0.5424953082979187
llm_goals_86,test,30,0.7898772061377882,0.623081015497586
llm_goals_86,test,31,0.7898772061377882,0.7577194596401322
llm_goals_86,test,32,0.7898772061377882,0.6601579792051269
llm_goals_86,test,33,0.7898772061377882,0.8711616389038969
llm_goals_86,test,34,0.7898772061377882,0.5900015643097076
llm_goals_86,test,35,0.7898772061377882,0.7298998281488869
llm_goals_86,test,36,0.7898772061377882,0.8123467602894
llm_goals_86,test,37,0.7898772061377882,0.6271477319447354
llm_goals_86,test,38,0.7898772061377882,0.7261717872389034
llm_goals_86,test,39,0.7898772061377882,0.6599378021515605
llm_goals_86,test,40,0.7898772061377882,0.8521513981089313
llm_goals_86,test,41,0.7898772061377882,0.7704036243710474
llm_goals_86,test,42,0.7898772061377882,0.8350187493970602
llm_goals_86,test,43,0.7898772061377882,0.7481739555208251
llm_goals_86,test,44,0.7898772061377882,0.6095754460637204
llm_goals_86,test,45,0.7898772061377882,0.7827780278235656
llm_goals_86,test,46,0.7898772061377882,0.7216219938712807
llm_goals_86,test,47,0.7898772061377882,0.5942280347054933
llm_goals_86,test,48,0.7898772061377882,0.9115690572813184
llm_goals_86,test,49,0.7898772061377882,0.8632650981365884
llm_goals_230,test,0,0.8733366609361486,0.8179351702935589
llm_goals_230,test,1,0.8733366609361486,0.8188182051872285
llm_goals_230,test,2,0.8733366609361486,0.826086635244689
llm_goals_230,test,3,0.8733366609361486,0.8927791723378472
llm_goals_230,test,4,0.8733366609361486,0.5912138130658398
llm_goals_230,test,5,0.8733366609361486,0.5729324801938974
llm_goals_230,test,6,0.8733366609361486,0.5531325232730563
llm_goals_230,test,7,0.8733366609361486,0.8021489969603882
llm_goals_230,test,8,0.8733366609361486,0.581443858272074
llm_goals_230,test,9,0.8733366609361486,0.6239073379929715
llm_goals_230,test,10,0.8733366609361486,0.8046756982507505
llm_goals_230,test,11,0.8733366609361486,0.8313074111593964
llm_goals_230,test,12,0.8733366609361486,0.7681956263676517
llm_goals_230,test,13,0.8733366609361486,0.5988426118672923
llm_goals_230,test,14,0.8733366609361486,0.8599042234104695
llm_goals_230,test,15,0.8733366609361486,0.5936393834712063
llm_goals_230,test,16,0.8733366609361486,0.8206661307032131
llm_goals_230,test,17,0.8733366609361486,0.8436086722555165
llm_goals_230,test,18,0.8733366609361486,0.8499366057691331
llm_goals_230,test,19,0.8733366609361486,0.6149675790828681
llm_goals_230,test,20,0.8733366609361486,0.6266825308309105
llm_goals_230,test,21,0.8733366609361486,0.6164414775805864
llm_goals_230,test,22,0.8733366609361486,0.8343809289495249
llm_goals_230,test,23,0.8733366609361486,0.7837306823394206
llm_goals_230,test,24,0.8733366609361486,0.846372128553261
llm_goals_230,test,25,0.8733366609361486,0.7390370859690565
llm_goals_230,test,26,0.8733366609361486,0.8494265096725975
llm_goals_230,test,27,0.8733366609361486,0.8455606124040723
llm_goals_230,test,28,0.8733366609361486,0.8579674965057287
llm_goals_230,test,29,0.8733366609361486,0.5880964942153284
llm_goals_230,test,30,0.8733366609361486,0.8358535771844652
llm_goals_230,test,31,0.8733366609361486,0.5805894006126754
llm_goals_230,test,32,0.8733366609361486,0.7934818259785719
llm_goals_230,test,33,0.8733366609361486,0.834267023337033
llm_goals_230,test,34,0.8733366609361486,0.7892429815800577
llm_goals_230,test,35,0.8733366609361486,0.8120109426774391
llm_goals_230,test,36,0.8733366609361486,0.8267144565859352
llm_goals_230,test,37,0.8733366609361486,0.675275568637887
llm_goals_230,test,38,0.8733366609361486,0.601560060077995
llm_goals_230,test,39,0.8733366609361486,0.7968490736396183
llm_goals_230,test,40,0.8733366609361486,0.8216474607704832
llm_goals_230,test,41,0.8733366609361486,0.5197035792893621
llm_goals_230,test,42,0.8733366609361486,0.8097020966346316
llm_goals_230,test,43,0.8733366609361486,0.5719336953223904
llm_goals_230,test,44,0.8733366609361486,0.5981191789043642
llm_goals_230,test,45,0.8733366609361486,0.8736265335179677
llm_goals_230,test,46,0.8733366609361486,0.8487543997753076
llm_goals_230,test,47,0.8733366609361486,0.862138026666209
llm_goals_230,test,48,0.8733366609361486,0.8476904574354545
llm_goals_230,test,49,0.8733366609361486,0.8333969706647004
llm_goals_206,test,0,0.7674895895832284,0.8559101199930208
llm_goals_206,test,1,0.7674895895832284,0.7879802535556255
llm_goals_206,test,2,0.7674895895832284,0.8428787031752032
llm_goals_206,test,3,0.7674895895832284,0.8372089275473125
llm_goals_206,test,4,0.7674895895832284,0.7926284648989284
llm_goals_206,test,5,0.7674895895832284,0.5153650037350492
llm_goals_206,test,6,0.7674895895832284,0.3343649675741765
llm_goals_206,test,7,0.7674895895832284,0.9070251599505484
llm_goals_206,test,8,0.7674895895832284,0.8455585838330733
llm_goals_206,test,9,0.7674895895832284,0.6389058176485727
llm_goals_206,test,10,0.7674895895832284,0.1182260710030537
llm_goals_206,test,11,0.7674895895832284,0.7467083406482149
llm_goals_206,test,12,0.7674895895832284,0.4574706710312913
llm_goals_206,test,13,0.7674895895832284,0.0931690538173042
llm_goals_206,test,14,0.7674895895832284,0.6621974660772205
llm_goals_206,test,15,0.7674895895832284,0.494185809495628
llm_goals_206,test,16,0.7674895895832284,0.7829698941017894
llm_goals_206,test,17,0.7674895895832284,0.8449901332087761
llm_goals_206,test,18,0.7674895895832284,0.5445193157731812
llm_goals_206,test,19,0.7674895895832284,0.1852277467567061
llm_goals_206,test,20,0.7674895895832284,0.779411075601452
llm_goals_206,test,21,0.7674895895832284,0.8588447585962018
llm_goals_206,test,22,0.7674895895832284,0.6656724760322136
llm_goals_206,test,23,0.7674895895832284,0.7493727269767156
llm_goals_206,test,24,0.7674895895832284,0.9005759943815377
llm_goals_206,test,25,0.7674895895832284,0.6107508047041867
llm_goals_206,test,26,0.7674895895832284,0.6818652741926582
llm_goals_206,test,27,0.7674895895832284,0.101753575918842
llm_goals_206,test,28,0.7674895895832284,0.7895615709538879
llm_goals_206,test,29,0.7674895895832284,0.6033396275372427
llm_goals_206,test,30,0.7674895895832284,0.5204197590718647
llm_goals_206,test,31,0.7674895895832284,0.552048008783336
llm_goals_206,test,32,0.7674895895832284,0.6983551428844045
llm_goals_206,test,33,0.7674895895832284,0.7920455896978277
llm_goals_206,test,34,0.7674895895832284,0.8229582905649624
llm_goals_206,test,35,0.7674895895832284,0.7513486755861682
llm_goals_206,test,36,0.7674895895832284,0.8837921634473136
llm_goals_206,test,37,0.7674895895832284,0.2323070941836299
llm_goals_206,test,38,0.7674895895832284,0.6051056320867053
llm_goals_206,test,39,0.7674895895832284,0.3355604905336211
llm_goals_206,test,40,0.7674895895832284,0.0412251261013626
llm_goals_206,test,41,0.7674895895832284,0.8154974559604902
llm_goals_206,test,42,0.7674895895832284,0.650940780779249
llm_goals_206,test,43,0.7674895895832284,0.8136300459617928
llm_goals_206,test,44,0.7674895895832284,0.7293123065101965
llm_goals_206,test,45,0.7674895895832284,0.7633236130088205
llm_goals_206,test,46,0.7674895895832284,0.7359003505062409
llm_goals_206,test,47,0.7674895895832284,0.1849221570121216
llm_goals_206,test,48,0.7674895895832284,0.5419546416667619
llm_goals_206,test,49,0.7674895895832284,0.7725634685769378
llm_goals_146,test,0,0.5853169093902086,0.4053194295707414
llm_goals_146,test,1,0.5853169093902086,0.77863227297152
llm_goals_146,test,2,0.5853169093902086,0.4040155724720515
llm_goals_146,test,3,0.5853169093902086,0.5871794799134783
llm_goals_146,test,4,0.5853169093902086,0.560196939517166
llm_goals_146,test,5,0.5853169093902086,0.3825763215338447
llm_goals_146,test,6,0.5853169093902086,0.4487256154760436
llm_goals_146,test,7,0.5853169093902086,0.4411791015965565
llm_goals_146,test,8,0.5853169093902086,0.6130303084936348
llm_goals_146,test,9,0.5853169093902086,0.416171525001919
llm_goals_146,test,10,0.5853169093902086,0.8501744885482464
llm_goals_146,test,11,0.5853169093902086,0.4275203540944987
llm_goals_146,test,12,0.5853169093902086,0.1433368859863564
llm_goals_146,test,13,0.5853169093902086,0.3454179305560879
llm_goals_146,test,14,0.5853169093902086,0.3984231289972209
llm_goals_146,test,15,0.5853169093902086,0.7779127849429681
llm_goals_146,test,16,0.5853169093902086,0.3923375995541924
llm_goals_146,test,17,0.5853169093902086,0.7787704480980863
llm_goals_146,test,18,0.5853169093902086,0.4485241820972409
llm_goals_146,test,19,0.5853169093902086,0.3670787385820063
llm_goals_146,test,20,0.5853169093902086,0.5808513911957404
llm_goals_146,test,21,0.5853169093902086,0.348566839291943
llm_goals_146,test,22,0.5853169093902086,0.8201150868695501
llm_goals_146,test,23,0.5853169093902086,0.4340105664556233
llm_goals_146,test,24,0.5853169093902086,0.3779777975457017
llm_goals_146,test,25,0.5853169093902086,0.7064739339171033
llm_goals_146,test,26,0.5853169093902086,0.5068406448496142
llm_goals_146,test,27,0.5853169093902086,0.8190644408840766
llm_goals_146,test,28,0.5853169093902086,0.5180591218776336
llm_goals_146,test,29,0.5853169093902086,0.333344294156815
llm_goals_146,test,30,0.5853169093902086,0.7747827278582075
llm_goals_146,test,31,0.5853169093902086,0.407372660950012
llm_goals_146,test,32,0.5853169093902086,0.410007141610074
llm_goals_146,test,33,0.5853169093902086,0.4871137583409777
llm_goals_146,test,34,0.5853169093902086,0.7239974058432814
llm_goals_146,test,35,0.5853169093902086,0.4717056489178101
llm_goals_146,test,36,0.5853169093902086,0.7518023835632467
llm_goals_146,test,37,0.5853169093902086,0.4299980307715084
llm_goals_146,test,38,0.5853169093902086,0.6853837869126352
llm_goals_146,test,39,0.5853169093902086,0.3821269496784033
llm_goals_146,test,40,0.5853169093902086,0.358534933784248
llm_goals_146,test,41,0.5853169093902086,0.3237407407589303
llm_goals_146,test,42,0.5853169093902086,0.465061399698899
llm_goals_146,test,43,0.5853169093902086,0.4315601062358607
llm_goals_146,test,44,0.5853169093902086,0.5556539728312679
llm_goals_146,test,45,0.5853169093902086,0.5920740253668018
llm_goals_146,test,46,0.5853169093902086,0.4871274917312868
llm_goals_146,test,47,0.5853169093902086,0.581843033103631
llm_goals_146,test,48,0.5853169093902086,0.3075919216632473
llm_goals_146,test,49,0.5853169093902086,0.7619587682314233
llm_goals_115,test,0,0.6064370745571904,0.4434632286904964
llm_goals_115,test,1,0.6064370745571904,0.6904317046527385
llm_goals_115,test,2,0.6064370745571904,0.6516189539788452
llm_goals_115,test,3,0.6064370745571904,0.4339340266994299
llm_goals_115,test,4,0.6064370745571904,0.3268096695267067
llm_goals_115,test,5,0.6064370745571904,0.5710080860563095
llm_goals_115,test,6,0.6064370745571904,0.5525431491717658
llm_goals_115,test,7,0.6064370745571904,0.4917475457547118
llm_goals_115,test,8,0.6064370745571904,0.5222463726327303
llm_goals_115,test,9,0.6064370745571904,0.7214239291876969
llm_goals_115,test,10,0.6064370745571904,0.1423416680133991
llm_goals_115,test,11,0.6064370745571904,0.0211501267474188
llm_goals_115,test,12,0.6064370745571904,0.7876465277644278
llm_goals_115,test,13,0.6064370745571904,0.7712913027170795
llm_goals_115,test,14,0.6064370745571904,0.8433526700949283
llm_goals_115,test,15,0.6064370745571904,0.4617767241926875
llm_goals_115,test,16,0.6064370745571904,0.751642873633365
llm_goals_115,test,17,0.6064370745571904,0.5750395750632571
llm_goals_115,test,18,0.6064370745571904,0.731190860777953
llm_goals_115,test,19,0.6064370745571904,0.4010090785721757
llm_goals_115,test,20,0.6064370745571904,0.4639274084070101
llm_goals_115,test,21,0.6064370745571904,0.8439438875722727
llm_goals_115,test,22,0.6064370745571904,0.4930168575659444
llm_goals_115,test,23,0.6064370745571904,0.1606455731785788
llm_goals_115,test,24,0.6064370745571904,0.8225050510480415
llm_goals_115,test,25,0.6064370745571904,0.4682683350736841
llm_goals_115,test,26,0.6064370745571904,0.8534070288351345
llm_goals_115,test,27,0.6064370745571904,0.4742317939252941
llm_goals_115,test,28,0.6064370745571904,0.0572278600376891
llm_goals_115,test,29,0.6064370745571904,0.4907303253909411
llm_goals_115,test,30,0.6064370745571904,0.1910564822051387
llm_goals_115,test,31,0.6064370745571904,0.8779074551007869
llm_goals_115,test,32,0.6064370745571904,0.504762116367231
llm_goals_115,test,33,0.6064370745571904,0.7961870421429237
llm_goals_115,test,34,0.6064370745571904,0.3117413427150098
llm_goals_115,test,35,0.6064370745571904,0.6062498233633526
llm_goals_115,test,36,0.6064370745571904,0.5465164093133901
llm_goals_115,test,37,0.6064370745571904,0.5868361038548235
llm_goals_115,test,38,0.6064370745571904,0.3403703059415776
llm_goals_115,test,39,0.6064370745571904,0.8219108606932716
llm_goals_115,test,40,0.6064370745571904,0.1035981058362717
llm_goals_115,test,41,0.6064370745571904,0.8823458588361053
llm_goals_115,test,42,0.6064370745571904,0.2803475549795062
llm_goals_115,test,43,0.6064370745571904,0.8513012565900029
llm_goals_115,test,44,0.6064370745571904,0.7679774087348048
llm_goals_115,test,45,0.6064370745571904,0.2698108084459203
llm_goals_115,test,46,0.6064370745571904,0.0357215216493676
llm_goals_115,test,47,0.6064370745571904,0.3874775112245213
llm_goals_115,test,48,0.6064370745571904,0.7725214275580398
llm_goals_115,test,49,0.6064370745571904,0.6720584616591353
llm_goals_182,test,0,0.5608515127252434,0.8652063058172594
llm_goals_182,test,1,0.5608515127252434,0.0826947230522371
llm_goals_182,test,2,0.5608515127252434,0.798587619624287
llm_goals_182,test,3,0.5608515127252434,0.1153333326317589
llm_goals_182,test,4,0.5608515127252434,0.8911074983818299
llm_goals_182,test,5,0.5608515127252434,0.322673941983326
llm_goals_182,test,6,0.5608515127252434,0.3873713790307967
llm_goals_182,test,7,0.5608515127252434,0.7954637431338407
llm_goals_182,test,8,0.5608515127252434,0.8713126766724444
llm_goals_182,test,9,0.5608515127252434,0.3727719680238343
llm_goals_182,test,10,0.5608515127252434,0.344259508803394
llm_goals_182,test,11,0.5608515127252434,0.826409100211895
llm_goals_182,test,12,0.5608515127252434,0.6995229144237722
llm_goals_182,test,13,0.5608515127252434,0.2983322739239659
llm_goals_182,test,14,0.5608515127252434,0.1121533235192302
llm_goals_182,test,15,0.5608515127252434,0.8530130402661898
llm_goals_182,test,16,0.5608515127252434,0.140642355581753
llm_goals_182,test,17,0.5608515127252434,0.0750534295482943
llm_goals_182,test,18,0.5608515127252434,0.1021012312203676
llm_goals_182,test,19,0.5608515127252434,0.7930271065360427
llm_goals_182,test,20,0.5608515127252434,0.8727144576853948
llm_goals_182,test,21,0.5608515127252434,0.3883832635395169
llm_goals_182,test,22,0.5608515127252434,0.0858987886275301
llm_goals_182,test,23,0.5608515127252434,0.8587499834361978
llm_goals_182,test,24,0.5608515127252434,0.1529090764042953
llm_goals_182,test,25,0.5608515127252434,0.3907861244891192
llm_goals_182,test,26,0.5608515127252434,0.0898813936513848
llm_goals_182,test,27,0.5608515127252434,0.0749023763424232
llm_goals_182,test,28,0.5608515127252434,0.1190598459155961
llm_goals_182,test,29,0.5608515127252434,0.7016449528375276
llm_goals_182,test,30,0.5608515127252434,0.3981986561532387
llm_goals_182,test,31,0.5608515127252434,0.4033468376136607
llm_goals_182,test,32,0.5608515127252434,0.8175631740353995
llm_goals_182,test,33,0.5608515127252434,0.1448325966795168
llm_goals_182,test,34,0.5608515127252434,0.3547330626609051
llm_goals_182,test,35,0.5608515127252434,0.823988084949945
llm_goals_182,test,36,0.5608515127252434,0.3920453941320438
llm_goals_182,test,37,0.5608515127252434,0.7340161718404824
llm_goals_182,test,38,0.5608515127252434,0.7157883671582869
llm_goals_182,test,39,0.5608515127252434,0.6255065804950025
llm_goals_182,test,40,0.5608515127252434,0.8448494619425109
llm_goals_182,test,41,0.5608515127252434,0.3755363161560536
llm_goals_182,test,42,0.5608515127252434,0.8729538896060706
llm_goals_182,test,43,0.5608515127252434,0.3845820969466132
llm_goals_182,test,44,0.5608515127252434,0.8535886434286102
llm_goals_182,test,45,0.5608515127252434,0.1216040102965252
llm_goals_182,test,46,0.5608515127252434,0.8235719161892086
llm_goals_182,test,47,0.5608515127252434,0.1493568636498045
llm_goals_182,test,48,0.5608515127252434,0.0977336313667494
llm_goals_182,test,49,0.5608515127252434,0.1145731477706443
llm_goals_326,test,0,0.7234208944853292,0.7210679537447465
llm_goals_326,test,1,0.7234208944853292,0.3698897290610674
llm_goals_326,test,2,0.7234208944853292,0.6763902331902123
llm_goals_326,test,3,0.7234208944853292,0.6144636338527515
llm_goals_326,test,4,0.7234208944853292,0.7226604268728406
llm_goals_326,test,5,0.7234208944853292,0.225010837259175
llm_goals_326,test,6,0.7234208944853292,0.2511202974122448
llm_goals_326,test,7,0.7234208944853292,0.682107850479918
llm_goals_326,test,8,0.7234208944853292,0.7688388280774076
llm_goals_326,test,9,0.7234208944853292,0.2201601423152862
llm_goals_326,test,10,0.7234208944853292,0.5927527654534117
llm_goals_326,test,11,0.7234208944853292,0.6402653335664261
llm_goals_326,test,12,0.7234208944853292,0.5219165167657188
llm_goals_326,test,13,0.7234208944853292,0.0912598670014219
llm_goals_326,test,14,0.7234208944853292,0.6237388815231029
llm_goals_326,test,15,0.7234208944853292,0.58422994911281
llm_goals_326,test,16,0.7234208944853292,0.598158895081766
llm_goals_326,test,17,0.7234208944853292,0.3075615988754216
llm_goals_326,test,18,0.7234208944853292,0.5624766832927214
llm_goals_326,test,19,0.7234208944853292,0.5837591950755885
llm_goals_326,test,20,0.7234208944853292,0.7023531773229094
llm_goals_326,test,21,0.7234208944853292,0.2231004774292705
llm_goals_326,test,22,0.7234208944853292,0.2981176158853984
llm_goals_326,test,23,0.7234208944853292,0.5947662537107573
llm_goals_326,test,24,0.7234208944853292,0.6704973022514685
llm_goals_326,test,25,0.7234208944853292,0.7548767212573778
llm_goals_326,test,26,0.7234208944853292,0.6431580812900115
llm_goals_326,test,27,0.7234208944853292,0.3327881124528037
llm_goals_326,test,28,0.7234208944853292,0.7641554441675951
llm_goals_326,test,29,0.7234208944853292,0.4778539914575542
llm_goals_326,test,30,0.7234208944853292,0.7097294996625062
llm_goals_326,test,31,0.7234208944853292,0.2337370659971392
llm_goals_326,test,32,0.7234208944853292,0.6377238074883209
llm_goals_326,test,33,0.7234208944853292,0.6003066307923431
llm_goals_326,test,34,0.7234208944853292,0.6119511714458287
llm_goals_326,test,35,0.7234208944853292,0.5639635886155634
llm_goals_326,test,36,0.7234208944853292,0.6540181072858835
llm_goals_326,test,37,0.7234208944853292,0.6297099560404894
llm_goals_326,test,38,0.7234208944853292,0.5278265562464118
llm_goals_326,test,39,0.7234208944853292,0.5029836143581652
llm_goals_326,test,40,0.7234208944853292,0.5904794288270965
llm_goals_326,test,41,0.7234208944853292,0.2163880989100536
llm_goals_326,test,42,0.7234208944853292,0.6295586948815126
llm_goals_326,test,43,0.7234208944853292,0.2120109108404722
llm_goals_326,test,44,0.7234208944853292,0.6940786874714112
llm_goals_326,test,45,0.7234208944853292,0.6451782543850242
llm_goals_326,test,46,0.7234208944853292,0.5818721654926584
llm_goals_326,test,47,0.7234208944853292,0.6937841106268494
llm_goals_326,test,48,0.7234208944853292,0.6520763720762168
llm_goals_326,test,49,0.7234208944853292,0.3675984402598143
