template_id,split,question_idx,prediction,label
llm_goals_236,test,0,0.8857956278406323,0.9999990463256836
llm_goals_236,test,1,0.8857956278406323,0.9998601079056368
llm_goals_236,test,2,0.8857956278406323,0.9999994039535594
llm_goals_236,test,3,0.8857956278406323,0.999998450279186
llm_goals_236,test,4,0.8857956278406323,0.9999971389770508
llm_goals_236,test,5,0.8857956278406323,0.9999998211860676
llm_goals_236,test,6,0.8857956278406323,0.9999996423721385
llm_goals_236,test,7,0.8857956278406323,0.999999344348895
llm_goals_236,test,8,0.8857956278406323,0.9999988675117084
llm_goals_236,test,9,0.8857956278406323,0.9999998211860676
llm_goals_236,test,10,0.8857956278406323,0.9942808746609532
llm_goals_236,test,11,0.8857956278406323,0.9998060464816904
llm_goals_236,test,12,0.8857956278406323,0.9999784827237244
llm_goals_236,test,13,0.8857956278406323,0.9999998211860676
llm_goals_236,test,14,0.8857956278406323,0.9999877214430704
llm_goals_236,test,15,0.8857956278406323,0.9999918937684243
llm_goals_236,test,16,0.8857956278406323,0.9998958706868224
llm_goals_236,test,17,0.8857956278406323,0.9999055266407578
llm_goals_236,test,18,0.8857956278406323,0.9999948143957074
llm_goals_236,test,19,0.8857956278406323,0.0724598805251418
llm_goals_236,test,20,0.8857956278406323,0.9999921321869182
llm_goals_236,test,21,0.8857956278406323,0.9999992847442344
llm_goals_236,test,22,0.8857956278406323,0.9997341632930924
llm_goals_236,test,23,0.8857956278406323,0.9998326301518724
llm_goals_236,test,24,0.8857956278406323,0.999985396862246
llm_goals_236,test,25,0.8857956278406323,0.9778256407805812
llm_goals_236,test,26,0.8857956278406323,0.9999951124192492
llm_goals_236,test,27,0.8857956278406323,0.9285253300141496
llm_goals_236,test,28,0.8857956278406323,0.9999996423721385
llm_goals_236,test,29,0.8857956278406323,0.0552585651110835
llm_goals_236,test,30,0.8857956278406323,0.9193987256529454
llm_goals_236,test,31,0.8857956278406323,0.9999983310699748
llm_goals_236,test,32,0.8857956278406323,0.999973952771136
llm_goals_236,test,33,0.8857956278406323,0.9999884366984664
llm_goals_236,test,34,0.8857956278406323,0.9757304783109252
llm_goals_236,test,35,0.8857956278406323,0.9999988675117084
llm_goals_236,test,36,0.8857956278406323,0.9998944997781798
llm_goals_236,test,37,0.8857956278406323,0.1365288892720467
llm_goals_236,test,38,0.8857956278406323,0.719762510833872
llm_goals_236,test,39,0.8857956278406323,0.9999720454212542
llm_goals_236,test,40,0.8857956278406323,0.9984533787155216
llm_goals_236,test,41,0.8857956278406323,0.9999998211860676
llm_goals_236,test,42,0.8857956278406323,0.9999989271164011
llm_goals_236,test,43,0.8857956278406323,0.9999982714653176
llm_goals_236,test,44,0.8857956278406323,0.9999991655349802
llm_goals_236,test,45,0.8857956278406323,0.9999994635581704
llm_goals_236,test,46,0.8857956278406323,0.9999888539316992
llm_goals_236,test,47,0.8857956278406323,0.9999989271164011
llm_goals_236,test,48,0.8857956278406323,0.9999687075599843
llm_goals_236,test,49,0.8857956278406323,0.9976178406916212
llm_goals_228,test,0,0.7794968579635925,0.9999923110003712
llm_goals_228,test,1,0.7794968579635925,0.9997239112788898
llm_goals_228,test,2,0.7794968579635925,0.9999983310699748
llm_goals_228,test,3,0.7794968579635925,0.3235730208667373
llm_goals_228,test,4,0.7794968579635925,0.9999561309796544
llm_goals_228,test,5,0.7794968579635925,0.0500382433432339
llm_goals_228,test,6,0.7794968579635925,0.0325581693591018
llm_goals_228,test,7,0.7794968579635925,0.9999955296516294
llm_goals_228,test,8,0.7794968579635925,0.9999945759774836
llm_goals_228,test,9,0.7794968579635925,0.0028912413507839
llm_goals_228,test,10,0.7794968579635925,0.999972343445286
llm_goals_228,test,11,0.7794968579635925,0.2356525274624049
llm_goals_228,test,12,0.7794968579635925,0.7824152121811281
llm_goals_228,test,13,0.7794968579635925,9.272773905172216e-05
llm_goals_228,test,14,0.7794968579635925,0.999985396862246
llm_goals_228,test,15,0.7794968579635925,0.9997810721409376
llm_goals_228,test,16,0.7794968579635925,0.9999924302101154
llm_goals_228,test,17,0.7794968579635925,0.9964962600884054
llm_goals_228,test,18,0.7794968579635925,0.9999846816053862
llm_goals_228,test,19,0.7794968579635925,0.80150937475593
llm_goals_228,test,20,0.7794968579635925,0.9999823570243526
llm_goals_228,test,21,0.7794968579635925,0.7620198101590071
llm_goals_228,test,22,0.7794968579635925,0.999146759521554
llm_goals_228,test,23,0.7794968579635925,0.9753957978718134
llm_goals_228,test,24,0.7794968579635925,0.9999912381174048
llm_goals_228,test,25,0.7794968579635925,0.9997735619549886
llm_goals_228,test,26,0.7794968579635925,0.999994218349345
llm_goals_228,test,27,0.7794968579635925,0.9975230096939942
llm_goals_228,test,28,0.7794968579635925,0.0282825634665972
llm_goals_228,test,29,0.7794968579635925,0.989357948515744
llm_goals_228,test,30,0.7794968579635925,0.9999648928656788
llm_goals_228,test,31,0.7794968579635925,0.1841044242752227
llm_goals_228,test,32,0.7794968579635925,0.6401162870682584
llm_goals_228,test,33,0.7794968579635925,0.999995231628418
llm_goals_228,test,34,0.7794968579635925,0.9999182820314436
llm_goals_228,test,35,0.7794968579635925,0.999788165093598
llm_goals_228,test,36,0.7794968579635925,0.9875653984316132
llm_goals_228,test,37,0.7794968579635925,0.99879342314863
llm_goals_228,test,38,0.7794968579635925,0.9949926138514864
llm_goals_228,test,39,0.7794968579635925,0.9871301051093162
llm_goals_228,test,40,0.7794968579635925,0.9374855739864648
llm_goals_228,test,41,0.7794968579635925,0.768526607723976
llm_goals_228,test,42,0.7794968579635925,0.9999880194663172
llm_goals_228,test,43,0.7794968579635925,0.5863317957282166
llm_goals_228,test,44,0.7794968579635925,0.9999881386760048
llm_goals_228,test,45,0.7794968579635925,0.8984286803691676
llm_goals_228,test,46,0.7794968579635925,0.012311546088274
llm_goals_228,test,47,0.7794968579635925,0.0766497555033863
llm_goals_228,test,48,0.7794968579635925,0.9999973773956584
llm_goals_228,test,49,0.7794968579635925,0.939641477083989
llm_goals_397,test,0,0.6098338209052918,0.9814099073764808
llm_goals_397,test,1,0.6098338209052918,0.9999912381174048
llm_goals_397,test,2,0.6098338209052918,0.9999979138373352
llm_goals_397,test,3,0.6098338209052918,0.9999809861190028
llm_goals_397,test,4,0.6098338209052918,0.0255301341302224
llm_goals_397,test,5,0.6098338209052918,0.9999864101405658
llm_goals_397,test,6,0.6098338209052918,0.9998381137785032
llm_goals_397,test,7,0.6098338209052918,0.99997174739913
llm_goals_397,test,8,0.6098338209052918,0.130829360211786
llm_goals_397,test,9,0.6098338209052918,0.9999025464035022
llm_goals_397,test,10,0.6098338209052918,0.9995446801111892
llm_goals_397,test,11,0.6098338209052918,0.9833766826787343
llm_goals_397,test,12,0.6098338209052918,0.999996542930667
llm_goals_397,test,13,0.6098338209052918,0.999946773053646
llm_goals_397,test,14,0.6098338209052918,0.9999846816053862
llm_goals_397,test,15,0.6098338209052918,0.0066017277153082
llm_goals_397,test,16,0.6098338209052918,0.9999932646750854
llm_goals_397,test,17,0.6098338209052918,0.9999726414675878
llm_goals_397,test,18,0.6098338209052918,0.9999631643313146
llm_goals_397,test,19,0.6098338209052918,0.9990255832870808
llm_goals_397,test,20,0.6098338209052918,0.0470702684705779
llm_goals_397,test,21,0.6098338209052918,0.999989688396868
llm_goals_397,test,22,0.6098338209052918,0.9999497532844842
llm_goals_397,test,23,0.6098338209052918,0.9997248649522246
llm_goals_397,test,24,0.6098338209052918,0.9999954104424252
llm_goals_397,test,25,0.6098338209052918,0.9892253874904372
llm_goals_397,test,26,0.6098338209052918,0.9999661445600752
llm_goals_397,test,27,0.6098338209052918,0.999984502792388
llm_goals_397,test,28,0.6098338209052918,0.9999876022334326
llm_goals_397,test,29,0.6098338209052918,0.99916046856021
llm_goals_397,test,30,0.6098338209052918,0.9993026852479712
llm_goals_397,test,31,0.6098338209052918,0.999975025654656
llm_goals_397,test,32,0.6098338209052918,0.9996371865271196
llm_goals_397,test,33,0.6098338209052918,0.9999744892118428
llm_goals_397,test,34,0.6098338209052918,0.999513149271868
llm_goals_397,test,35,0.6098338209052918,0.9999858140942104
llm_goals_397,test,36,0.6098338209052918,0.9909363981874668
llm_goals_397,test,37,0.6098338209052918,0.9967403410768448
llm_goals_397,test,38,0.6098338209052918,0.9700924159576454
llm_goals_397,test,39,0.6098338209052918,0.9999973177909444
llm_goals_397,test,40,0.6098338209052918,0.8681342672732176
llm_goals_397,test,41,0.6098338209052918,0.999994218349345
llm_goals_397,test,42,0.6098338209052918,0.9999906420709002
llm_goals_397,test,43,0.6098338209052918,0.9999807476995284
llm_goals_397,test,44,0.6098338209052918,0.6356807298065411
llm_goals_397,test,45,0.6098338209052918,0.999989688396868
llm_goals_397,test,46,0.6098338209052918,0.9996384382368032
llm_goals_397,test,47,0.6098338209052918,0.9997389316595698
llm_goals_397,test,48,0.6098338209052918,0.9999530911461468
llm_goals_397,test,49,0.6098338209052918,0.9999887943268112
llm_goals_401,test,0,0.9967230575487187,0.9999994635581704
llm_goals_401,test,1,0.9967230575487187,0.9999995231628418
llm_goals_401,test,2,0.9967230575487187,0.9999994635581704
llm_goals_401,test,3,0.9967230575487187,0.9999074339856228
llm_goals_401,test,4,0.9967230575487187,0.999999940395357
llm_goals_401,test,5,0.9967230575487187,0.999999940395357
llm_goals_401,test,6,0.9967230575487187,0.999999940395357
llm_goals_401,test,7,0.9967230575487187,0.9999992847442344
llm_goals_401,test,8,0.9967230575487187,0.999999940395357
llm_goals_401,test,9,0.9967230575487187,0.9999998211860676
llm_goals_401,test,10,0.9967230575487187,0.9999995827674883
llm_goals_401,test,11,0.9967230575487187,0.9999995827674883
llm_goals_401,test,12,0.9967230575487187,0.9999995827674883
llm_goals_401,test,13,0.9967230575487187,0.9999997019767636
llm_goals_401,test,14,0.9967230575487187,0.9999986886977652
llm_goals_401,test,15,0.9967230575487187,0.9999998211860676
llm_goals_401,test,16,0.9967230575487187,0.9999991655349802
llm_goals_401,test,17,0.9967230575487187,0.9999992847442344
llm_goals_401,test,18,0.9967230575487187,0.9999995231628418
llm_goals_401,test,19,0.9967230575487187,0.9713776109091996
llm_goals_401,test,20,0.9967230575487187,0.9999998807907032
llm_goals_401,test,21,0.9967230575487187,1.0
llm_goals_401,test,22,0.9967230575487187,0.9999998807907032
llm_goals_401,test,23,0.9967230575487187,0.9999996423721385
llm_goals_401,test,24,0.9967230575487187,0.9999989867209838
llm_goals_401,test,25,0.9967230575487187,0.9999995231628418
llm_goals_401,test,26,0.9967230575487187,0.9999997615814208
llm_goals_401,test,27,0.9967230575487187,0.9999994039535594
llm_goals_401,test,28,0.9967230575487187,0.9983195662475728
llm_goals_401,test,29,0.9967230575487187,0.9993320703468634
llm_goals_401,test,30,0.9967230575487187,0.9999997019767636
llm_goals_401,test,31,0.9967230575487187,0.9999998807907032
llm_goals_401,test,32,0.9967230575487187,0.9999989271164011
llm_goals_401,test,33,0.9967230575487187,0.9999992847442344
llm_goals_401,test,34,0.9967230575487187,0.9999994635581704
llm_goals_401,test,35,0.9967230575487187,0.9999998807907032
llm_goals_401,test,36,0.9967230575487187,0.9999997019767636
llm_goals_401,test,37,0.9967230575487187,0.8060779005212295
llm_goals_401,test,38,0.9967230575487187,0.9999966025353348
llm_goals_401,test,39,0.9967230575487187,0.9999998211860676
llm_goals_401,test,40,0.9967230575487187,0.9999996423721385
llm_goals_401,test,41,0.9967230575487187,0.999999940395357
llm_goals_401,test,42,0.9967230575487187,0.9999996423721385
llm_goals_401,test,43,0.9967230575487187,0.999999940395357
llm_goals_401,test,44,0.9967230575487187,0.9999997615814208
llm_goals_401,test,45,0.9967230575487187,0.9992901682960044
llm_goals_401,test,46,0.9967230575487187,0.9999996423721385
llm_goals_401,test,47,0.9967230575487187,0.9999059438703174
llm_goals_401,test,48,0.9967230575487187,0.9999988079071328
llm_goals_401,test,49,0.9967230575487187,0.999999344348895
llm_goals_326,test,0,0.9635700468639421,0.9998103380222648
llm_goals_326,test,1,0.9635700468639421,0.1015499721104398
llm_goals_326,test,2,0.9635700468639421,0.9995523691298543
llm_goals_326,test,3,0.9635700468639421,0.9820513126171384
llm_goals_326,test,4,0.9635700468639421,0.9997708797458836
llm_goals_326,test,5,0.9635700468639421,0.0041024868608885
llm_goals_326,test,6,0.9635700468639421,0.0013792452717851
llm_goals_326,test,7,0.9635700468639421,0.9970470071684427
llm_goals_326,test,8,0.9635700468639421,0.9994441866676194
llm_goals_326,test,9,0.9635700468639421,0.058725887838439
llm_goals_326,test,10,0.9635700468639421,0.9983887672460816
llm_goals_326,test,11,0.9635700468639421,0.9773504733838247
llm_goals_326,test,12,0.9635700468639421,0.5111671721675201
llm_goals_326,test,13,0.9635700468639421,0.0023213561119498
llm_goals_326,test,14,0.9635700468639421,0.9992487430849846
llm_goals_326,test,15,0.9635700468639421,0.9998496770786612
llm_goals_326,test,16,0.9635700468639421,0.9995788335870258
llm_goals_326,test,17,0.9635700468639421,0.0289194533041716
llm_goals_326,test,18,0.9635700468639421,0.9941717982892394
llm_goals_326,test,19,0.9635700468639421,0.9898712036276838
llm_goals_326,test,20,0.9635700468639421,0.998426973781836
llm_goals_326,test,21,0.9635700468639421,0.0080112452725568
llm_goals_326,test,22,0.9635700468639421,0.0170446490301255
llm_goals_326,test,23,0.9635700468639421,0.9315074100877992
llm_goals_326,test,24,0.9635700468639421,0.9996359944310432
llm_goals_326,test,25,0.9635700468639421,0.9993702173479914
llm_goals_326,test,26,0.9635700468639421,0.99954205751167
llm_goals_326,test,27,0.9635700468639421,0.1439592978368308
llm_goals_326,test,28,0.9635700468639421,0.9782873980924596
llm_goals_326,test,29,0.9635700468639421,0.6406475907057047
llm_goals_326,test,30,0.9635700468639421,0.9997262358610556
llm_goals_326,test,31,0.9635700468639421,0.0025467661319066
llm_goals_326,test,32,0.9635700468639421,0.927265467234428
llm_goals_326,test,33,0.9635700468639421,0.9970411657688188
llm_goals_326,test,34,0.9635700468639421,0.9924188256928188
llm_goals_326,test,35,0.9635700468639421,0.9999433159814316
llm_goals_326,test,36,0.9635700468639421,0.7828563458619708
llm_goals_326,test,37,0.9635700468639421,0.9921779035200892
llm_goals_326,test,38,0.9635700468639421,0.9710912105847416
llm_goals_326,test,39,0.9635700468639421,0.9591411966937028
llm_goals_326,test,40,0.9635700468639421,0.9675343030198714
llm_goals_326,test,41,0.9635700468639421,0.0125675465450323
llm_goals_326,test,42,0.9635700468639421,0.9817813030107898
llm_goals_326,test,43,0.9635700468639421,0.0210821160744808
llm_goals_326,test,44,0.9635700468639421,0.9984526634039176
llm_goals_326,test,45,0.9635700468639421,0.7725256637892597
llm_goals_326,test,46,0.9635700468639421,0.7800079567380194
llm_goals_326,test,47,0.9635700468639421,0.9949684144438216
llm_goals_326,test,48,0.9635700468639421,0.9985677004408368
llm_goals_326,test,49,0.9635700468639421,0.045807901396548
llm_goals_415,test,0,0.9163398176110138,0.9997588992066258
llm_goals_415,test,1,0.9163398176110138,0.9999479055404636
llm_goals_415,test,2,0.9163398176110138,0.9957069754348792
llm_goals_415,test,3,0.9163398176110138,0.9998519420664436
llm_goals_415,test,4,0.9163398176110138,0.9993222355665604
llm_goals_415,test,5,0.9163398176110138,0.0031238526915668
llm_goals_415,test,6,0.9163398176110138,0.0017953563962722
llm_goals_415,test,7,0.9163398176110138,0.9612127544780552
llm_goals_415,test,8,0.9163398176110138,0.9824366570655148
llm_goals_415,test,9,0.9163398176110138,0.0016438446411424
llm_goals_415,test,10,0.9163398176110138,0.9999850988388712
llm_goals_415,test,11,0.9163398176110138,0.9989992976042504
llm_goals_415,test,12,0.9163398176110138,0.3845905785054697
llm_goals_415,test,13,0.9163398176110138,0.0001663988005876
llm_goals_415,test,14,0.9163398176110138,0.99998015165382
llm_goals_415,test,15,0.9163398176110138,0.9986550807653384
llm_goals_415,test,16,0.9163398176110138,0.9999568462370104
llm_goals_415,test,17,0.9163398176110138,0.9992712139839848
llm_goals_415,test,18,0.9163398176110138,0.9999991655349802
llm_goals_415,test,19,0.9163398176110138,0.1268431093615233
llm_goals_415,test,20,0.9163398176110138,0.9989575147526004
llm_goals_415,test,21,0.9163398176110138,0.0009023478721852
llm_goals_415,test,22,0.9163398176110138,0.9999995231628418
llm_goals_415,test,23,0.9163398176110138,0.993058026033597
llm_goals_415,test,24,0.9163398176110138,0.9999659061423206
llm_goals_415,test,25,0.9163398176110138,0.9999040365210196
llm_goals_415,test,26,0.9163398176110138,0.9999980330466104
llm_goals_415,test,27,0.9163398176110138,0.9999982118606638
llm_goals_415,test,28,0.9163398176110138,0.9999243617070486
llm_goals_415,test,29,0.9163398176110138,0.0442403483495126
llm_goals_415,test,30,0.9163398176110138,0.9996343254989244
llm_goals_415,test,31,0.9163398176110138,0.0007251523135023
llm_goals_415,test,32,0.9163398176110138,0.8080266673914581
llm_goals_415,test,33,0.9163398176110138,0.9999894499780476
llm_goals_415,test,34,0.9163398176110138,0.9994327426028377
llm_goals_415,test,35,0.9163398176110138,0.9989529847642252
llm_goals_415,test,36,0.9163398176110138,0.9999961853027344
llm_goals_415,test,37,0.9163398176110138,0.3947042465556775
llm_goals_415,test,38,0.9163398176110138,0.8703240197518964
llm_goals_415,test,39,0.9163398176110138,0.0273997177536015
llm_goals_415,test,40,0.9163398176110138,0.9999445676815596
llm_goals_415,test,41,0.9163398176110138,0.0002682073682728
llm_goals_415,test,42,0.9163398176110138,0.9981696606070336
llm_goals_415,test,43,0.9163398176110138,0.2786076155583993
llm_goals_415,test,44,0.9163398176110138,0.9965623020600424
llm_goals_415,test,45,0.9163398176110138,0.9966514706305192
llm_goals_415,test,46,0.9163398176110138,0.9965545534402274
llm_goals_415,test,47,0.9163398176110138,0.9999976754188272
llm_goals_415,test,48,0.9163398176110138,0.9999974966048696
llm_goals_415,test,49,0.9163398176110138,0.9999994635581704
llm_goals_146,test,0,0.7734401894046818,0.9937213660464576
llm_goals_146,test,1,0.7734401894046818,0.9919615387432202
llm_goals_146,test,2,0.7734401894046818,0.9951347707289916
llm_goals_146,test,3,0.7734401894046818,0.9912926556861676
llm_goals_146,test,4,0.7734401894046818,0.7208669260139297
llm_goals_146,test,5,0.7734401894046818,0.0092084125425934
llm_goals_146,test,6,0.7734401894046818,0.1369906233450708
llm_goals_146,test,7,0.7734401894046818,0.9175609963819736
llm_goals_146,test,8,0.7734401894046818,0.0841403066718625
llm_goals_146,test,9,0.7734401894046818,0.1684153143767103
llm_goals_146,test,10,0.7734401894046818,0.908113835652124
llm_goals_146,test,11,0.7734401894046818,0.8938514016497744
llm_goals_146,test,12,0.7734401894046818,0.0100032471486232
llm_goals_146,test,13,0.7734401894046818,0.0298375477746486
llm_goals_146,test,14,0.7734401894046818,0.3167174882579391
llm_goals_146,test,15,0.7734401894046818,0.927414416219921
llm_goals_146,test,16,0.7734401894046818,0.0159187313778433
llm_goals_146,test,17,0.7734401894046818,0.9978384970986696
llm_goals_146,test,18,0.7734401894046818,0.4101569026026918
llm_goals_146,test,19,0.7734401894046818,0.9986221193952473
llm_goals_146,test,20,0.7734401894046818,0.7513560649612049
llm_goals_146,test,21,0.7734401894046818,0.0021027028134696
llm_goals_146,test,22,0.7734401894046818,0.9998958110811108
llm_goals_146,test,23,0.7734401894046818,0.7051541837582169
llm_goals_146,test,24,0.7734401894046818,0.0397261476166626
llm_goals_146,test,25,0.7734401894046818,0.8227276184379292
llm_goals_146,test,26,0.7734401894046818,0.2677446993446601
llm_goals_146,test,27,0.7734401894046818,0.99998730421031
llm_goals_146,test,28,0.7734401894046818,0.492199104386424
llm_goals_146,test,29,0.7734401894046818,0.987386405278924
llm_goals_146,test,30,0.7734401894046818,0.9782173041265074
llm_goals_146,test,31,0.7734401894046818,0.0704110414375715
llm_goals_146,test,32,0.7734401894046818,0.5230369446492051
llm_goals_146,test,33,0.7734401894046818,0.3253501541923078
llm_goals_146,test,34,0.7734401894046818,0.9673128124700084
llm_goals_146,test,35,0.7734401894046818,0.9997146725628192
llm_goals_146,test,36,0.7734401894046818,0.9323108220562318
llm_goals_146,test,37,0.7734401894046818,0.9997609853775884
llm_goals_146,test,38,0.7734401894046818,0.9964783192363952
llm_goals_146,test,39,0.7734401894046818,0.0664083062639811
llm_goals_146,test,40,0.7734401894046818,0.6598511913765792
llm_goals_146,test,41,0.7734401894046818,0.1032532555810967
llm_goals_146,test,42,0.7734401894046818,0.9252474342352108
llm_goals_146,test,43,0.7734401894046818,0.2905593299202337
llm_goals_146,test,44,0.7734401894046818,0.3807617993711434
llm_goals_146,test,45,0.7734401894046818,0.972134053996152
llm_goals_146,test,46,0.7734401894046818,0.1382936231589401
llm_goals_146,test,47,0.7734401894046818,0.9162934404085756
llm_goals_146,test,48,0.7734401894046818,0.2466934390927757
llm_goals_146,test,49,0.7734401894046818,0.9999247193370324
llm_goals_293,test,0,0.9983531134248399,0.9999973177909444
llm_goals_293,test,1,0.9983531134248399,0.9999983310699748
llm_goals_293,test,2,0.9983531134248399,0.9999885559082036
llm_goals_293,test,3,0.9983531134248399,0.9996450543386908
llm_goals_293,test,4,0.9983531134248399,0.9999996423721385
llm_goals_293,test,5,0.9983531134248399,0.9999819397920116
llm_goals_293,test,6,0.9983531134248399,0.9999997019767636
llm_goals_293,test,7,0.9983531134248399,0.999996066093452
llm_goals_293,test,8,0.9983531134248399,0.9999997615814208
llm_goals_293,test,9,0.9983531134248399,0.9999495744722752
llm_goals_293,test,10,0.9983531134248399,0.9999885559082036
llm_goals_293,test,11,0.9983531134248399,0.999996721744454
llm_goals_293,test,12,0.9983531134248399,0.9999988675117084
llm_goals_293,test,13,0.9983531134248399,0.9999983906746356
llm_goals_293,test,14,0.9983531134248399,0.9999996423721385
llm_goals_293,test,15,0.9983531134248399,0.9999997615814208
llm_goals_293,test,16,0.9983531134248399,0.9999994039535594
llm_goals_293,test,17,0.9983531134248399,0.9999927282334016
llm_goals_293,test,18,0.9983531134248399,0.9999998211860676
llm_goals_293,test,19,0.9983531134248399,0.9999971985817542
llm_goals_293,test,20,0.9983531134248399,0.9999998211860676
llm_goals_293,test,21,0.9983531134248399,0.999999344348895
llm_goals_293,test,22,0.9983531134248399,0.999999225139634
llm_goals_293,test,23,0.9983531134248399,0.9999982714653176
llm_goals_293,test,24,0.9983531134248399,0.9999997019767636
llm_goals_293,test,25,0.9983531134248399,0.9999955296516294
llm_goals_293,test,26,0.9983531134248399,0.9999997615814208
llm_goals_293,test,27,0.9983531134248399,0.9999994635581704
llm_goals_293,test,28,0.9983531134248399,0.9999988675117084
llm_goals_293,test,29,0.9983531134248399,0.9999997615814208
llm_goals_293,test,30,0.9983531134248399,0.9999886751170456
llm_goals_293,test,31,0.9983531134248399,0.9999983906746356
llm_goals_293,test,32,0.9983531134248399,0.9999979734420849
llm_goals_293,test,33,0.9983531134248399,0.9999989271164011
llm_goals_293,test,34,0.9983531134248399,0.9999950528144428
llm_goals_293,test,35,0.9983531134248399,0.9999990463256836
llm_goals_293,test,36,0.9983531134248399,0.9974341988179988
llm_goals_293,test,37,0.9983531134248399,0.999947488307946
llm_goals_293,test,38,0.9983531134248399,0.9999994039535594
llm_goals_293,test,39,0.9983531134248399,0.9999996423721385
llm_goals_293,test,40,0.9983531134248399,0.9999990463256836
llm_goals_293,test,41,0.9983531134248399,0.9999995827674883
llm_goals_293,test,42,0.9983531134248399,0.999998450279186
llm_goals_293,test,43,0.9983531134248399,0.999937295915171
llm_goals_293,test,44,0.9983531134248399,0.9999994635581704
llm_goals_293,test,45,0.9983531134248399,0.9999981522560136
llm_goals_293,test,46,0.9983531134248399,0.999995648860848
llm_goals_293,test,47,0.9983531134248399,0.9999973177909444
llm_goals_293,test,48,0.9983531134248399,0.9999997019767636
llm_goals_293,test,49,0.9983531134248399,0.9999975562095944
llm_goals_230,test,0,0.999949577688939,0.9999988675117084
llm_goals_230,test,1,0.999949577688939,0.9999197721505853
llm_goals_230,test,2,0.999949577688939,0.9999986290932004
llm_goals_230,test,3,0.999949577688939,0.9999998807907032
llm_goals_230,test,4,0.999949577688939,0.9999992847442344
llm_goals_230,test,5,0.999949577688939,0.97145622955703
llm_goals_230,test,6,0.999949577688939,0.9931073785733624
llm_goals_230,test,7,0.999949577688939,0.9999989271164011
llm_goals_230,test,8,0.999949577688939,0.9999994039535594
llm_goals_230,test,9,0.999949577688939,0.999468743814106
llm_goals_230,test,10,0.999949577688939,0.9999828934677488
llm_goals_230,test,11,0.999949577688939,0.9999996423721385
llm_goals_230,test,12,0.999949577688939,0.999997794628074
llm_goals_230,test,13,0.999949577688939,0.9983894825119092
llm_goals_230,test,14,0.999949577688939,0.9999980926513672
llm_goals_230,test,15,0.999949577688939,0.9999994039535594
llm_goals_230,test,16,0.999949577688939,0.99999570846569
llm_goals_230,test,17,0.999949577688939,0.9997287988607096
llm_goals_230,test,18,0.999949577688939,0.9999986290932004
llm_goals_230,test,19,0.999949577688939,0.792201278640246
llm_goals_230,test,20,0.999949577688939,0.9999989271164011
llm_goals_230,test,21,0.999949577688939,0.9993889927972028
llm_goals_230,test,22,0.999949577688939,0.9999741315840668
llm_goals_230,test,23,0.999949577688939,0.9999991655349802
llm_goals_230,test,24,0.999949577688939,0.9999988675117084
llm_goals_230,test,25,0.999949577688939,0.9999902248378308
llm_goals_230,test,26,0.999949577688939,0.9999990463256836
llm_goals_230,test,27,0.999949577688939,0.9999489188180812
llm_goals_230,test,28,0.999949577688939,0.9999998211860676
llm_goals_230,test,29,0.999949577688939,0.9489630473854872
llm_goals_230,test,30,0.999949577688939,0.9999970197676546
llm_goals_230,test,31,0.999949577688939,0.997134745101166
llm_goals_230,test,32,0.999949577688939,0.9999995231628418
llm_goals_230,test,33,0.999949577688939,0.999997437000376
llm_goals_230,test,34,0.999949577688939,0.9999924898147656
llm_goals_230,test,35,0.999949577688939,0.9999969005585
llm_goals_230,test,36,0.999949577688939,0.9999945163727092
llm_goals_230,test,37,0.999949577688939,0.9779089689145934
llm_goals_230,test,38,0.999949577688939,0.9570343502785515
llm_goals_230,test,39,0.999949577688939,0.9999988079071328
llm_goals_230,test,40,0.999949577688939,0.9999989271164011
llm_goals_230,test,41,0.999949577688939,0.99562537655113
llm_goals_230,test,42,0.999949577688939,0.999997794628074
llm_goals_230,test,43,0.999949577688939,0.9952926635719378
llm_goals_230,test,44,0.999949577688939,0.9999994635581704
llm_goals_230,test,45,0.999949577688939,0.9999998211860676
llm_goals_230,test,46,0.999949577688939,0.9999992847442344
llm_goals_230,test,47,0.999949577688939,0.9999998211860676
llm_goals_230,test,48,0.999949577688939,0.9999990463256836
llm_goals_230,test,49,0.999949577688939,0.9998905062670348
llm_goals_115,test,0,0.9999656397102759,0.9999962449073808
llm_goals_115,test,1,0.9999656397102759,0.9999990463256836
llm_goals_115,test,2,0.9999656397102759,0.9999997019767636
llm_goals_115,test,3,0.9999656397102759,0.9999576807027534
llm_goals_115,test,4,0.9999656397102759,0.999958157538035
llm_goals_115,test,5,0.9999656397102759,0.999957859516412
llm_goals_115,test,6,0.9999656397102759,0.9999822974207612
llm_goals_115,test,7,0.9999656397102759,0.9999992847442344
llm_goals_115,test,8,0.9999656397102759,0.9999833106986686
llm_goals_115,test,9,0.9999656397102759,0.9999994635581704
llm_goals_115,test,10,0.9999656397102759,0.9999232888251398
llm_goals_115,test,11,0.9999656397102759,0.1735883698655277
llm_goals_115,test,12,0.9999656397102759,0.9999995231628418
llm_goals_115,test,13,0.9999656397102759,0.999999344348895
llm_goals_115,test,14,0.9999656397102759,0.999998450279186
llm_goals_115,test,15,0.9999656397102759,0.9952644706725092
llm_goals_115,test,16,0.9999656397102759,0.9999927878380692
llm_goals_115,test,17,0.9999656397102759,0.999998509883854
llm_goals_115,test,18,0.9999656397102759,0.9999974966048696
llm_goals_115,test,19,0.9999656397102759,0.99996823072331
llm_goals_115,test,20,0.9999656397102759,0.9999916553499876
llm_goals_115,test,21,0.9999656397102759,0.999999344348895
llm_goals_115,test,22,0.9999656397102759,0.9999989867209838
llm_goals_115,test,23,0.9999656397102759,0.9994583130121676
llm_goals_115,test,24,0.9999656397102759,0.9999986290932004
llm_goals_115,test,25,0.9999656397102759,0.9999879002575536
llm_goals_115,test,26,0.9999656397102759,0.9999988079071328
llm_goals_115,test,27,0.9999656397102759,0.9999988079071328
llm_goals_115,test,28,0.9999656397102759,0.0502507498981832
llm_goals_115,test,29,0.9999656397102759,0.999960899353502
llm_goals_115,test,30,0.9999656397102759,0.9999914169306978
llm_goals_115,test,31,0.9999656397102759,0.9999992847442344
llm_goals_115,test,32,0.9999656397102759,0.9999759793274372
llm_goals_115,test,33,0.9999656397102759,0.9999992847442344
llm_goals_115,test,34,0.9999656397102759,0.9999864101405658
llm_goals_115,test,35,0.9999656397102759,0.999999344348895
llm_goals_115,test,36,0.9999656397102759,0.999999344348895
llm_goals_115,test,37,0.9999656397102759,0.9999979734420849
llm_goals_115,test,38,0.9999656397102759,0.9999599456769136
llm_goals_115,test,39,0.9999656397102759,0.999999344348895
llm_goals_115,test,40,0.9999656397102759,0.9998471736847392
llm_goals_115,test,41,0.9999656397102759,0.9999997615814208
llm_goals_115,test,42,0.9999656397102759,0.9999936819076042
llm_goals_115,test,43,0.9999656397102759,0.9999994039535594
llm_goals_115,test,44,0.9999656397102759,0.9999966621397788
llm_goals_115,test,45,0.9999656397102759,0.9908538461901172
llm_goals_115,test,46,0.9999656397102759,0.5668339122107139
llm_goals_115,test,47,0.9999656397102759,0.999965012074428
llm_goals_115,test,48,0.9999656397102759,0.9999986290932004
llm_goals_115,test,49,0.9999656397102759,0.9999966025353348
llm_goals_86,test,0,0.9470218735581555,0.9999950528144428
llm_goals_86,test,1,0.9470218735581555,0.9733920102032824
llm_goals_86,test,2,0.9470218735581555,0.9999997019767636
llm_goals_86,test,3,0.9470218735581555,0.9999989867209838
llm_goals_86,test,4,0.9470218735581555,0.9999939203260696
llm_goals_86,test,5,0.9470218735581555,0.9799200289999128
llm_goals_86,test,6,0.9470218735581555,0.9999989271164011
llm_goals_86,test,7,0.9470218735581555,0.9999911785123744
llm_goals_86,test,8,0.9470218735581555,0.9906920788388957
llm_goals_86,test,9,0.9470218735581555,0.960079549439269
llm_goals_86,test,10,0.9470218735581555,0.9999979734420849
llm_goals_86,test,11,0.9470218735581555,0.998329818271824
llm_goals_86,test,12,0.9470218735581555,0.9999976158140952
llm_goals_86,test,13,0.9470218735581555,0.997893571823832
llm_goals_86,test,14,0.9470218735581555,0.9994581937511068
llm_goals_86,test,15,0.9470218735581555,0.9993743300463472
llm_goals_86,test,16,0.9470218735581555,0.9959942101456876
llm_goals_86,test,17,0.9470218735581555,0.9989233016552924
llm_goals_86,test,18,0.9470218735581555,0.999989688396868
llm_goals_86,test,19,0.9470218735581555,0.99977147578688
llm_goals_86,test,20,0.9470218735581555,0.999986886977724
llm_goals_86,test,21,0.9470218735581555,0.9995875954544448
llm_goals_86,test,22,0.9470218735581555,0.9998529553413918
llm_goals_86,test,23,0.9470218735581555,0.9999995827674883
llm_goals_86,test,24,0.9470218735581555,0.98040735685252
llm_goals_86,test,25,0.9470218735581555,0.9999257922204762
llm_goals_86,test,26,0.9470218735581555,0.9992931485112122
llm_goals_86,test,27,0.9470218735581555,0.999970734120207
llm_goals_86,test,28,0.9470218735581555,0.9998175501809444
llm_goals_86,test,29,0.9470218735581555,0.9995185136816022
llm_goals_86,test,30,0.9470218735581555,0.9807010897549824
llm_goals_86,test,31,0.9470218735581555,0.9998762011476526
llm_goals_86,test,32,0.9470218735581555,0.9988895059174044
llm_goals_86,test,33,0.9470218735581555,0.9999738931662266
llm_goals_86,test,34,0.9470218735581555,0.9977411627147142
llm_goals_86,test,35,0.9470218735581555,0.9999870657920578
llm_goals_86,test,36,0.9470218735581555,0.9994595050999702
llm_goals_86,test,37,0.9470218735581555,0.9993578791799612
llm_goals_86,test,38,0.9470218735581555,0.9999866485595712
llm_goals_86,test,39,0.9470218735581555,0.99997985362928
llm_goals_86,test,40,0.9470218735581555,0.999995470046798
llm_goals_86,test,41,0.9470218735581555,0.99996912479408
llm_goals_86,test,42,0.9470218735581555,0.9999997615814208
llm_goals_86,test,43,0.9470218735581555,0.9999995827674883
llm_goals_86,test,44,0.9470218735581555,0.997135043199176
llm_goals_86,test,45,0.9470218735581555,0.9999841451646688
llm_goals_86,test,46,0.9470218735581555,0.3364333057002893
llm_goals_86,test,47,0.9470218735581555,0.9991943836221492
llm_goals_86,test,48,0.9470218735581555,0.9999958872793276
llm_goals_86,test,49,0.9470218735581555,0.999995648860848
llm_goals_281,test,0,0.9592691862824174,0.9996947049971306
llm_goals_281,test,1,0.9592691862824174,0.9999986290932004
llm_goals_281,test,2,0.9592691862824174,0.9983671307551129
llm_goals_281,test,3,0.9592691862824174,0.993962764832135
llm_goals_281,test,4,0.9592691862824174,0.9999989271164011
llm_goals_281,test,5,0.9592691862824174,0.9999997019767636
llm_goals_281,test,6,0.9592691862824174,0.9999997019767636
llm_goals_281,test,7,0.9592691862824174,0.973559082090764
llm_goals_281,test,8,0.9592691862824174,0.9999968409538144
llm_goals_281,test,9,0.9592691862824174,0.9999994635581704
llm_goals_281,test,10,0.9592691862824174,0.9999997019767636
llm_goals_281,test,11,0.9592691862824174,0.9999951720236044
llm_goals_281,test,12,0.9592691862824174,0.9999264478667818
llm_goals_281,test,13,0.9592691862824174,0.9999998807907032
llm_goals_281,test,14,0.9592691862824174,0.9999976158140952
llm_goals_281,test,15,0.9592691862824174,0.9999992847442344
llm_goals_281,test,16,0.9592691862824174,0.9999986886977652
llm_goals_281,test,17,0.9592691862824174,0.9999985694885254
llm_goals_281,test,18,0.9592691862824174,0.999999344348895
llm_goals_281,test,19,0.9592691862824174,2.503036581908297e-05
llm_goals_281,test,20,0.9592691862824174,0.999996542930667
llm_goals_281,test,21,0.9592691862824174,0.9999997615814208
llm_goals_281,test,22,0.9592691862824174,0.9999986886977652
llm_goals_281,test,23,0.9592691862824174,0.999999344348895
llm_goals_281,test,24,0.9592691862824174,0.9999715089800396
llm_goals_281,test,25,0.9592691862824174,0.9999983310699748
llm_goals_281,test,26,0.9592691862824174,0.9999986290932004
llm_goals_281,test,27,0.9592691862824174,0.9999990463256836
llm_goals_281,test,28,0.9592691862824174,0.8906972993247301
llm_goals_281,test,29,0.9592691862824174,7.346078924151352e-05
llm_goals_281,test,30,0.9592691862824174,0.9999995827674883
llm_goals_281,test,31,0.9592691862824174,0.9999997019767636
llm_goals_281,test,32,0.9592691862824174,0.99999910593033
llm_goals_281,test,33,0.9592691862824174,0.9999994039535594
llm_goals_281,test,34,0.9592691862824174,0.9999989867209838
llm_goals_281,test,35,0.9592691862824174,0.9934774041946208
llm_goals_281,test,36,0.9592691862824174,0.9999990463256836
llm_goals_281,test,37,0.9592691862824174,3.4259730994143734e-05
llm_goals_281,test,38,0.9592691862824174,0.3148602040230503
llm_goals_281,test,39,0.9592691862824174,0.9940564630440718
llm_goals_281,test,40,0.9592691862824174,0.999999344348895
llm_goals_281,test,41,0.9592691862824174,0.9999998211860676
llm_goals_281,test,42,0.9592691862824174,0.999860048294782
llm_goals_281,test,43,0.9592691862824174,0.9999997019767636
llm_goals_281,test,44,0.9592691862824174,0.9999992847442344
llm_goals_281,test,45,0.9592691862824174,0.9728845352464304
llm_goals_281,test,46,0.9592691862824174,0.9999996423721385
llm_goals_281,test,47,0.9592691862824174,0.999986290931994
llm_goals_281,test,48,0.9592691862824174,0.9999994039535594
llm_goals_281,test,49,0.9592691862824174,0.999999344348895
llm_goals_182,test,0,0.7328947647114809,0.9999994039535594
llm_goals_182,test,1,0.7328947647114809,0.0005625917030918
llm_goals_182,test,2,0.7328947647114809,0.9999986886977652
llm_goals_182,test,3,0.7328947647114809,7.296223953885346e-06
llm_goals_182,test,4,0.7328947647114809,0.9999976158140952
llm_goals_182,test,5,0.7328947647114809,0.003103044503552
llm_goals_182,test,6,0.7328947647114809,0.0119719938396825
llm_goals_182,test,7,0.7328947647114809,0.9999994635581704
llm_goals_182,test,8,0.7328947647114809,0.9999964833260028
llm_goals_182,test,9,0.7328947647114809,0.0113900113927541
llm_goals_182,test,10,0.7328947647114809,0.9961416126209276
llm_goals_182,test,11,0.7328947647114809,0.999994337558862
llm_goals_182,test,12,0.7328947647114809,0.0378442217787105
llm_goals_182,test,13,0.7328947647114809,0.0008868430627717
llm_goals_182,test,14,0.7328947647114809,0.0008985942545946
llm_goals_182,test,15,0.7328947647114809,0.9999988675117084
llm_goals_182,test,16,0.7328947647114809,0.0033689156613595
llm_goals_182,test,17,0.7328947647114809,0.0006440135974187
llm_goals_182,test,18,0.7328947647114809,0.0016946532068186
llm_goals_182,test,19,0.7328947647114809,0.9999406933800118
llm_goals_182,test,20,0.7328947647114809,0.99999910593033
llm_goals_182,test,21,0.7328947647114809,0.006514652424738
llm_goals_182,test,22,0.7328947647114809,0.0008693644862334
llm_goals_182,test,23,0.7328947647114809,0.9999617934213552
llm_goals_182,test,24,0.7328947647114809,0.0038374716596311
llm_goals_182,test,25,0.7328947647114809,0.9941936732536844
llm_goals_182,test,26,0.7328947647114809,0.001039830413279
llm_goals_182,test,27,0.7328947647114809,0.0007135811001391
llm_goals_182,test,28,0.7328947647114809,7.789882184923891e-06
llm_goals_182,test,29,0.7328947647114809,0.999957442283379
llm_goals_182,test,30,0.7328947647114809,0.9981520175441102
llm_goals_182,test,31,0.7328947647114809,0.0117830754540077
llm_goals_182,test,32,0.7328947647114809,0.9999659657485728
llm_goals_182,test,33,0.7328947647114809,0.003031636673792
llm_goals_182,test,34,0.7328947647114809,0.9774106140350124
llm_goals_182,test,35,0.7328947647114809,0.9999996423721385
llm_goals_182,test,36,0.7328947647114809,0.9979310631755344
llm_goals_182,test,37,0.7328947647114809,0.9998408556030968
llm_goals_182,test,38,0.7328947647114809,0.999994218349345
llm_goals_182,test,39,0.7328947647114809,0.1486108277942357
llm_goals_182,test,40,0.7328947647114809,0.9999673962596765
llm_goals_182,test,41,0.7328947647114809,0.0004129864967066
llm_goals_182,test,42,0.7328947647114809,0.9999995231628418
llm_goals_182,test,43,0.7328947647114809,0.0046706145770988
llm_goals_182,test,44,0.7328947647114809,0.9999978542328164
llm_goals_182,test,45,0.7328947647114809,1.853969397415038e-05
llm_goals_182,test,46,0.7328947647114809,0.9999624490730772
llm_goals_182,test,47,0.7328947647114809,2.5724993639382006e-05
llm_goals_182,test,48,0.7328947647114809,0.0005832931102604
llm_goals_182,test,49,0.7328947647114809,0.0013167466449808
llm_goals_438,test,0,0.9502779692135944,0.0127917126432779
llm_goals_438,test,1,0.9502779692135944,0.9999138712868518
llm_goals_438,test,2,0.9502779692135944,0.001266465311242
llm_goals_438,test,3,0.9502779692135944,0.9997649192827218
llm_goals_438,test,4,0.9502779692135944,0.995094418582848
llm_goals_438,test,5,0.9502779692135944,0.9676808127608026
llm_goals_438,test,6,0.9502779692135944,0.9681100847526048
llm_goals_438,test,7,0.9502779692135944,0.1433627923531326
llm_goals_438,test,8,0.9502779692135944,0.9999272823362588
llm_goals_438,test,9,0.9502779692135944,0.3346369990700403
llm_goals_438,test,10,0.9502779692135944,0.0032511657787224
llm_goals_438,test,11,0.9502779692135944,0.9991979598760046
llm_goals_438,test,12,0.9502779692135944,0.9979441166238928
llm_goals_438,test,13,0.9502779692135944,0.1369715342565285
llm_goals_438,test,14,0.9502779692135944,0.9999860525130736
llm_goals_438,test,15,0.9502779692135944,0.9995588660290228
llm_goals_438,test,16,0.9502779692135944,0.9999721646308564
llm_goals_438,test,17,0.9502779692135944,0.9999966025353348
llm_goals_438,test,18,0.9502779692135944,0.9999983906746356
llm_goals_438,test,19,0.9502779692135944,0.9999996423721385
llm_goals_438,test,20,0.9502779692135944,0.9997635483790388
llm_goals_438,test,21,0.9502779692135944,0.9481995120869072
llm_goals_438,test,22,0.9502779692135944,0.9999990463256836
llm_goals_438,test,23,0.9502779692135944,0.9995222687768196
llm_goals_438,test,24,0.9502779692135944,0.999998450279186
llm_goals_438,test,25,0.9502779692135944,0.0119505141994216
llm_goals_438,test,26,0.9502779692135944,0.9546977279083356
llm_goals_438,test,27,0.9502779692135944,0.9999922513961864
llm_goals_438,test,28,0.9502779692135944,0.9999902844428042
llm_goals_438,test,29,0.9502779692135944,0.9999998211860676
llm_goals_438,test,30,0.9502779692135944,0.0012244399528321
llm_goals_438,test,31,0.9502779692135944,0.9598621719385948
llm_goals_438,test,32,0.9502779692135944,0.9979359506472824
llm_goals_438,test,33,0.9502779692135944,0.9999122619631158
llm_goals_438,test,34,0.9502779692135944,0.0033786082834978
llm_goals_438,test,35,0.9502779692135944,0.7030742694516781
llm_goals_438,test,36,0.9502779692135944,0.0009362307836721
llm_goals_438,test,37,0.9502779692135944,0.9999994635581704
llm_goals_438,test,38,0.9502779692135944,0.9999997019767636
llm_goals_438,test,39,0.9502779692135944,0.0899507873745254
llm_goals_438,test,40,0.9502779692135944,0.8368337146398075
llm_goals_438,test,41,0.9502779692135944,0.9687532202387088
llm_goals_438,test,42,0.9502779692135944,0.001642352875252
llm_goals_438,test,43,0.9502779692135944,0.994022190528956
llm_goals_438,test,44,0.9502779692135944,0.999978065491181
llm_goals_438,test,45,0.9502779692135944,0.9999783635133692
llm_goals_438,test,46,0.9502779692135944,0.9999961853027344
llm_goals_438,test,47,0.9502779692135944,0.9998934864975054
llm_goals_438,test,48,0.9502779692135944,0.9999979734420849
llm_goals_438,test,49,0.9502779692135944,0.9999861717225268
llm_goals_206,test,0,0.6255354657048874,0.9991406798194884
llm_goals_206,test,1,0.6255354657048874,0.7026181814697341
llm_goals_206,test,2,0.6255354657048874,0.9495592135330754
llm_goals_206,test,3,0.6255354657048874,0.4597382924578109
llm_goals_206,test,4,0.6255354657048874,0.456834747394902
llm_goals_206,test,5,0.6255354657048874,0.0069897250631233
llm_goals_206,test,6,0.6255354657048874,0.1198500283021958
llm_goals_206,test,7,0.6255354657048874,0.9853912589369151
llm_goals_206,test,8,0.6255354657048874,0.9858354928324288
llm_goals_206,test,9,0.6255354657048874,0.7676771375411302
llm_goals_206,test,10,0.6255354657048874,6.0325856974144665e-05
llm_goals_206,test,11,0.6255354657048874,0.9932408335154868
llm_goals_206,test,12,0.6255354657048874,0.87151349073003
llm_goals_206,test,13,0.6255354657048874,4.2185384445727474e-05
llm_goals_206,test,14,0.6255354657048874,0.8643435780923203
llm_goals_206,test,15,0.6255354657048874,0.3192446879498265
llm_goals_206,test,16,0.6255354657048874,0.8269734919284588
llm_goals_206,test,17,0.6255354657048874,0.9885780813553218
llm_goals_206,test,18,0.6255354657048874,0.004661507854032
llm_goals_206,test,19,0.6255354657048874,2.09967085772139e-05
llm_goals_206,test,20,0.6255354657048874,0.98699533957105
llm_goals_206,test,21,0.6255354657048874,0.9343360672856648
llm_goals_206,test,22,0.6255354657048874,0.0175621316229822
llm_goals_206,test,23,0.6255354657048874,0.8257364630087937
llm_goals_206,test,24,0.6255354657048874,0.9999812841420614
llm_goals_206,test,25,0.6255354657048874,0.5058550948948065
llm_goals_206,test,26,0.6255354657048874,0.993140757045314
llm_goals_206,test,27,0.6255354657048874,2.2270664938206257e-05
llm_goals_206,test,28,0.6255354657048874,0.950193582732028
llm_goals_206,test,29,0.6255354657048874,0.9696497918757307
llm_goals_206,test,30,0.6255354657048874,0.0026329471014817
llm_goals_206,test,31,0.6255354657048874,0.892615734505986
llm_goals_206,test,32,0.6255354657048874,0.6161747460126132
llm_goals_206,test,33,0.6255354657048874,0.0330446953951764
llm_goals_206,test,34,0.6255354657048874,0.9667759539880174
llm_goals_206,test,35,0.6255354657048874,0.9067099130837172
llm_goals_206,test,36,0.6255354657048874,0.9999364614518882
llm_goals_206,test,37,0.6255354657048874,3.930535533630151e-05
llm_goals_206,test,38,0.6255354657048874,0.8118365412646018
llm_goals_206,test,39,0.6255354657048874,0.6533351590647749
llm_goals_206,test,40,0.6255354657048874,1.0367098236044126e-05
llm_goals_206,test,41,0.6255354657048874,0.9999849200248888
llm_goals_206,test,42,0.6255354657048874,0.9495081916810176
llm_goals_206,test,43,0.6255354657048874,0.967551113836368
llm_goals_206,test,44,0.6255354657048874,0.0156578839862262
llm_goals_206,test,45,0.6255354657048874,0.0016468393065651
llm_goals_206,test,46,0.6255354657048874,0.0561833196086265
llm_goals_206,test,47,0.6255354657048874,8.951690490961762e-05
llm_goals_206,test,48,0.6255354657048874,0.3268218248822932
llm_goals_206,test,49,0.6255354657048874,0.0047424109160671
