template_id,split,question_idx,prediction,label
llm_goals_236,test,0,0.9999997019767636,0.9999990463256836
llm_goals_236,test,1,0.9998456835792138,0.9998601079056368
llm_goals_236,test,2,0.9999997019767636,0.9999994039535594
llm_goals_236,test,3,0.9997988343186986,0.999998450279186
llm_goals_236,test,4,0.9999963641166848,0.9999971389770508
llm_goals_236,test,5,0.9999997019767636,0.9999998211860676
llm_goals_236,test,6,0.9999997019767636,0.9999996423721385
llm_goals_236,test,7,0.9999997019767636,0.999999344348895
llm_goals_236,test,8,0.9999548196776498,0.9999988675117084
llm_goals_236,test,9,0.9999998211860676,0.9999998211860676
llm_goals_236,test,10,0.9544473884056286,0.9942808746609532
llm_goals_236,test,11,0.9999996423721385,0.9998060464816904
llm_goals_236,test,12,0.9999979734420849,0.9999784827237244
llm_goals_236,test,13,0.9999997019767636,0.9999998211860676
llm_goals_236,test,14,0.0658720040901912,0.9999877214430704
llm_goals_236,test,15,0.9999198913575932,0.9999918937684243
llm_goals_236,test,16,0.999994397163171,0.9998958706868224
llm_goals_236,test,17,0.0692839614704294,0.9999055266407578
llm_goals_236,test,18,0.0707097485657529,0.9999948143957074
llm_goals_236,test,19,0.9999797344205802,0.0724598805251418
llm_goals_236,test,20,0.9862641694878852,0.9999921321869182
llm_goals_236,test,21,0.9999995827674883,0.9999992847442344
llm_goals_236,test,22,0.999999344348895,0.9997341632930924
llm_goals_236,test,23,0.9999997019767636,0.9998326301518724
llm_goals_236,test,24,0.0692839614704294,0.999985396862246
llm_goals_236,test,25,0.9544473884056286,0.9778256407805812
llm_goals_236,test,26,0.9999906420709002,0.9999951124192492
llm_goals_236,test,27,0.0692839614704294,0.9285253300141496
llm_goals_236,test,28,0.9999998807907032,0.9999996423721385
llm_goals_236,test,29,0.9999996423721385,0.0552585651110835
llm_goals_236,test,30,0.5563546942186555,0.9193987256529454
llm_goals_236,test,31,0.9999709725372938,0.9999983310699748
llm_goals_236,test,32,0.9999858140942104,0.999973952771136
llm_goals_236,test,33,0.9999830126768252,0.9999884366984664
llm_goals_236,test,34,0.9413548105625718,0.9757304783109252
llm_goals_236,test,35,0.9999997019767636,0.9999988675117084
llm_goals_236,test,36,0.9994282126700658,0.9998944997781798
llm_goals_236,test,37,0.9999797344205802,0.1365288892720467
llm_goals_236,test,38,0.9999988675117084,0.719762510833872
llm_goals_236,test,39,0.999994099140297,0.9999720454212542
llm_goals_236,test,40,0.999981403350946,0.9984533787155216
llm_goals_236,test,41,0.9999997019767636,0.9999998211860676
llm_goals_236,test,42,0.9999997019767636,0.9999989271164011
llm_goals_236,test,43,0.9999997019767636,0.9999982714653176
llm_goals_236,test,44,0.1117761043486536,0.9999991655349802
llm_goals_236,test,45,0.0195412785509914,0.9999994635581704
llm_goals_236,test,46,0.9999979734420849,0.9999888539316992
llm_goals_236,test,47,0.2600221241325686,0.9999989271164011
llm_goals_236,test,48,0.9999672770506428,0.9999687075599843
llm_goals_236,test,49,0.1117761043486536,0.9976178406916212
llm_goals_228,test,0,0.3651794439901545,0.9999923110003712
llm_goals_228,test,1,0.0368960100986097,0.9997239112788898
llm_goals_228,test,2,0.6657766169140295,0.9999983310699748
llm_goals_228,test,3,0.2759552088687312,0.3235730208667373
llm_goals_228,test,4,0.0368960100986097,0.9999561309796544
llm_goals_228,test,5,0.0117672640712041,0.0500382433432339
llm_goals_228,test,6,0.0002711790209174,0.0325581693591018
llm_goals_228,test,7,0.1267842423307981,0.9999955296516294
llm_goals_228,test,8,0.9999628663045615,0.9999945759774836
llm_goals_228,test,9,0.9215878856881934,0.0028912413507839
llm_goals_228,test,10,0.0227561110367086,0.999972343445286
llm_goals_228,test,11,0.0101573020731447,0.2356525274624049
llm_goals_228,test,12,0.9311889408011224,0.7824152121811281
llm_goals_228,test,13,0.9999458789810336,9.272773905172216e-05
llm_goals_228,test,14,0.9764576559405816,0.999985396862246
llm_goals_228,test,15,0.8816398977736623,0.9997810721409376
llm_goals_228,test,16,0.9999946951865883,0.9999924302101154
llm_goals_228,test,17,0.9999849200248888,0.9964962600884054
llm_goals_228,test,18,0.9999946951865883,0.9999846816053862
llm_goals_228,test,19,0.999984383583134,0.80150937475593
llm_goals_228,test,20,0.0855834260377811,0.9999823570243526
llm_goals_228,test,21,0.9972915648548224,0.7620198101590071
llm_goals_228,test,22,0.99201571951911,0.999146759521554
llm_goals_228,test,23,0.0855834260377811,0.9753957978718134
llm_goals_228,test,24,0.0190664862530615,0.9999912381174048
llm_goals_228,test,25,0.0229286300468708,0.9997735619549886
llm_goals_228,test,26,0.0011133973949371,0.999994218349345
llm_goals_228,test,27,0.9999859929083526,0.9975230096939942
llm_goals_228,test,28,0.9905846711402768,0.0282825634665972
llm_goals_228,test,29,0.9999788999564418,0.989357948515744
llm_goals_228,test,30,0.0003097251082973,0.9999648928656788
llm_goals_228,test,31,0.9999918341633552,0.1841044242752227
llm_goals_228,test,32,0.1267842423307981,0.6401162870682584
llm_goals_228,test,33,0.9999946951865883,0.999995231628418
llm_goals_228,test,34,0.0033051037114815,0.9999182820314436
llm_goals_228,test,35,0.9297304128949796,0.999788165093598
llm_goals_228,test,36,0.99989032745087,0.9875653984316132
llm_goals_228,test,37,0.3651794439901545,0.99879342314863
llm_goals_228,test,38,0.7145846469328722,0.9949926138514864
llm_goals_228,test,39,0.9297304128949796,0.9871301051093162
llm_goals_228,test,40,0.981050729114242,0.9374855739864648
llm_goals_228,test,41,0.7533057448689202,0.768526607723976
llm_goals_228,test,42,0.9999858140942104,0.9999880194663172
llm_goals_228,test,43,0.9999859333036348,0.5863317957282166
llm_goals_228,test,44,0.9999921321869182,0.9999881386760048
llm_goals_228,test,45,0.3130094081738239,0.8984286803691676
llm_goals_228,test,46,0.9533845772071362,0.012311546088274
llm_goals_228,test,47,0.0011133973949371,0.0766497555033863
llm_goals_228,test,48,0.0147535732700302,0.9999973773956584
llm_goals_228,test,49,0.9932094811245052,0.939641477083989
llm_goals_397,test,0,0.9999858736989208,0.9814099073764808
llm_goals_397,test,1,0.043130386469839,0.9999912381174048
llm_goals_397,test,2,0.0587736518307726,0.9999979138373352
llm_goals_397,test,3,0.9996868372021046,0.9999809861190028
llm_goals_397,test,4,0.1668342760540509,0.0255301341302224
llm_goals_397,test,5,0.9999573826776348,0.9999864101405658
llm_goals_397,test,6,0.997873365865664,0.9998381137785032
llm_goals_397,test,7,0.9999858736989208,0.99997174739913
llm_goals_397,test,8,0.0418199918750143,0.130829360211786
llm_goals_397,test,9,0.0181501820511032,0.9999025464035022
llm_goals_397,test,10,0.0284022495833814,0.9995446801111892
llm_goals_397,test,11,0.0181501820511032,0.9833766826787343
llm_goals_397,test,12,0.9998869895913725,0.999996542930667
llm_goals_397,test,13,0.0572053788375615,0.999946773053646
llm_goals_397,test,14,0.9999804496766298,0.9999846816053862
llm_goals_397,test,15,0.043130386469839,0.0066017277153082
llm_goals_397,test,16,0.031147640270006,0.9999932646750854
llm_goals_397,test,17,0.9997357130104304,0.9999726414675878
llm_goals_397,test,18,0.999972403050103,0.9999631643313146
llm_goals_397,test,19,0.0572053788375615,0.9990255832870808
llm_goals_397,test,20,0.5277264571096292,0.0470702684705779
llm_goals_397,test,21,0.9999585747713666,0.999989688396868
llm_goals_397,test,22,0.0587736518307726,0.9999497532844842
llm_goals_397,test,23,0.1214980593318017,0.9997248649522246
llm_goals_397,test,24,0.9999804496766298,0.9999954104424252
llm_goals_397,test,25,0.9971730709279916,0.9892253874904372
llm_goals_397,test,26,0.0055503521129896,0.9999661445600752
llm_goals_397,test,27,0.0108113761393381,0.999984502792388
llm_goals_397,test,28,0.0090501220468409,0.9999876022334326
llm_goals_397,test,29,0.997873365865664,0.99916046856021
llm_goals_397,test,30,0.1592366467117022,0.9993026852479712
llm_goals_397,test,31,0.9999573826776348,0.999975025654656
llm_goals_397,test,32,0.0213679253663005,0.9996371865271196
llm_goals_397,test,33,0.1576879666038143,0.9999744892118428
llm_goals_397,test,34,0.9979307650718996,0.999513149271868
llm_goals_397,test,35,0.9999858736989208,0.9999858140942104
llm_goals_397,test,36,0.043130386469839,0.9909363981874668
llm_goals_397,test,37,0.047299853838797,0.9967403410768448
llm_goals_397,test,38,0.997873365865664,0.9700924159576454
llm_goals_397,test,39,0.9998869895913725,0.9999973177909444
llm_goals_397,test,40,0.0274103222178659,0.8681342672732176
llm_goals_397,test,41,0.9999822974207612,0.999994218349345
llm_goals_397,test,42,0.0587736518307726,0.9999906420709002
llm_goals_397,test,43,0.0271702465297832,0.9999807476995284
llm_goals_397,test,44,0.864069875804333,0.6356807298065411
llm_goals_397,test,45,0.0022058087180333,0.999989688396868
llm_goals_397,test,46,0.0236038651040782,0.9996384382368032
llm_goals_397,test,47,0.999625802045809,0.9997389316595698
llm_goals_397,test,48,0.9999804496766298,0.9999530911461468
llm_goals_397,test,49,0.0140560976313271,0.9999887943268112
llm_goals_401,test,0,0.9999955892564644,0.9999994635581704
llm_goals_401,test,1,0.99999910593033,0.9999995231628418
llm_goals_401,test,2,0.9999988079071328,0.9999994635581704
llm_goals_401,test,3,0.99984550476379,0.9999074339856228
llm_goals_401,test,4,0.9999997019767636,0.999999940395357
llm_goals_401,test,5,0.9999997615814208,0.999999940395357
llm_goals_401,test,6,0.9999998211860676,0.999999940395357
llm_goals_401,test,7,0.9999994039535594,0.9999992847442344
llm_goals_401,test,8,0.9999998807907032,0.999999940395357
llm_goals_401,test,9,0.9999997615814208,0.9999998211860676
llm_goals_401,test,10,0.9953570962274482,0.9999995827674883
llm_goals_401,test,11,0.9999970197676546,0.9999995827674883
llm_goals_401,test,12,0.9999995231628418,0.9999995827674883
llm_goals_401,test,13,0.9999997615814208,0.9999997019767636
llm_goals_401,test,14,0.9937143921530034,0.9999986886977652
llm_goals_401,test,15,0.9999998211860676,0.9999998211860676
llm_goals_401,test,16,0.9999926686287371,0.9999991655349802
llm_goals_401,test,17,0.9999997615814208,0.9999992847442344
llm_goals_401,test,18,0.9937143921530034,0.9999995231628418
llm_goals_401,test,19,0.9999994039535594,0.9713776109091996
llm_goals_401,test,20,0.9999997019767636,0.9999998807907032
llm_goals_401,test,21,0.9999997615814208,1.0
llm_goals_401,test,22,0.9999953508376008,0.9999998807907032
llm_goals_401,test,23,0.9999948143957074,0.9999996423721385
llm_goals_401,test,24,0.9999903440477812,0.9999989867209838
llm_goals_401,test,25,0.9999997019767636,0.9999995231628418
llm_goals_401,test,26,0.9937143921530034,0.9999997615814208
llm_goals_401,test,27,0.9999980926513672,0.9999994039535594
llm_goals_401,test,28,0.9999889135356814,0.9983195662475728
llm_goals_401,test,29,0.9999876022334326,0.9993320703468634
llm_goals_401,test,30,0.9999995827674883,0.9999997019767636
llm_goals_401,test,31,0.9999998211860676,0.9999998807907032
llm_goals_401,test,32,0.9999994039535594,0.9999989271164011
llm_goals_401,test,33,0.999957323075532,0.9999992847442344
llm_goals_401,test,34,0.9999995827674883,0.9999994635581704
llm_goals_401,test,35,0.9999740719791466,0.9999998807907032
llm_goals_401,test,36,0.9999983310699748,0.9999997019767636
llm_goals_401,test,37,0.9993956685328474,0.8060779005212295
llm_goals_401,test,38,0.9999997019767636,0.9999966025353348
llm_goals_401,test,39,0.9999995231628418,0.9999998211860676
llm_goals_401,test,40,0.9999986290932004,0.9999996423721385
llm_goals_401,test,41,0.9999998211860676,0.999999940395357
llm_goals_401,test,42,0.9999953508376008,0.9999996423721385
llm_goals_401,test,43,0.9999997615814208,0.999999940395357
llm_goals_401,test,44,0.9999998211860676,0.9999997615814208
llm_goals_401,test,45,0.999787747862263,0.9992901682960044
llm_goals_401,test,46,0.999994158744592,0.9999996423721385
llm_goals_401,test,47,0.999787747862263,0.9999059438703174
llm_goals_401,test,48,0.9999903440477812,0.9999988079071328
llm_goals_401,test,49,0.9970360995204356,0.999999344348895
llm_goals_326,test,0,0.9999448657028588,0.9998103380222648
llm_goals_326,test,1,0.9997162222790396,0.1015499721104398
llm_goals_326,test,2,0.9999448657028588,0.9995523691298543
llm_goals_326,test,3,0.993652939695984,0.9820513126171384
llm_goals_326,test,4,0.9994552731394392,0.9997708797458836
llm_goals_326,test,5,0.9997428655652144,0.0041024868608885
llm_goals_326,test,6,0.008697928448145,0.0013792452717851
llm_goals_326,test,7,0.9999448657028588,0.9970470071684427
llm_goals_326,test,8,0.9997829198894748,0.9994441866676194
llm_goals_326,test,9,0.00967461000004,0.058725887838439
llm_goals_326,test,10,0.9995234012483056,0.9983887672460816
llm_goals_326,test,11,0.9999688863756148,0.9773504733838247
llm_goals_326,test,12,0.9110749985946988,0.5111671721675201
llm_goals_326,test,13,0.00967461000004,0.0023213561119498
llm_goals_326,test,14,0.9779286376412862,0.9992487430849846
llm_goals_326,test,15,0.9977266191515928,0.9998496770786612
llm_goals_326,test,16,0.9997965693493795,0.9995788335870258
llm_goals_326,test,17,0.9998925924288866,0.0289194533041716
llm_goals_326,test,18,0.9997892379832868,0.9941717982892394
llm_goals_326,test,19,0.9969296455445616,0.9898712036276838
llm_goals_326,test,20,0.9994552731394392,0.998426973781836
llm_goals_326,test,21,0.0110746234382364,0.0080112452725568
llm_goals_326,test,22,0.998944938221402,0.0170446490301255
llm_goals_326,test,23,0.9886808986843612,0.9315074100877992
llm_goals_326,test,24,0.9998468756634564,0.9996359944310432
llm_goals_326,test,25,0.9870499964536364,0.9993702173479914
llm_goals_326,test,26,0.9997892379832868,0.99954205751167
llm_goals_326,test,27,0.9999347329121044,0.1439592978368308
llm_goals_326,test,28,0.9841483229619022,0.9782873980924596
llm_goals_326,test,29,0.9965493082191592,0.6406475907057047
llm_goals_326,test,30,0.9995728731197,0.9997262358610556
llm_goals_326,test,31,0.0147799642204839,0.0025467661319066
llm_goals_326,test,32,0.99824374914187,0.927265467234428
llm_goals_326,test,33,0.9997965693493795,0.9970411657688188
llm_goals_326,test,34,0.9995234012483056,0.9924188256928188
llm_goals_326,test,35,0.9999988079071328,0.9999433159814316
llm_goals_326,test,36,0.9986789226973706,0.7828563458619708
llm_goals_326,test,37,0.9660068167312932,0.9921779035200892
llm_goals_326,test,38,0.9998027682272717,0.9710912105847416
llm_goals_326,test,39,0.9581601024396612,0.9591411966937028
llm_goals_326,test,40,0.9995600581203944,0.9675343030198714
llm_goals_326,test,41,0.998944938221402,0.0125675465450323
llm_goals_326,test,42,0.9999864697453116,0.9817813030107898
llm_goals_326,test,43,0.0147799642204839,0.0210821160744808
llm_goals_326,test,44,0.9998901486420124,0.9984526634039176
llm_goals_326,test,45,0.9977530837347932,0.7725256637892597
llm_goals_326,test,46,0.994196474613498,0.7800079567380194
llm_goals_326,test,47,0.9983267187817976,0.9949684144438216
llm_goals_326,test,48,0.9998714923927384,0.9985677004408368
llm_goals_326,test,49,0.9976051450305792,0.045807901396548
llm_goals_415,test,0,0.9388349621129216,0.9997588992066258
llm_goals_415,test,1,0.9999971985817542,0.9999479055404636
llm_goals_415,test,2,0.9666739714933148,0.9957069754348792
llm_goals_415,test,3,0.7380818619443205,0.9998519420664436
llm_goals_415,test,4,0.9999874234199122,0.9993222355665604
llm_goals_415,test,5,0.9999944567679384,0.0031238526915668
llm_goals_415,test,6,0.0015909601944626,0.0017953563962722
llm_goals_415,test,7,0.9999831318859156,0.9612127544780552
llm_goals_415,test,8,0.9999964833260028,0.9824366570655148
llm_goals_415,test,9,0.999990940094108,0.0016438446411424
llm_goals_415,test,10,0.9999619126333728,0.9999850988388712
llm_goals_415,test,11,0.999999225139634,0.9989992976042504
llm_goals_415,test,12,0.1299853213149313,0.3845905785054697
llm_goals_415,test,13,0.999311327923382,0.0001663988005876
llm_goals_415,test,14,0.9999619126333728,0.99998015165382
llm_goals_415,test,15,0.9999979734420849,0.9986550807653384
llm_goals_415,test,16,0.9999971985817542,0.9999568462370104
llm_goals_415,test,17,0.9999921917910958,0.9992712139839848
llm_goals_415,test,18,0.9999864101405658,0.9999991655349802
llm_goals_415,test,19,0.9999925494194192,0.1268431093615233
llm_goals_415,test,20,0.9999989867209838,0.9989575147526004
llm_goals_415,test,21,0.0007868110325522,0.0009023478721852
llm_goals_415,test,22,0.9999844431868498,0.9999995231628418
llm_goals_415,test,23,0.9999971985817542,0.993058026033597
llm_goals_415,test,24,0.9999986886977652,0.9999659061423206
llm_goals_415,test,25,0.999808549874483,0.9999040365210196
llm_goals_415,test,26,0.9999080300352768,0.9999980330466104
llm_goals_415,test,27,0.867310221105661,0.9999982118606638
llm_goals_415,test,28,0.9999080300352768,0.9999243617070486
llm_goals_415,test,29,0.9999619126333728,0.0442403483495126
llm_goals_415,test,30,0.9998183250457464,0.9996343254989244
llm_goals_415,test,31,0.0007868110325522,0.0007251523135023
llm_goals_415,test,32,0.9999831318859156,0.8080266673914581
llm_goals_415,test,33,0.9999909996982146,0.9999894499780476
llm_goals_415,test,34,0.9999738335613207,0.9994327426028377
llm_goals_415,test,35,0.9847260716465316,0.9989529847642252
llm_goals_415,test,36,0.9999619126333728,0.9999961853027344
llm_goals_415,test,37,0.999937295915171,0.3947042465556775
llm_goals_415,test,38,0.9999991655349802,0.8703240197518964
llm_goals_415,test,39,0.9999992847442344,0.0273997177536015
llm_goals_415,test,40,0.9999974966048696,0.9999445676815596
llm_goals_415,test,41,0.9999998807907032,0.0002682073682728
llm_goals_415,test,42,0.9999971985817542,0.9981696606070336
llm_goals_415,test,43,0.0007868110325522,0.2786076155583993
llm_goals_415,test,44,0.9999968409538144,0.9965623020600424
llm_goals_415,test,45,0.999989688396868,0.9966514706305192
llm_goals_415,test,46,0.999970734120207,0.9965545534402274
llm_goals_415,test,47,0.9999309182164476,0.9999976754188272
llm_goals_415,test,48,0.9999771714215115,0.9999974966048696
llm_goals_415,test,49,0.9999982118606638,0.9999994635581704
llm_goals_146,test,0,0.9240624341125064,0.9937213660464576
llm_goals_146,test,1,0.9969121813069188,0.9919615387432202
llm_goals_146,test,2,0.0212794746481859,0.9951347707289916
llm_goals_146,test,3,0.99997317790941,0.9912926556861676
llm_goals_146,test,4,0.99965834617083,0.7208669260139297
llm_goals_146,test,5,0.988017201735565,0.0092084125425934
llm_goals_146,test,6,0.9993112683016196,0.1369906233450708
llm_goals_146,test,7,0.9988038539880396,0.9175609963819736
llm_goals_146,test,8,0.9973825215246378,0.0841403066718625
llm_goals_146,test,9,0.999562978747354,0.1684153143767103
llm_goals_146,test,10,0.9999626278875888,0.908113835652124
llm_goals_146,test,11,0.9999741315840668,0.8938514016497744
llm_goals_146,test,12,0.9903303981170524,0.0100032471486232
llm_goals_146,test,13,0.0315264321723481,0.0298375477746486
llm_goals_146,test,14,0.0209805824317376,0.3167174882579391
llm_goals_146,test,15,0.9979699254528004,0.927414416219921
llm_goals_146,test,16,0.3566676000975422,0.0159187313778433
llm_goals_146,test,17,0.9986089467539164,0.9978384970986696
llm_goals_146,test,18,0.852414364402017,0.4101569026026918
llm_goals_146,test,19,0.9999039173159018,0.9986221193952473
llm_goals_146,test,20,0.999562978747354,0.7513560649612049
llm_goals_146,test,21,0.3296304655279529,0.0021027028134696
llm_goals_146,test,22,0.999931395057156,0.9998958110811108
llm_goals_146,test,23,0.9792481665207596,0.7051541837582169
llm_goals_146,test,24,0.9990951419115592,0.0397261476166626
llm_goals_146,test,25,0.9999870657920578,0.8227276184379292
llm_goals_146,test,26,0.999562978747354,0.2677446993446601
llm_goals_146,test,27,0.0622701407003412,0.99998730421031
llm_goals_146,test,28,0.9999741315840668,0.492199104386424
llm_goals_146,test,29,0.9997434020147056,0.987386405278924
llm_goals_146,test,30,0.9999466538434332,0.9782173041265074
llm_goals_146,test,31,0.9999535083773644,0.0704110414375715
llm_goals_146,test,32,0.9988038539880396,0.5230369446492051
llm_goals_146,test,33,0.9988038539880396,0.3253501541923078
llm_goals_146,test,34,0.0593467884644384,0.9673128124700084
llm_goals_146,test,35,0.9999626278875888,0.9997146725628192
llm_goals_146,test,36,0.3296304655279529,0.9323108220562318
llm_goals_146,test,37,0.9778761260465448,0.9997609853775884
llm_goals_146,test,38,0.1718327041450559,0.9964783192363952
llm_goals_146,test,39,0.9996777772940014,0.0664083062639811
llm_goals_146,test,40,0.999931395057156,0.6598511913765792
llm_goals_146,test,41,0.9996270537412372,0.1032532555810967
llm_goals_146,test,42,0.1660562795782488,0.9252474342352108
llm_goals_146,test,43,0.0209805824317376,0.2905593299202337
llm_goals_146,test,44,0.9998908042940472,0.3807617993711434
llm_goals_146,test,45,0.999875664714204,0.972134053996152
llm_goals_146,test,46,0.9416558139635912,0.1382936231589401
llm_goals_146,test,47,0.9944762586870528,0.9162934404085756
llm_goals_146,test,48,0.9999928474427408,0.2466934390927757
llm_goals_146,test,49,0.9999039173159018,0.9999247193370324
llm_goals_293,test,0,0.9856056573069608,0.9999973177909444
llm_goals_293,test,1,0.9999995231628418,0.9999983310699748
llm_goals_293,test,2,0.9999994039535594,0.9999885559082036
llm_goals_293,test,3,0.9999866485595712,0.9996450543386908
llm_goals_293,test,4,0.9999996423721385,0.9999996423721385
llm_goals_293,test,5,0.9999992847442344,0.9999819397920116
llm_goals_293,test,6,0.99999910593033,0.9999997019767636
llm_goals_293,test,7,0.9999997019767636,0.999996066093452
llm_goals_293,test,8,0.9997166395096212,0.9999997615814208
llm_goals_293,test,9,0.9953658582561524,0.9999495744722752
llm_goals_293,test,10,0.9999976158140952,0.9999885559082036
llm_goals_293,test,11,0.999996721744454,0.999996721744454
llm_goals_293,test,12,0.9999912381174048,0.9999988675117084
llm_goals_293,test,13,0.9999037981035228,0.9999983906746356
llm_goals_293,test,14,0.9999924302101154,0.9999996423721385
llm_goals_293,test,15,0.9999995827674883,0.9999997615814208
llm_goals_293,test,16,0.9999924302101154,0.9999994039535594
llm_goals_293,test,17,0.9754672649571284,0.9999927282334016
llm_goals_293,test,18,0.9953658582561524,0.9999998211860676
llm_goals_293,test,19,0.9998058676733556,0.9999971985817542
llm_goals_293,test,20,0.9999996423721385,0.9999998211860676
llm_goals_293,test,21,0.9999992847442344,0.999999344348895
llm_goals_293,test,22,0.9953658582561524,0.999999225139634
llm_goals_293,test,23,0.9999924302101154,0.9999982714653176
llm_goals_293,test,24,0.9999992847442344,0.9999997019767636
llm_goals_293,test,25,0.9856056573069608,0.9999955296516294
llm_goals_293,test,26,0.9953658582561524,0.9999997615814208
llm_goals_293,test,27,0.9999037981035228,0.9999994635581704
llm_goals_293,test,28,0.999998509883854,0.9999988675117084
llm_goals_293,test,29,0.999994099140297,0.9999997615814208
llm_goals_293,test,30,0.999981403350946,0.9999886751170456
llm_goals_293,test,31,0.9999989271164011,0.9999983906746356
llm_goals_293,test,32,0.9999997615814208,0.9999979734420849
llm_goals_293,test,33,0.9999866485595712,0.9999989271164011
llm_goals_293,test,34,0.9999964833260028,0.9999950528144428
llm_goals_293,test,35,0.9999992847442344,0.9999990463256836
llm_goals_293,test,36,0.9625019422893564,0.9974341988179988
llm_goals_293,test,37,0.9999037981035228,0.999947488307946
llm_goals_293,test,38,0.999994099140297,0.9999994039535594
llm_goals_293,test,39,0.9999898672107936,0.9999996423721385
llm_goals_293,test,40,0.9953658582561524,0.9999990463256836
llm_goals_293,test,41,0.9999992847442344,0.9999995827674883
llm_goals_293,test,42,0.9999992847442344,0.999998450279186
llm_goals_293,test,43,0.9999994039535594,0.999937295915171
llm_goals_293,test,44,0.9999995827674883,0.9999994635581704
llm_goals_293,test,45,0.9999866485595712,0.9999981522560136
llm_goals_293,test,46,0.9999361038177048,0.999995648860848
llm_goals_293,test,47,0.9999995827674883,0.9999973177909444
llm_goals_293,test,48,0.9999997615814208,0.9999997019767636
llm_goals_293,test,49,0.999997437000376,0.9999975562095944
llm_goals_230,test,0,0.9999910593032342,0.9999988675117084
llm_goals_230,test,1,0.99999910593033,0.9999197721505853
llm_goals_230,test,2,0.9999967813491324,0.9999986290932004
llm_goals_230,test,3,0.9999995827674883,0.9999998807907032
llm_goals_230,test,4,0.999999344348895,0.9999992847442344
llm_goals_230,test,5,0.9982005954015007,0.97145622955703
llm_goals_230,test,6,0.9990922808645516,0.9931073785733624
llm_goals_230,test,7,0.9999945163727092,0.9999989271164011
llm_goals_230,test,8,0.9999989867209838,0.9999994039535594
llm_goals_230,test,9,0.9906488654407964,0.999468743814106
llm_goals_230,test,10,0.999994158744592,0.9999828934677488
llm_goals_230,test,11,0.9999990463256836,0.9999996423721385
llm_goals_230,test,12,0.9999983906746356,0.999997794628074
llm_goals_230,test,13,0.9998332858098395,0.9983894825119092
llm_goals_230,test,14,0.9999982714653176,0.9999980926513672
llm_goals_230,test,15,0.999999344348895,0.9999994039535594
llm_goals_230,test,16,0.9999973773956584,0.99999570846569
llm_goals_230,test,17,0.999999225139634,0.9997287988607096
llm_goals_230,test,18,0.9999974966048696,0.9999986290932004
llm_goals_230,test,19,0.9999990463256836,0.792201278640246
llm_goals_230,test,20,0.99999910593033,0.9999989271164011
llm_goals_230,test,21,0.9991578459510064,0.9993889927972028
llm_goals_230,test,22,0.9999996423721385,0.9999741315840668
llm_goals_230,test,23,0.9999990463256836,0.9999991655349802
llm_goals_230,test,24,0.999998450279186,0.9999988675117084
llm_goals_230,test,25,0.9999955296516294,0.9999902248378308
llm_goals_230,test,26,0.9999969005585,0.9999990463256836
llm_goals_230,test,27,0.9999995231628418,0.9999489188180812
llm_goals_230,test,28,0.9999997019767636,0.9999998211860676
llm_goals_230,test,29,0.9999989867209838,0.9489630473854872
llm_goals_230,test,30,0.9999973773956584,0.9999970197676546
llm_goals_230,test,31,0.9991578459510064,0.997134745101166
llm_goals_230,test,32,0.9999990463256836,0.9999995231628418
llm_goals_230,test,33,0.999998450279186,0.999997437000376
llm_goals_230,test,34,0.9999657869334646,0.9999924898147656
llm_goals_230,test,35,0.9999967813491324,0.9999969005585
llm_goals_230,test,36,0.9999973773956584,0.9999945163727092
llm_goals_230,test,37,0.9999985694885254,0.9779089689145934
llm_goals_230,test,38,0.9999988079071328,0.9570343502785515
llm_goals_230,test,39,0.9999983906746356,0.9999988079071328
llm_goals_230,test,40,0.9999985694885254,0.9999989271164011
llm_goals_230,test,41,0.9995568394653176,0.99562537655113
llm_goals_230,test,42,0.9999910593032342,0.999997794628074
llm_goals_230,test,43,0.9982005954015007,0.9952926635719378
llm_goals_230,test,44,0.9999992847442344,0.9999994635581704
llm_goals_230,test,45,0.9999998807907032,0.9999998211860676
llm_goals_230,test,46,0.9999994635581704,0.9999992847442344
llm_goals_230,test,47,0.9999998807907032,0.9999998211860676
llm_goals_230,test,48,0.999998450279186,0.9999990463256836
llm_goals_230,test,49,0.9999995827674883,0.9998905062670348
llm_goals_115,test,0,0.99999910593033,0.9999962449073808
llm_goals_115,test,1,0.999935865399837,0.9999990463256836
llm_goals_115,test,2,0.9999990463256836,0.9999997019767636
llm_goals_115,test,3,0.999790668485264,0.9999576807027534
llm_goals_115,test,4,0.9999980330466104,0.999958157538035
llm_goals_115,test,5,0.9999992847442344,0.999957859516412
llm_goals_115,test,6,0.9999995231628418,0.9999822974207612
llm_goals_115,test,7,0.9999994039535594,0.9999992847442344
llm_goals_115,test,8,0.9999547600756996,0.9999833106986686
llm_goals_115,test,9,0.9999634027484156,0.9999994635581704
llm_goals_115,test,10,0.9999958872793276,0.9999232888251398
llm_goals_115,test,11,0.9999979138373352,0.1735883698655277
llm_goals_115,test,12,0.9999994635581704,0.9999995231628418
llm_goals_115,test,13,0.9999949336052952,0.999999344348895
llm_goals_115,test,14,0.9999980926513672,0.999998450279186
llm_goals_115,test,15,0.9999978542328164,0.9952644706725092
llm_goals_115,test,16,0.9999995827674883,0.9999927878380692
llm_goals_115,test,17,0.9999951124192492,0.999998509883854
llm_goals_115,test,18,0.9999986290932004,0.9999974966048696
llm_goals_115,test,19,0.9999921917910958,0.99996823072331
llm_goals_115,test,20,0.999984383583134,0.9999916553499876
llm_goals_115,test,21,0.9999951124192492,0.999999344348895
llm_goals_115,test,22,0.9999634027484156,0.9999989867209838
llm_goals_115,test,23,0.9999942779541016,0.9994583130121676
llm_goals_115,test,24,0.9999547600756996,0.9999986290932004
llm_goals_115,test,25,0.9999995231628418,0.9999879002575536
llm_goals_115,test,26,0.999999225139634,0.9999988079071328
llm_goals_115,test,27,0.9999920725818348,0.9999988079071328
llm_goals_115,test,28,0.9999979138373352,0.0502507498981832
llm_goals_115,test,29,0.9999986886977652,0.999960899353502
llm_goals_115,test,30,0.9999995231628418,0.9999914169306978
llm_goals_115,test,31,0.9999921917910958,0.9999992847442344
llm_goals_115,test,32,0.9999547600756996,0.9999759793274372
llm_goals_115,test,33,0.9999994635581704,0.9999992847442344
llm_goals_115,test,34,0.9999995231628418,0.9999864101405658
llm_goals_115,test,35,0.9999966025353348,0.999999344348895
llm_goals_115,test,36,0.9999426007264782,0.999999344348895
llm_goals_115,test,37,0.9999935626981654,0.9999979734420849
llm_goals_115,test,38,0.9999982118606638,0.9999599456769136
llm_goals_115,test,39,0.9978380203630004,0.999999344348895
llm_goals_115,test,40,0.9999992847442344,0.9998471736847392
llm_goals_115,test,41,0.999999225139634,0.9999997615814208
llm_goals_115,test,42,0.9999979734420849,0.9999936819076042
llm_goals_115,test,43,0.9999973177909444,0.9999994039535594
llm_goals_115,test,44,0.9999958276749296,0.9999966621397788
llm_goals_115,test,45,0.9999978542328164,0.9908538461901172
llm_goals_115,test,46,0.9999921917910958,0.5668339122107139
llm_goals_115,test,47,0.9999978542328164,0.999965012074428
llm_goals_115,test,48,0.9999926090240764,0.9999986290932004
llm_goals_115,test,49,0.9999986886977652,0.9999966025353348
llm_goals_86,test,0,0.9974777102913972,0.9999950528144428
llm_goals_86,test,1,0.9999807476995284,0.9733920102032824
llm_goals_86,test,2,0.9985559582407884,0.9999997019767636
llm_goals_86,test,3,0.9996252059898348,0.9999989867209838
llm_goals_86,test,4,0.999997437000376,0.9999939203260696
llm_goals_86,test,5,0.998824417623073,0.9799200289999128
llm_goals_86,test,6,0.9999229907957206,0.9999989271164011
llm_goals_86,test,7,0.999997437000376,0.9999911785123744
llm_goals_86,test,8,0.9999989867209838,0.9906920788388957
llm_goals_86,test,9,0.9999970793723508,0.960079549439269
llm_goals_86,test,10,0.939100741663466,0.9999979734420849
llm_goals_86,test,11,0.9974777102913972,0.998329818271824
llm_goals_86,test,12,0.999995648860848,0.9999976158140952
llm_goals_86,test,13,0.9970803260630642,0.997893571823832
llm_goals_86,test,14,0.9999976754188272,0.9994581937511068
llm_goals_86,test,15,0.939100741663466,0.9993743300463472
llm_goals_86,test,16,0.9996252059898348,0.9959942101456876
llm_goals_86,test,17,0.989278435750766,0.9989233016552924
llm_goals_86,test,18,0.99999910593033,0.999989688396868
llm_goals_86,test,19,0.9999970793723508,0.99977147578688
llm_goals_86,test,20,0.9999762773508224,0.999986886977724
llm_goals_86,test,21,0.989278435750766,0.9995875954544448
llm_goals_86,test,22,0.9999773502350175,0.9998529553413918
llm_goals_86,test,23,0.999994099140297,0.9999995827674883
llm_goals_86,test,24,0.9999773502350175,0.98040735685252
llm_goals_86,test,25,0.9775279767878964,0.9999257922204762
llm_goals_86,test,26,0.9970803260630642,0.9992931485112122
llm_goals_86,test,27,0.9417402153048168,0.999970734120207
llm_goals_86,test,28,0.9999997615814208,0.9998175501809444
llm_goals_86,test,29,0.9999969005585,0.9995185136816022
llm_goals_86,test,30,0.9951816795315672,0.9807010897549824
llm_goals_86,test,31,0.9996092915605792,0.9998762011476526
llm_goals_86,test,32,0.9996252059898348,0.9988895059174044
llm_goals_86,test,33,0.9970803260630642,0.9999738931662266
llm_goals_86,test,34,0.9996252059898348,0.9977411627147142
llm_goals_86,test,35,0.9997342824997948,0.9999870657920578
llm_goals_86,test,36,0.9134991171840257,0.9994595050999702
llm_goals_86,test,37,0.9258488989970004,0.9993578791799612
llm_goals_86,test,38,0.999995648860848,0.9999866485595712
llm_goals_86,test,39,0.999995648860848,0.99997985362928
llm_goals_86,test,40,0.9999773502350175,0.999995470046798
llm_goals_86,test,41,0.999998509883854,0.99996912479408
llm_goals_86,test,42,0.9999946951865883,0.9999997615814208
llm_goals_86,test,43,0.9996252059898348,0.9999995827674883
llm_goals_86,test,44,0.9999496936791984,0.997135043199176
llm_goals_86,test,45,0.9914942385541772,0.9999841451646688
llm_goals_86,test,46,0.999997437000376,0.3364333057002893
llm_goals_86,test,47,0.9999677538868628,0.9991943836221492
llm_goals_86,test,48,0.9999946951865883,0.9999958872793276
llm_goals_86,test,49,0.6224250119631531,0.999995648860848
llm_goals_281,test,0,0.9999995827674883,0.9996947049971306
llm_goals_281,test,1,0.9139502074350812,0.9999986290932004
llm_goals_281,test,2,0.0074812797660518,0.9983671307551129
llm_goals_281,test,3,0.9139502074350812,0.993962764832135
llm_goals_281,test,4,0.9999990463256836,0.9999989271164011
llm_goals_281,test,5,0.9999998807907032,0.9999997019767636
llm_goals_281,test,6,0.999996125697864,0.9999997019767636
llm_goals_281,test,7,0.0074812797660518,0.973559082090764
llm_goals_281,test,8,0.9999852180482104,0.9999968409538144
llm_goals_281,test,9,0.9999997019767636,0.9999994635581704
llm_goals_281,test,10,0.999999344348895,0.9999997019767636
llm_goals_281,test,11,0.9999997615814208,0.9999951720236044
llm_goals_281,test,12,0.9999997615814208,0.9999264478667818
llm_goals_281,test,13,0.9999997019767636,0.9999998807907032
llm_goals_281,test,14,0.9999988079071328,0.9999976158140952
llm_goals_281,test,15,0.9999997019767636,0.9999992847442344
llm_goals_281,test,16,0.9139502074350812,0.9999986886977652
llm_goals_281,test,17,0.9999994039535594,0.9999985694885254
llm_goals_281,test,18,0.9999988079071328,0.999999344348895
llm_goals_281,test,19,0.0439512243670495,2.503036581908297e-05
llm_goals_281,test,20,0.9999990463256836,0.999996542930667
llm_goals_281,test,21,0.9999988079071328,0.9999997615814208
llm_goals_281,test,22,0.996452748738464,0.9999986886977652
llm_goals_281,test,23,0.9999998211860676,0.999999344348895
llm_goals_281,test,24,0.9999988079071328,0.9999715089800396
llm_goals_281,test,25,0.0014431735721192,0.9999983310699748
llm_goals_281,test,26,0.9999988079071328,0.9999986290932004
llm_goals_281,test,27,0.9999969005585,0.9999990463256836
llm_goals_281,test,28,0.9999997019767636,0.8906972993247301
llm_goals_281,test,29,0.0014431735721192,7.346078924151352e-05
llm_goals_281,test,30,0.9999997019767636,0.9999995827674883
llm_goals_281,test,31,0.9999997019767636,0.9999997019767636
llm_goals_281,test,32,0.9999991655349802,0.99999910593033
llm_goals_281,test,33,0.9999995231628418,0.9999994039535594
llm_goals_281,test,34,0.9999996423721385,0.9999989867209838
llm_goals_281,test,35,0.1365123869003957,0.9934774041946208
llm_goals_281,test,36,0.9999995827674883,0.9999990463256836
llm_goals_281,test,37,0.0439512243670495,3.4259730994143734e-05
llm_goals_281,test,38,0.9999989867209838,0.3148602040230503
llm_goals_281,test,39,0.9999396800998164,0.9940564630440718
llm_goals_281,test,40,0.9999994635581704,0.999999344348895
llm_goals_281,test,41,0.9999988079071328,0.9999998211860676
llm_goals_281,test,42,0.0101683509824279,0.999860048294782
llm_goals_281,test,43,0.999997437000376,0.9999997019767636
llm_goals_281,test,44,0.9999974966048696,0.9999992847442344
llm_goals_281,test,45,0.9999998211860676,0.9728845352464304
llm_goals_281,test,46,0.9999970197676546,0.9999996423721385
llm_goals_281,test,47,0.9996691942345924,0.999986290931994
llm_goals_281,test,48,0.9999988079071328,0.9999994039535594
llm_goals_281,test,49,0.9999921917910958,0.999999344348895
llm_goals_182,test,0,0.0001504057953164,0.9999994039535594
llm_goals_182,test,1,3.195697806756672e-05,0.0005625917030918
llm_goals_182,test,2,0.9999084472658808,0.9999986886977652
llm_goals_182,test,3,0.999627709380766,7.296223953885346e-06
llm_goals_182,test,4,0.9998146891603084,0.9999976158140952
llm_goals_182,test,5,0.0334681510622184,0.003103044503552
llm_goals_182,test,6,0.9998146891603084,0.0119719938396825
llm_goals_182,test,7,0.9998146891603084,0.9999994635581704
llm_goals_182,test,8,0.993182599646965,0.9999964833260028
llm_goals_182,test,9,0.0334681510622184,0.0113900113927541
llm_goals_182,test,10,0.9998276233683632,0.9961416126209276
llm_goals_182,test,11,0.9996523857239654,0.999994337558862
llm_goals_182,test,12,0.996753275444625,0.0378442217787105
llm_goals_182,test,13,0.9996523857239654,0.0008868430627717
llm_goals_182,test,14,0.0079104431402619,0.0008985942545946
llm_goals_182,test,15,5.369393308464664e-05,0.9999988675117084
llm_goals_182,test,16,0.0067910556637482,0.0033689156613595
llm_goals_182,test,17,0.999627709380766,0.0006440135974187
llm_goals_182,test,18,0.0067910556637482,0.0016946532068186
llm_goals_182,test,19,0.9995110631089896,0.9999406933800118
llm_goals_182,test,20,0.9999983310699748,0.99999910593033
llm_goals_182,test,21,0.9996523857239654,0.006514652424738
llm_goals_182,test,22,0.0001072651944523,0.0008693644862334
llm_goals_182,test,23,0.9999913573265664,0.9999617934213552
llm_goals_182,test,24,0.9998463392311912,0.0038374716596311
llm_goals_182,test,25,0.999912440775928,0.9941936732536844
llm_goals_182,test,26,0.0079104431402619,0.001039830413279
llm_goals_182,test,27,0.9992952346555128,0.0007135811001391
llm_goals_182,test,28,0.999661982069597,7.789882184923891e-06
llm_goals_182,test,29,0.999661982069597,0.999957442283379
llm_goals_182,test,30,0.9998146891603084,0.9981520175441102
llm_goals_182,test,31,0.0334681510622184,0.0117830754540077
llm_goals_182,test,32,0.9998146891603084,0.9999659657485728
llm_goals_182,test,33,0.0010786427361255,0.003031636673792
llm_goals_182,test,34,0.9998276233683632,0.9774106140350124
llm_goals_182,test,35,0.9996523857239654,0.9999996423721385
llm_goals_182,test,36,0.9999771118164102,0.9979310631755344
llm_goals_182,test,37,0.9566062083793906,0.9998408556030968
llm_goals_182,test,38,0.9998146891603084,0.999994218349345
llm_goals_182,test,39,0.9996523857239654,0.1486108277942357
llm_goals_182,test,40,0.8639939385900572,0.9999673962596765
llm_goals_182,test,41,0.0334681510622184,0.0004129864967066
llm_goals_182,test,42,0.9999084472658808,0.9999995231628418
llm_goals_182,test,43,0.0334681510622184,0.0046706145770988
llm_goals_182,test,44,0.999998450279186,0.9999978542328164
llm_goals_182,test,45,0.999912440775928,1.853969397415038e-05
llm_goals_182,test,46,0.0001051781594594,0.9999624490730772
llm_goals_182,test,47,0.7184901792804654,2.5724993639382006e-05
llm_goals_182,test,48,0.0067910556637482,0.0005832931102604
llm_goals_182,test,49,0.997590422744337,0.0013167466449808
llm_goals_438,test,0,0.9999816417687576,0.0127917126432779
llm_goals_438,test,1,0.9999995231628418,0.9999138712868518
llm_goals_438,test,2,0.9999997019767636,0.001266465311242
llm_goals_438,test,3,0.9999997019767636,0.9997649192827218
llm_goals_438,test,4,0.9999997019767636,0.995094418582848
llm_goals_438,test,5,0.9999996423721385,0.9676808127608026
llm_goals_438,test,6,0.9999637603741734,0.9681100847526048
llm_goals_438,test,7,0.9999987483024472,0.1433627923531326
llm_goals_438,test,8,0.9999997019767636,0.9999272823362588
llm_goals_438,test,9,0.999976515769231,0.3346369990700403
llm_goals_438,test,10,0.9999996423721385,0.0032511657787224
llm_goals_438,test,11,0.9999960064885888,0.9991979598760046
llm_goals_438,test,12,0.999919593336462,0.9979441166238928
llm_goals_438,test,13,0.9999998211860676,0.1369715342565285
llm_goals_438,test,14,0.9999891519543742,0.9999860525130736
llm_goals_438,test,15,0.999975919724226,0.9995588660290228
llm_goals_438,test,16,0.9999994039535594,0.9999721646308564
llm_goals_438,test,17,0.9999960064885888,0.9999966025353348
llm_goals_438,test,18,0.9999979138373352,0.9999983906746356
llm_goals_438,test,19,0.9999998211860676,0.9999996423721385
llm_goals_438,test,20,0.9999989867209838,0.9997635483790388
llm_goals_438,test,21,0.9999979138373352,0.9481995120869072
llm_goals_438,test,22,0.9999979138373352,0.9999990463256836
llm_goals_438,test,23,0.9999998807907032,0.9995222687768196
llm_goals_438,test,24,0.999976515769231,0.999998450279186
llm_goals_438,test,25,0.9999998211860676,0.0119505141994216
llm_goals_438,test,26,0.999986290931994,0.9546977279083356
llm_goals_438,test,27,0.9999960064885888,0.9999922513961864
llm_goals_438,test,28,0.999976515769231,0.9999902844428042
llm_goals_438,test,29,0.9999998211860676,0.9999998211860676
llm_goals_438,test,30,0.9999992847442344,0.0012244399528321
llm_goals_438,test,31,0.9977121352687408,0.9598621719385948
llm_goals_438,test,32,0.9999931454656964,0.9979359506472824
llm_goals_438,test,33,0.9999878406527222,0.9999122619631158
llm_goals_438,test,34,0.9999990463256836,0.0033786082834978
llm_goals_438,test,35,0.9999994635581704,0.7030742694516781
llm_goals_438,test,36,0.999986290931994,0.0009362307836721
llm_goals_438,test,37,0.9999992847442344,0.9999994635581704
llm_goals_438,test,38,0.9999980330466104,0.9999997019767636
llm_goals_438,test,39,0.9999979138373352,0.0899507873745254
llm_goals_438,test,40,0.9999979138373352,0.8368337146398075
llm_goals_438,test,41,0.9999979138373352,0.9687532202387088
llm_goals_438,test,42,0.9999997019767636,0.001642352875252
llm_goals_438,test,43,0.999919593336462,0.994022190528956
llm_goals_438,test,44,0.9999994039535594,0.999978065491181
llm_goals_438,test,45,0.9999997615814208,0.9999783635133692
llm_goals_438,test,46,0.9999851584435392,0.9999961853027344
llm_goals_438,test,47,0.999986290931994,0.9998934864975054
llm_goals_438,test,48,0.9999979138373352,0.9999979734420849
llm_goals_438,test,49,0.999999225139634,0.9999861717225268
llm_goals_206,test,0,0.9998595714517224,0.9991406798194884
llm_goals_206,test,1,0.4039679908137117,0.7026181814697341
llm_goals_206,test,2,0.990578711460228,0.9495592135330754
llm_goals_206,test,3,0.4039679908137117,0.4597382924578109
llm_goals_206,test,4,0.4039679908137117,0.456834747394902
llm_goals_206,test,5,0.0129513687364137,0.0069897250631233
llm_goals_206,test,6,0.4039679908137117,0.1198500283021958
llm_goals_206,test,7,0.9727253917498584,0.9853912589369151
llm_goals_206,test,8,0.990578711460228,0.9858354928324288
llm_goals_206,test,9,0.3912683703963872,0.7676771375411302
llm_goals_206,test,10,0.0001266659740735,6.0325856974144665e-05
llm_goals_206,test,11,0.4039679908137117,0.9932408335154868
llm_goals_206,test,12,0.3008499922160146,0.87151349073003
llm_goals_206,test,13,0.3912683703963872,4.2185384445727474e-05
llm_goals_206,test,14,0.9998595714517224,0.8643435780923203
llm_goals_206,test,15,0.3008499922160146,0.3192446879498265
llm_goals_206,test,16,0.3912683703963872,0.8269734919284588
llm_goals_206,test,17,0.9998595714517224,0.9885780813553218
llm_goals_206,test,18,0.0345846013859482,0.004661507854032
llm_goals_206,test,19,0.0001266659740735,2.09967085772139e-05
llm_goals_206,test,20,0.9998595714517224,0.98699533957105
llm_goals_206,test,21,0.9999807476995284,0.9343360672856648
llm_goals_206,test,22,0.0345846013859482,0.0175621316229822
llm_goals_206,test,23,0.0345846013859482,0.8257364630087937
llm_goals_206,test,24,0.0345846013859482,0.9999812841420614
llm_goals_206,test,25,0.3008499922160146,0.5058550948948065
llm_goals_206,test,26,0.990578711460228,0.993140757045314
llm_goals_206,test,27,0.4039679908137117,2.2270664938206257e-05
llm_goals_206,test,28,0.0540173816471918,0.950193582732028
llm_goals_206,test,29,0.3008499922160146,0.9696497918757307
llm_goals_206,test,30,0.0345846013859482,0.0026329471014817
llm_goals_206,test,31,0.9998595714517224,0.892615734505986
llm_goals_206,test,32,0.001660377810379,0.6161747460126132
llm_goals_206,test,33,0.2058874006337182,0.0330446953951764
llm_goals_206,test,34,0.0345846013859482,0.9667759539880174
llm_goals_206,test,35,0.9727253917498584,0.9067099130837172
llm_goals_206,test,36,0.9998595714517224,0.9999364614518882
llm_goals_206,test,37,0.0001266659740735,3.930535533630151e-05
llm_goals_206,test,38,0.3008499922160146,0.8118365412646018
llm_goals_206,test,39,0.3008499922160146,0.6533351590647749
llm_goals_206,test,40,0.0345846013859482,1.0367098236044126e-05
llm_goals_206,test,41,0.0345846013859482,0.9999849200248888
llm_goals_206,test,42,0.9998595714517224,0.9495081916810176
llm_goals_206,test,43,0.010122909476313,0.967551113836368
llm_goals_206,test,44,0.010122909476313,0.0156578839862262
llm_goals_206,test,45,0.0129513687364137,0.0016468393065651
llm_goals_206,test,46,0.2058874006337182,0.0561833196086265
llm_goals_206,test,47,0.0001266659740735,8.951690490961762e-05
llm_goals_206,test,48,0.0345846013859482,0.3268218248822932
llm_goals_206,test,49,0.010122909476313,0.0047424109160671
