template_id,split,question_idx,prediction,label
llm_goals_75,test,0,0.3068688036584422,0.0759730864369293
llm_goals_75,test,1,0.5767034253517606,0.8120127334654941
llm_goals_75,test,2,0.7999957232306157,0.114709127325878
llm_goals_75,test,3,0.0294749366162102,0.1496870071208148
llm_goals_75,test,4,0.4057050201261458,0.321632167436288
llm_goals_75,test,5,0.6031458962308629,0.0308084020440725
llm_goals_75,test,6,0.6286039301347505,0.1843175427563358
llm_goals_75,test,7,0.5868280589337401,0.0324508518984932
llm_goals_75,test,8,0.4057050201261458,0.5189439655904322
llm_goals_75,test,9,0.3600750164661534,0.1502023728460554
llm_goals_75,test,10,0.5708956803947145,0.7657257241793485
llm_goals_75,test,11,0.5943327063322009,0.8035850534204568
llm_goals_75,test,12,0.6405356594803939,0.7307072346740583
llm_goals_75,test,13,0.8583149274562963,0.048717541539827
llm_goals_75,test,14,0.1325166322092669,0.4316714754134473
llm_goals_75,test,15,0.7647029127345544,0.3935335107130105
llm_goals_75,test,16,0.3084394536514855,0.6144967070154126
llm_goals_75,test,17,0.365730679907023,0.4488809036296748
llm_goals_75,test,18,0.0791565045704971,0.3920271677291012
llm_goals_75,test,19,0.6341828111241506,0.7810532991351343
llm_goals_75,test,20,0.4057050201261458,0.5443958675997833
llm_goals_75,test,21,0.0294749366162102,0.1604437012338976
llm_goals_75,test,22,0.3485213008307055,0.856696781503626
llm_goals_75,test,23,0.0624200166095117,0.590876283737086
llm_goals_75,test,24,0.5405230572381776,0.4156776627984636
llm_goals_75,test,25,0.5708956803947145,0.5957841371692396
llm_goals_75,test,26,0.3084394536514855,0.3752723036244256
llm_goals_75,test,27,0.0242340711534791,0.7866846353759014
llm_goals_75,test,28,0.8814999424034016,0.1838073487826972
llm_goals_75,test,29,0.021364379881235,0.853944837222159
llm_goals_75,test,30,0.8325525501560704,0.5992601606803653
llm_goals_75,test,31,0.8226421489684412,0.0743179753131944
llm_goals_75,test,32,0.8440009959574867,0.8015013965908157
llm_goals_75,test,33,0.4144994378967592,0.3498422912836759
llm_goals_75,test,34,0.5708956803947145,0.6692496458902099
llm_goals_75,test,35,0.3068688036584422,0.134422492314073
llm_goals_75,test,36,0.5708956803947145,0.6683886675406214
llm_goals_75,test,37,0.7786760389258277,0.7419528346018889
llm_goals_75,test,38,0.4373798010027779,0.6995551035614008
llm_goals_75,test,39,0.620840660561244,0.4983520000991506
llm_goals_75,test,40,0.0791565045704971,0.8622382893733471
llm_goals_75,test,41,0.3485213008307055,0.1026909531781266
llm_goals_75,test,42,0.6753702019847287,0.0240063792397545
llm_goals_75,test,43,0.4224439228959971,0.1143049422953708
llm_goals_75,test,44,0.0399867913863788,0.6884653626060131
llm_goals_75,test,45,0.8319838053603508,0.1059329319681491
llm_goals_75,test,46,0.5782899794776535,0.405588044943207
llm_goals_75,test,47,0.8668903080082331,0.1393457779753145
llm_goals_75,test,48,0.0791565045704971,0.3670858714001939
llm_goals_75,test,49,0.6031458962308629,0.8052537448889737
llm_goals_78,test,0,0.6822444709950509,0.710685793210421
llm_goals_78,test,1,0.8270828152920608,0.4521352090792044
llm_goals_78,test,2,0.6464536249088614,0.6984783435600235
llm_goals_78,test,3,0.5743450001053583,0.2113029164438998
llm_goals_78,test,4,0.4542766207204357,0.59362413330766
llm_goals_78,test,5,0.5444853355267106,0.2973601904856865
llm_goals_78,test,6,0.5100221612732417,0.4911861319335979
llm_goals_78,test,7,0.6917939744240497,0.5109292120432304
llm_goals_78,test,8,0.4542766207204357,0.0214058927819057
llm_goals_78,test,9,0.5817260673757445,0.4561729519761929
llm_goals_78,test,10,0.0936293345782832,0.0679189625299845
llm_goals_78,test,11,0.7906007729423511,0.0515682065315942
llm_goals_78,test,12,0.7799818518622924,0.2832565853408079
llm_goals_78,test,13,0.4319092311401894,0.3661356287525266
llm_goals_78,test,14,0.4061888739514105,0.5580731095047592
llm_goals_78,test,15,0.4542766207204357,0.3539146882613382
llm_goals_78,test,16,0.6352574932224988,0.5198975918853231
llm_goals_78,test,17,0.4868079205788171,0.5974518854580513
llm_goals_78,test,18,0.4132247639915835,0.2539582988569515
llm_goals_78,test,19,0.2043426526047344,0.7818671446797811
llm_goals_78,test,20,0.0413921803781449,0.0817902870466741
llm_goals_78,test,21,0.4319092311401894,0.5313736848686219
llm_goals_78,test,22,0.8176622980082344,0.0578457193154468
llm_goals_78,test,23,0.7134991276280912,0.0588067732422271
llm_goals_78,test,24,0.5685954041374128,0.504620490567031
llm_goals_78,test,25,0.0936293345782832,0.1421301439321696
llm_goals_78,test,26,0.6352574932224988,0.4043160008204248
llm_goals_78,test,27,0.7322745324147136,0.1341547030792127
llm_goals_78,test,28,0.2521321573167069,0.585613528389559
llm_goals_78,test,29,0.1747727196185824,0.8037635629119642
llm_goals_78,test,30,0.2272895988536463,0.2785354206868534
llm_goals_78,test,31,0.5444853355267106,0.5074585147112473
llm_goals_78,test,32,0.7906007729423511,0.1365325187594412
llm_goals_78,test,33,0.4132247639915835,0.559776178990876
llm_goals_78,test,34,0.1273955252451034,0.3923464392379233
llm_goals_78,test,35,0.6822444709950509,0.8694947336510349
llm_goals_78,test,36,0.1273955252451034,0.3406365028138333
llm_goals_78,test,37,0.2534894821969934,0.7407991807699866
llm_goals_78,test,38,0.2361500269221528,0.5783193820848918
llm_goals_78,test,39,0.6831688821251135,0.2552456607848852
llm_goals_78,test,40,0.7974889815541777,0.0543816822443674
llm_goals_78,test,41,0.5127252347789132,0.5111749720190839
llm_goals_78,test,42,0.6464536249088614,0.6373460300781935
llm_goals_78,test,43,0.5444853355267106,0.5824615770869916
llm_goals_78,test,44,0.0755504491541333,0.0725045867582824
llm_goals_78,test,45,0.262446508103782,0.2055844845637347
llm_goals_78,test,46,0.7400305309304561,0.3443727538373435
llm_goals_78,test,47,0.6600166545876675,0.5137599661573641
llm_goals_78,test,48,0.6352574932224988,0.2386868392211005
llm_goals_78,test,49,0.863897320773013,0.1092249314217729
llm_goals_53,test,0,0.086291442715796,0.0313037944392233
llm_goals_53,test,1,0.1431386250455935,0.8240056677766623
llm_goals_53,test,2,0.1937102113583906,0.1449565288533016
llm_goals_53,test,3,0.1431386250455935,0.3918474727299789
llm_goals_53,test,4,0.1431386250455935,0.8286818229760559
llm_goals_53,test,5,0.0784143016661606,0.0496580173268359
llm_goals_53,test,6,0.0815386721815671,0.0987357123371914
llm_goals_53,test,7,0.3513624169403929,0.0188377606185046
llm_goals_53,test,8,0.1455647845223463,0.4663370658319237
llm_goals_53,test,9,0.0815386721815671,0.0353320635735392
llm_goals_53,test,10,0.2143526418664328,0.2465247528295183
llm_goals_53,test,11,0.1041216999762559,0.3482216267575191
llm_goals_53,test,12,0.4264205070820123,0.252877033485255
llm_goals_53,test,13,0.4793935715251785,0.1153444147006914
llm_goals_53,test,14,0.1313961918636896,0.3868210483124377
llm_goals_53,test,15,0.0763437727942194,0.3705090883623566
llm_goals_53,test,16,0.3110171826043897,0.3407126088990169
llm_goals_53,test,17,0.1041556406636899,0.7543820151744927
llm_goals_53,test,18,0.2298888353575327,0.3322955201354975
llm_goals_53,test,19,0.1455647845223463,0.2261316448538241
llm_goals_53,test,20,0.1041556406636899,0.7343425814116562
llm_goals_53,test,21,0.4915130302593928,0.1601759070107346
llm_goals_53,test,22,0.2206843295358783,0.4190051893758809
llm_goals_53,test,23,0.053139286166162,0.2354442333363782
llm_goals_53,test,24,0.1008499025703548,0.9719922543639756
llm_goals_53,test,25,0.1008499025703548,0.3289260309913144
llm_goals_53,test,26,0.3355730913774248,0.5781819989075234
llm_goals_53,test,27,0.1634053214372049,0.790876622992061
llm_goals_53,test,28,0.3513624169403929,0.2747068584160578
llm_goals_53,test,29,0.1008499025703548,0.796844478423965
llm_goals_53,test,30,0.3637465947695278,0.3573432990729852
llm_goals_53,test,31,0.4915130302593928,0.1489779797461384
llm_goals_53,test,32,0.3513624169403929,0.4788477745757265
llm_goals_53,test,33,0.0543428252540774,0.967617631882366
llm_goals_53,test,34,0.099087182966085,0.2252558680565209
llm_goals_53,test,35,0.4142117118370106,0.2300146581986259
llm_goals_53,test,36,0.1313961918636896,0.2311446011459964
llm_goals_53,test,37,0.2143526418664328,0.144409781340655
llm_goals_53,test,38,0.0763437727942194,0.705274211964156
llm_goals_53,test,39,0.3890205344692807,0.5921281985506138
llm_goals_53,test,40,0.0987578899109361,0.2443004460536172
llm_goals_53,test,41,0.0629405330302794,0.061497045516474
llm_goals_53,test,42,0.1113883619695171,0.1570495895565415
llm_goals_53,test,43,0.0891274091255782,0.0641649100604756
llm_goals_53,test,44,0.0300241983796468,0.8074959504603542
llm_goals_53,test,45,0.2774148540189107,0.1813221143349916
llm_goals_53,test,46,0.1855846741477459,0.2352295334667747
llm_goals_53,test,47,0.0763437727942194,0.820244135045574
llm_goals_53,test,48,0.3513624169403929,0.4512817747836695
llm_goals_53,test,49,0.0784143016661606,0.7022675298006026
llm_goals_305,test,0,0.1805087884515928,0.0438240495208372
llm_goals_305,test,1,0.2990334937225582,0.1352509650243347
llm_goals_305,test,2,0.3052631719451498,0.1723536643548477
llm_goals_305,test,3,0.5931365469936355,0.250094549889143
llm_goals_305,test,4,0.8568785216113738,0.8419536365764244
llm_goals_305,test,5,0.4588778095785792,0.1913177614094214
llm_goals_305,test,6,0.2477978862269462,0.3723916849874114
llm_goals_305,test,7,0.3052631719451498,0.3337485526549648
llm_goals_305,test,8,0.818498250915137,0.5824263052609597
llm_goals_305,test,9,0.1805087884515928,0.620184539039364
llm_goals_305,test,10,0.8443229804594178,0.494000537986959
llm_goals_305,test,11,0.2622762107729275,0.0482253546984711
llm_goals_305,test,12,0.0922363552977074,0.0565816635108951
llm_goals_305,test,13,0.2884553173949558,0.1136796894182332
llm_goals_305,test,14,0.8047077018046639,0.6102884358627442
llm_goals_305,test,15,0.818498250915137,0.8302422164176205
llm_goals_305,test,16,0.8133642699678834,0.589511050327059
llm_goals_305,test,17,0.7548630881503642,0.2622011524235305
llm_goals_305,test,18,0.81990385540467,0.3737828315077605
llm_goals_305,test,19,0.8392968122606024,0.0401465973617238
llm_goals_305,test,20,0.8021761784326338,0.8971526617856483
llm_goals_305,test,21,0.5964751652968486,0.513862561708882
llm_goals_305,test,22,0.1805087884515928,0.6617399492970566
llm_goals_305,test,23,0.3500512929889038,0.3090300849059566
llm_goals_305,test,24,0.8028539449859309,0.4310886044152408
llm_goals_305,test,25,0.8443229804594178,0.7346082271960779
llm_goals_305,test,26,0.8028539449859309,0.7784622217319951
llm_goals_305,test,27,0.4580653223916483,0.2285268892180965
llm_goals_305,test,28,0.7195585874756826,0.1970890988987535
llm_goals_305,test,29,0.3301640123172258,0.0543679274789402
llm_goals_305,test,30,0.585765665385881,0.8325365217586828
llm_goals_305,test,31,0.5964751652968486,0.5078524819974076
llm_goals_305,test,32,0.2990334937225582,0.2061603354174771
llm_goals_305,test,33,0.7548630881503642,0.6039954962603894
llm_goals_305,test,34,0.8443229804594178,0.5754865922825898
llm_goals_305,test,35,0.3052631719451498,0.1664152616423
llm_goals_305,test,36,0.8773294673445245,0.7880486291444165
llm_goals_305,test,37,0.8392968122606024,0.03605078558617
llm_goals_305,test,38,0.7882234406988442,0.0575570687729377
llm_goals_305,test,39,0.1871636870372754,0.4297583044645929
llm_goals_305,test,40,0.2283008336290452,0.1915445959084499
llm_goals_305,test,41,0.3618855927231801,0.6536953532364804
llm_goals_305,test,42,0.5789179620147493,0.122527873906398
llm_goals_305,test,43,0.6767153792198894,0.1711906255032107
llm_goals_305,test,44,0.818498250915137,0.8371975999741996
llm_goals_305,test,45,0.7101963205916099,0.3836914756409174
llm_goals_305,test,46,0.3485487644642978,0.0543049670678201
llm_goals_305,test,47,0.7449461766594887,0.5245484205428286
llm_goals_305,test,48,0.8028539449859309,0.5969765977742552
llm_goals_305,test,49,0.2990334937225582,0.2351952691938564
llm_goals_81,test,0,0.4228302540928913,0.2060992725380174
llm_goals_81,test,1,0.5951213288319915,0.1581010259271764
llm_goals_81,test,2,0.8371621336852599,0.6899052301996583
llm_goals_81,test,3,0.6358091124765567,0.7805136989347726
llm_goals_81,test,4,0.4382020083082198,0.0972643506873081
llm_goals_81,test,5,0.4341441230144615,0.3089356066572108
llm_goals_81,test,6,0.6106942907536795,0.0383605574042886
llm_goals_81,test,7,0.7740736484864277,0.3161536190910042
llm_goals_81,test,8,0.5189287165994112,0.5126683642741202
llm_goals_81,test,9,0.2506143228118148,0.1286837550045714
llm_goals_81,test,10,0.4383241310631228,0.1256029490894943
llm_goals_81,test,11,0.4172793832877546,0.408772132619307
llm_goals_81,test,12,0.4382020083082198,0.1214277758013974
llm_goals_81,test,13,0.3644995297484198,0.0409721836992895
llm_goals_81,test,14,0.4295100842515329,0.0827685330888261
llm_goals_81,test,15,0.3365211893688499,0.224678660518271
llm_goals_81,test,16,0.4345081839133936,0.0872837265533343
llm_goals_81,test,17,0.359784750723547,0.2837028272857018
llm_goals_81,test,18,0.2755207263298379,0.1193591553103013
llm_goals_81,test,19,0.4133976789389234,0.4952181327203863
llm_goals_81,test,20,0.4382020083082198,0.2564665599863756
llm_goals_81,test,21,0.5743151491560133,0.2041083994609424
llm_goals_81,test,22,0.8371621336852599,0.3119739178030907
llm_goals_81,test,23,0.2695648342177801,0.0994638293022036
llm_goals_81,test,24,0.2506143228118148,0.1575467450844306
llm_goals_81,test,25,0.4133976789389234,0.0291125673317165
llm_goals_81,test,26,0.6106942907536795,0.0869071714890548
llm_goals_81,test,27,0.3044179081756628,0.1863589895989203
llm_goals_81,test,28,0.8892110006881788,0.119977738469712
llm_goals_81,test,29,0.4133976789389234,0.4410572612602489
llm_goals_81,test,30,0.0463304807014273,0.0555125882985712
llm_goals_81,test,31,0.1002833048402372,0.3486004983652399
llm_goals_81,test,32,0.5309738453980498,0.189941914212834
llm_goals_81,test,33,0.2755207263298379,0.1890390776737304
llm_goals_81,test,34,0.3441463830603157,0.1328217427635933
llm_goals_81,test,35,0.7454944130936314,0.1343397356978365
llm_goals_81,test,36,0.6106942907536795,0.0899701336915993
llm_goals_81,test,37,0.1885774674836381,0.6478431799513802
llm_goals_81,test,38,0.5951213288319915,0.7351879424598803
llm_goals_81,test,39,0.7454944130936314,0.0885373562628188
llm_goals_81,test,40,0.8371621336852599,0.3150516869571108
llm_goals_81,test,41,0.2755207263298379,0.0498826197855212
llm_goals_81,test,42,0.2755207263298379,0.1381899328653333
llm_goals_81,test,43,0.4382020083082198,0.3536647169335493
llm_goals_81,test,44,0.5951213288319915,0.4857917971856136
llm_goals_81,test,45,0.8892110006881788,0.3921515914618259
llm_goals_81,test,46,0.4682762897670633,0.1179764264181158
llm_goals_81,test,47,0.5951213288319915,0.2786576050295211
llm_goals_81,test,48,0.2755207263298379,0.0726556891905063
llm_goals_81,test,49,0.4382020083082198,0.3912461690418435
llm_goals_133,test,0,0.5565640478747458,0.4440529323069227
llm_goals_133,test,1,0.4735361028432665,0.3955848959165448
llm_goals_133,test,2,0.4615075900401043,0.5130030466159122
llm_goals_133,test,3,0.5373515461696827,0.220245744335209
llm_goals_133,test,4,0.7342403631574029,0.5879895213269322
llm_goals_133,test,5,0.3100199536201398,0.8588037554744828
llm_goals_133,test,6,0.6477536585055937,0.8322442189227136
llm_goals_133,test,7,0.4380594485637765,0.6588760518065184
llm_goals_133,test,8,0.1982967539493013,0.5253890103378467
llm_goals_133,test,9,0.1641082835260257,0.8170254264656348
llm_goals_133,test,10,0.5652803716983201,0.4608975636274737
llm_goals_133,test,11,0.5791972190067328,0.2002942757447116
llm_goals_133,test,12,0.5506990563272943,0.4022389740133304
llm_goals_133,test,13,0.4650665833340392,0.8516519653230656
llm_goals_133,test,14,0.1829175998669873,0.0158444788418117
llm_goals_133,test,15,0.577687090509347,0.5978365001716675
llm_goals_133,test,16,0.5373515461696827,0.0529535109452945
llm_goals_133,test,17,0.5731142181661228,0.2556263204518722
llm_goals_133,test,18,0.637382272408275,0.0167466717766424
llm_goals_133,test,19,0.8755572488446913,0.0944244428527934
llm_goals_133,test,20,0.5677876459383606,0.6914976263434149
llm_goals_133,test,21,0.5677876459383606,0.8436048633272258
llm_goals_133,test,22,0.6051744159674504,0.2868007235124719
llm_goals_133,test,23,0.528642401324249,0.1160262834732456
llm_goals_133,test,24,0.6410251280988652,0.0154812210183983
llm_goals_133,test,25,0.5169776748172129,0.3119789757098087
llm_goals_133,test,26,0.6111847074749347,0.7929420521534107
llm_goals_133,test,27,0.5652803716983201,0.2037716603127804
llm_goals_133,test,28,0.3730529657282914,0.3118772754734958
llm_goals_133,test,29,0.4951045041500913,0.1808521166351184
llm_goals_133,test,30,0.7433770353132725,0.5045142070808941
llm_goals_133,test,31,0.7940816848292265,0.8498369503935175
llm_goals_133,test,32,0.5264633877763822,0.2694815541177057
llm_goals_133,test,33,0.624716771090101,0.0177588567715867
llm_goals_133,test,34,0.6156508946501522,0.445395356923409
llm_goals_133,test,35,0.6670648332548883,0.4995371449295338
llm_goals_133,test,36,0.5091253997374466,0.4823747071618506
llm_goals_133,test,37,0.8755572488446913,0.0266815206082507
llm_goals_133,test,38,0.7247332896708099,0.0874820007739646
llm_goals_133,test,39,0.577687090509347,0.3366422826024648
llm_goals_133,test,40,0.6384056763794065,0.2329899847029727
llm_goals_133,test,41,0.8633878775653411,0.8571491285285516
llm_goals_133,test,42,0.561406807467735,0.8193201391590431
llm_goals_133,test,43,0.5677876459383606,0.8422289427227235
llm_goals_133,test,44,0.757959835853425,0.5294372908894646
llm_goals_133,test,45,0.1451710305674921,0.2588603231187393
llm_goals_133,test,46,0.628932476678453,0.2337208499272645
llm_goals_133,test,47,0.5652803716983201,0.1166634693988454
llm_goals_133,test,48,0.1615195746057607,0.6138306242825586
llm_goals_133,test,49,0.4735361028432665,0.2806552214021111
llm_goals_157,test,0,0.0783462237969408,0.6355320308190959
llm_goals_157,test,1,0.21804264559213,0.7424853921670768
llm_goals_157,test,2,0.0814263067820931,0.073314241900373
llm_goals_157,test,3,0.0372321228771999,0.4675850432855137
llm_goals_157,test,4,0.7595899795109367,0.5458627288071527
llm_goals_157,test,5,0.0569230992466332,0.0771889198722071
llm_goals_157,test,6,0.9153426303300908,0.0818153292956077
llm_goals_157,test,7,0.0814263067820931,0.0574362851972565
llm_goals_157,test,8,0.7595899795109367,0.612650525482466
llm_goals_157,test,9,0.1685745373583969,0.025148981997583
llm_goals_157,test,10,0.312217906422823,0.075973919657683
llm_goals_157,test,11,0.1864531636187178,0.1464687737403695
llm_goals_157,test,12,0.4461033337598723,0.7268917489370714
llm_goals_157,test,13,0.050439187536746,0.0531648084509613
llm_goals_157,test,14,0.9048082261859532,0.3299706213737123
llm_goals_157,test,15,0.5634052871942227,0.3043292296967997
llm_goals_157,test,16,0.4531820812338111,0.7463776357566768
llm_goals_157,test,17,0.1758025299476422,0.8521737469617978
llm_goals_157,test,18,0.8425842507542706,0.6376039881194869
llm_goals_157,test,19,0.9234125653424572,0.6077618725185671
llm_goals_157,test,20,0.7595899795109367,0.7242060188576479
llm_goals_157,test,21,0.0569230992466332,0.2051165554994685
llm_goals_157,test,22,0.176650888752814,0.7995715125449558
llm_goals_157,test,23,0.1486055131519092,0.1467023010082007
llm_goals_157,test,24,0.6897299923864526,0.3108830330026099
llm_goals_157,test,25,0.3232493247326294,0.1001087986592319
llm_goals_157,test,26,0.0223185805452163,0.4552169748909065
llm_goals_157,test,27,0.9222837109962984,0.8485816155817194
llm_goals_157,test,28,0.1240315884986272,0.2265082237706469
llm_goals_157,test,29,0.9222837109962984,0.6283476283012512
llm_goals_157,test,30,0.3232493247326294,0.2620283904445711
llm_goals_157,test,31,0.9252827785542556,0.167952021094149
llm_goals_157,test,32,0.0515354020994226,0.0898426790762853
llm_goals_157,test,33,0.4531820812338111,0.5043942365008254
llm_goals_157,test,34,0.2283531207452461,0.0725868476993519
llm_goals_157,test,35,0.1201901175308664,0.1237829648198263
llm_goals_157,test,36,0.312217906422823,0.1925318890375481
llm_goals_157,test,37,0.1730908505000684,0.6842419436738383
llm_goals_157,test,38,0.8425842507542706,0.691649855522258
llm_goals_157,test,39,0.3923387220426743,0.5264401359594252
llm_goals_157,test,40,0.176650888752814,0.1777385641102212
llm_goals_157,test,41,0.1031229144323203,0.0328183379619016
llm_goals_157,test,42,0.0814263067820931,0.1949198629220696
llm_goals_157,test,43,0.0569230992466332,0.135028229661103
llm_goals_157,test,44,0.7595899795109367,0.7258662504199943
llm_goals_157,test,45,0.2460947991192279,0.0935995604675028
llm_goals_157,test,46,0.9130041620828326,0.15418174898882
llm_goals_157,test,47,0.1286272537506674,0.3212815335896988
llm_goals_157,test,48,0.0223185805452163,0.2795304252191649
llm_goals_157,test,49,0.9381590468640992,0.7371862441831876
llm_goals_186,test,0,0.4336933985578946,0.0367510709036243
llm_goals_186,test,1,0.6846354592328173,0.9589190483469818
llm_goals_186,test,2,0.0354654024831296,0.0667798014228945
llm_goals_186,test,3,0.0339571980439711,0.0340377111776925
llm_goals_186,test,4,0.4995946134717398,0.4002710909538108
llm_goals_186,test,5,0.7939310091927139,0.8817241785963961
llm_goals_186,test,6,0.6135118683009005,0.8798493094453552
llm_goals_186,test,7,0.0312895724186952,0.0443878504309986
llm_goals_186,test,8,0.5334179391759133,0.4415592471567901
llm_goals_186,test,9,0.4732664620081865,0.8847759344734797
llm_goals_186,test,10,0.9221743361633394,0.8905032311770802
llm_goals_186,test,11,0.6479504598100597,0.704948600699243
llm_goals_186,test,12,0.238718908682272,0.409597002882604
llm_goals_186,test,13,0.9119794373568232,0.8867287662434378
llm_goals_186,test,14,0.7657676235890271,0.8128145923588551
llm_goals_186,test,15,0.9221743361633394,0.4832503599366539
llm_goals_186,test,16,0.8176556820590867,0.8267478910426029
llm_goals_186,test,17,0.96109086115056,0.957207678971151
llm_goals_186,test,18,0.7542500554048902,0.7610878868091969
llm_goals_186,test,19,0.9411737322921556,0.7872715543385574
llm_goals_186,test,20,0.4014151639709504,0.520514563098938
llm_goals_186,test,21,0.5087158599751345,0.9084513175350956
llm_goals_186,test,22,0.937802374748769,0.9157385254478472
llm_goals_186,test,23,0.0339571980439711,0.5585242484052028
llm_goals_186,test,24,0.7596032678663496,0.8535531187105866
llm_goals_186,test,25,0.8118659261554929,0.8466653814359101
llm_goals_186,test,26,0.3559589332267844,0.8550637970014335
llm_goals_186,test,27,0.00565756454283,0.9398175480710378
llm_goals_186,test,28,0.00565756454283,0.0028363068023126
llm_goals_186,test,29,0.9503903386952036,0.8305997204848772
llm_goals_186,test,30,0.90624916893406,0.8987706923113074
llm_goals_186,test,31,0.1684757359126464,0.8880043621770078
llm_goals_186,test,32,0.4941535564804269,0.4759852559635721
llm_goals_186,test,33,0.8176556820590867,0.8450176079466206
llm_goals_186,test,34,0.90624916893406,0.9532899841201126
llm_goals_186,test,35,0.9221743361633394,0.0290458993492998
llm_goals_186,test,36,0.9482841502140676,0.9324312223548752
llm_goals_186,test,37,0.293536528811936,0.7062064442252718
llm_goals_186,test,38,0.1773508218908928,0.8475385890175953
llm_goals_186,test,39,0.2328268384729269,0.2451742937665777
llm_goals_186,test,40,0.4564049146706294,0.7628755019143414
llm_goals_186,test,41,0.4957187924324231,0.9118681525061464
llm_goals_186,test,42,0.0312895724186952,0.0299416334392138
llm_goals_186,test,43,0.3391990099144478,0.9088531704037304
llm_goals_186,test,44,0.4995946134717398,0.399223879564458
llm_goals_186,test,45,0.0339571980439711,0.0207412737387863
llm_goals_186,test,46,0.6558317450565913,0.504435185656878
llm_goals_186,test,47,0.1469645444882704,0.0426878976387859
llm_goals_186,test,48,0.7145774914179392,0.8374391175680358
llm_goals_186,test,49,0.0339571980439711,0.9286286845568336
llm_goals_401,test,0,0.7863369521126703,0.9617876405899952
llm_goals_401,test,1,0.7439671736320099,0.9404490002093446
llm_goals_401,test,2,0.8667969053526042,0.935046673136648
llm_goals_401,test,3,0.9337686880348648,0.9543637645078082
llm_goals_401,test,4,0.946974219057266,0.9660480618061604
llm_goals_401,test,5,0.7219743698489822,0.9211199313115676
llm_goals_401,test,6,0.9008229963730972,0.902884063341732
llm_goals_401,test,7,0.8728883316136806,0.94729781169548
llm_goals_401,test,8,0.8375141061262869,0.957207800210959
llm_goals_401,test,9,0.7916501782379012,0.9145740305533586
llm_goals_401,test,10,0.4902341779024117,0.9267561414021268
llm_goals_401,test,11,0.9387537272591148,0.9242701512661912
llm_goals_401,test,12,0.7391555900846996,0.8435903191618971
llm_goals_401,test,13,0.7916501782379012,0.938192186231483
llm_goals_401,test,14,0.0651084992169716,0.8529976602342201
llm_goals_401,test,15,0.807659382108495,0.9478884329856586
llm_goals_401,test,16,0.3738782431870421,0.8192354997719525
llm_goals_401,test,17,0.6898250478249688,0.6739075253562599
llm_goals_401,test,18,0.0651084992169716,0.5197439125792754
llm_goals_401,test,19,0.8848334589592229,0.8583977843568281
llm_goals_401,test,20,0.946974219057266,0.9455993763925636
llm_goals_401,test,21,0.7916501782379012,0.9705763460601288
llm_goals_401,test,22,0.7368937076184147,0.8491748031226035
llm_goals_401,test,23,0.5908154284892033,0.8515620190775874
llm_goals_401,test,24,0.5180705780131046,0.9138265832467732
llm_goals_401,test,25,0.6939721050426017,0.9028179661562172
llm_goals_401,test,26,0.0651084992169716,0.9558187125982178
llm_goals_401,test,27,0.9138558536230216,0.5612720368847214
llm_goals_401,test,28,0.9550225153217524,0.9617025244944858
llm_goals_401,test,29,0.9314229508184668,0.8060652645257104
llm_goals_401,test,30,0.6008065213642175,0.8896843204884566
llm_goals_401,test,31,0.8112394201361149,0.9526923309875832
llm_goals_401,test,32,0.8728883316136806,0.8506568677811456
llm_goals_401,test,33,0.9238893388741336,0.7802594846608962
llm_goals_401,test,34,0.6008065213642175,0.8870658880824575
llm_goals_401,test,35,0.145455989224729,0.954492271718892
llm_goals_401,test,36,0.5215939886684695,0.562048146808884
llm_goals_401,test,37,0.6761473930538705,0.7781126533121301
llm_goals_401,test,38,0.965764344547288,0.8591165497422784
llm_goals_401,test,39,0.7391555900846996,0.8788934372485709
llm_goals_401,test,40,0.7415889395930976,0.8091102829935539
llm_goals_401,test,41,0.8112394201361149,0.8675616408909181
llm_goals_401,test,42,0.7368937076184147,0.949993671778176
llm_goals_401,test,43,0.6549488918491664,0.9467448581700896
llm_goals_401,test,44,0.6204808358681347,0.8687242293966851
llm_goals_401,test,45,0.877935830071381,0.9587250339741858
llm_goals_401,test,46,0.0517036516892024,0.860452357605835
llm_goals_401,test,47,0.877935830071381,0.9253614550163576
llm_goals_401,test,48,0.5180705780131046,0.8647797053472309
llm_goals_401,test,49,0.1843094790753896,0.9454760570818088
llm_goals_420,test,0,0.1485906331645086,0.9711560599789952
llm_goals_420,test,1,0.1205526689007503,0.5978053926454786
llm_goals_420,test,2,0.0828958531504863,0.0817351976918742
llm_goals_420,test,3,0.4069102433750707,0.4730792485055278
llm_goals_420,test,4,0.091250402741408,0.8487827178347965
llm_goals_420,test,5,0.0617805128847267,0.1386299974231985
llm_goals_420,test,6,0.0824888690681105,0.9677888754301456
llm_goals_420,test,7,0.0709780031061163,0.9193048504515688
llm_goals_420,test,8,0.0995608432312768,0.1105940972856699
llm_goals_420,test,9,0.0566124968327034,0.0770199238560772
llm_goals_420,test,10,0.5998317535392524,0.6569762799970394
llm_goals_420,test,11,0.399091407660941,0.4533228613613927
llm_goals_420,test,12,0.2930435520753158,0.9317349816078236
llm_goals_420,test,13,0.1147954999486181,0.5042190525433249
llm_goals_420,test,14,0.4310380141590855,0.1440102415442949
llm_goals_420,test,15,0.5042871289899089,0.3273024402815145
llm_goals_420,test,16,0.2693030962500474,0.3681827771891491
llm_goals_420,test,17,0.2819553737369308,0.4632337459639504
llm_goals_420,test,18,0.1695377908104262,0.0396023029282074
llm_goals_420,test,19,0.0650385587833518,0.1093558671361818
llm_goals_420,test,20,0.0840070493556492,0.0396252534530884
llm_goals_420,test,21,0.0617805128847267,0.0465700238365722
llm_goals_420,test,22,0.0566124968327034,0.1916998836408959
llm_goals_420,test,23,0.1621031946707599,0.1681177802630551
llm_goals_420,test,24,0.4310380141590855,0.1698145969501656
llm_goals_420,test,25,0.0992987034824843,0.9829779862454848
llm_goals_420,test,26,0.1205526689007503,0.0308922007548325
llm_goals_420,test,27,0.9359520080851612,0.8125830946093627
llm_goals_420,test,28,0.0966441586880585,0.9367654930611784
llm_goals_420,test,29,0.0992987034824843,0.8184437096518178
llm_goals_420,test,30,0.2261968362574368,0.9386603865018432
llm_goals_420,test,31,0.0837476365840152,0.10851579640767
llm_goals_420,test,32,0.2395269868368465,0.9666374926215946
llm_goals_420,test,33,0.4310380141590855,0.8901044715204638
llm_goals_420,test,34,0.1119416402501169,0.9215939624410928
llm_goals_420,test,35,0.2580454920543706,0.5267802921981926
llm_goals_420,test,36,0.3576393970363523,0.092175658510858
llm_goals_420,test,37,0.0971818769757534,0.984362841437198
llm_goals_420,test,38,0.1205526689007503,0.8828047505171253
llm_goals_420,test,39,0.5042871289899089,0.2972862903877061
llm_goals_420,test,40,0.269241496812478,0.0444444838151291
llm_goals_420,test,41,0.7011712774886035,0.5478361768565629
llm_goals_420,test,42,0.0650385587833518,0.0713350995649345
llm_goals_420,test,43,0.1898323092140799,0.5106248261137879
llm_goals_420,test,44,0.1153403722345664,0.0905225225380096
llm_goals_420,test,45,0.3738345228092032,0.1531352912609338
llm_goals_420,test,46,0.4371699367930793,0.1216667665904784
llm_goals_420,test,47,0.1205526689007503,0.1240460201984882
llm_goals_420,test,48,0.0507155938401335,0.0596825371886435
llm_goals_420,test,49,0.1190877810943412,0.8335117138475971
llm_goals_263,test,0,0.6776762646513192,0.5209935935366439
llm_goals_263,test,1,0.1267481253519941,0.7968068746445729
llm_goals_263,test,2,0.5976834724507879,0.5467470232144288
llm_goals_263,test,3,0.7607498838950161,0.4733215007319302
llm_goals_263,test,4,0.9640305052699052,0.0057083956844275
llm_goals_263,test,5,0.9299717542784812,0.3493473596509424
llm_goals_263,test,6,0.2034389932018933,0.8201550249820808
llm_goals_263,test,7,0.9553758496329314,0.6557906816477753
llm_goals_263,test,8,0.0418388406745819,0.7543426271500917
llm_goals_263,test,9,0.2141915407616659,0.2009829696053626
llm_goals_263,test,10,0.9104680448266804,0.8489753664207734
llm_goals_263,test,11,0.8079909077919698,0.652436611134806
llm_goals_263,test,12,0.0061883822381932,0.8143466734577086
llm_goals_263,test,13,0.7963205008526529,0.4245607212842352
llm_goals_263,test,14,0.0042226261635514,0.0036452536113296
llm_goals_263,test,15,0.7963205008526529,0.0558692673280436
llm_goals_263,test,16,0.4443747892500168,0.0066133854077101
llm_goals_263,test,17,0.392557434696656,0.7648655133279786
llm_goals_263,test,18,0.0042226261635514,0.006651634113929
llm_goals_263,test,19,0.8380733188431599,0.0487544569045993
llm_goals_263,test,20,0.0418388406745819,0.0331700030843074
llm_goals_263,test,21,0.2034389932018933,0.2223244924357846
llm_goals_263,test,22,0.2141915407616659,0.8850367693524676
llm_goals_263,test,23,0.8640320351137547,0.6136206316393849
llm_goals_263,test,24,0.3749073687679352,0.0103991722036265
llm_goals_263,test,25,0.576321551323993,0.7490420921699364
llm_goals_263,test,26,0.765605378821981,0.0149267434716544
llm_goals_263,test,27,0.3384422929161462,0.7989164572724189
llm_goals_263,test,28,0.8585939970346969,0.6376088146659757
llm_goals_263,test,29,0.6740715513347942,0.0419343519282845
llm_goals_263,test,30,0.9293553828782244,0.8598701912381717
llm_goals_263,test,31,0.2034389932018933,0.168156003178124
llm_goals_263,test,32,0.6449929441390178,0.6210063725022936
llm_goals_263,test,33,0.8862534201255484,0.0062242916440703
llm_goals_263,test,34,0.863605434539384,0.5691545063377933
llm_goals_263,test,35,0.7963205008526529,0.7982008481236453
llm_goals_263,test,36,0.8107373142653842,0.763706617142148
llm_goals_263,test,37,0.5142578531809273,0.0342430752915087
llm_goals_263,test,38,0.6740715513347942,0.1222660265497154
llm_goals_263,test,39,0.7963205008526529,0.8269810089104592
llm_goals_263,test,40,0.765605378821981,0.5318831885299807
llm_goals_263,test,41,0.2190331835170901,0.3207528198494705
llm_goals_263,test,42,0.9164858431589084,0.4801431121790341
llm_goals_263,test,43,0.392557434696656,0.1981375631842198
llm_goals_263,test,44,0.8148687425202055,0.1080272425734687
llm_goals_263,test,45,0.5404447417204341,0.8354177467829539
llm_goals_263,test,46,0.7844108293333867,0.7413273974280716
llm_goals_263,test,47,0.9545734531900784,0.4918597295945824
llm_goals_263,test,48,0.2190331835170901,0.0043793883332247
llm_goals_263,test,49,0.8409059630212835,0.949535011062065
llm_goals_427,test,0,0.5713707051015661,0.2826418194423331
llm_goals_427,test,1,0.6073077391483352,0.380977464557011
llm_goals_427,test,2,0.6566506570860212,0.1487359361961987
llm_goals_427,test,3,0.4982867147773139,0.3576580711889061
llm_goals_427,test,4,0.8032749895536592,0.2270212997591984
llm_goals_427,test,5,0.6054988551888812,0.2711625929555684
llm_goals_427,test,6,0.5694953095962108,0.1402530886796432
llm_goals_427,test,7,0.4401182180703035,0.2935996266753878
llm_goals_427,test,8,0.428517818910498,0.2137670314614922
llm_goals_427,test,9,0.5869846748936872,0.2160041132788326
llm_goals_427,test,10,0.6073077391483352,0.3669200145460971
llm_goals_427,test,11,0.6887739383819812,0.1516882402250043
llm_goals_427,test,12,0.5788952228758855,0.1475453757541205
llm_goals_427,test,13,0.5007305102582656,0.1350458405109811
llm_goals_427,test,14,0.5523927265078112,0.2337964230636721
llm_goals_427,test,15,0.6424094473488955,0.3115728193455654
llm_goals_427,test,16,0.6782998908404376,0.131520745523965
llm_goals_427,test,17,0.6073077391483352,0.3278496493117007
llm_goals_427,test,18,0.6073077391483352,0.3527567015929387
llm_goals_427,test,19,0.4304399117523007,0.2313815817463674
llm_goals_427,test,20,0.8032749895536592,0.3221674001172885
llm_goals_427,test,21,0.5869846748936872,0.2494982149574568
llm_goals_427,test,22,0.6073077391483352,0.3779860883941361
llm_goals_427,test,23,0.5175371639168399,0.3509138567308049
llm_goals_427,test,24,0.7118155252951827,0.1946130607095621
llm_goals_427,test,25,0.5713707051015661,0.228222711067827
llm_goals_427,test,26,0.6073077391483352,0.2768263295001016
llm_goals_427,test,27,0.5510286116084943,0.2199474495731038
llm_goals_427,test,28,0.8087093770804943,0.1579098434370231
llm_goals_427,test,29,0.6156429133973852,0.069843346359134
llm_goals_427,test,30,0.6073077391483352,0.5359787931933129
llm_goals_427,test,31,0.5232208808531932,0.1293182240484197
llm_goals_427,test,32,0.7029448112645272,0.2396093502744168
llm_goals_427,test,33,0.7118155252951827,0.1913976476875258
llm_goals_427,test,34,0.6073077391483352,0.4990200469731286
llm_goals_427,test,35,0.7272993887231526,0.357807030322738
llm_goals_427,test,36,0.7772736437515961,0.2580007688260685
llm_goals_427,test,37,0.4304399117523007,0.4031150735356658
llm_goals_427,test,38,0.748727669024795,0.2737247490124149
llm_goals_427,test,39,0.7376905590332256,0.2478362318668904
llm_goals_427,test,40,0.6887739383819812,0.5026721270474518
llm_goals_427,test,41,0.2459654578933983,0.2273186194850299
llm_goals_427,test,42,0.5523927265078112,0.4444071308114509
llm_goals_427,test,43,0.8032749895536592,0.2369720640870139
llm_goals_427,test,44,0.6424094473488955,0.3961639877527012
llm_goals_427,test,45,0.5528802340524328,0.2771055535106792
llm_goals_427,test,46,0.7103030662279873,0.3138421601355035
llm_goals_427,test,47,0.5232208808531932,0.3609031182529178
llm_goals_427,test,48,0.6624252868858688,0.1899314535085168
llm_goals_427,test,49,0.8032749895536592,0.4452677872765214
llm_goals_449,test,0,0.0056046171824915,0.0338418398422384
llm_goals_449,test,1,0.0164553082726881,0.5657697432527007
llm_goals_449,test,2,0.014296299179854,0.0110135668657682
llm_goals_449,test,3,0.089781288450469,0.2352946829974157
llm_goals_449,test,4,0.2124827131554247,0.4842577903424374
llm_goals_449,test,5,0.035688032759858,0.3485549555066181
llm_goals_449,test,6,0.035688032759858,0.0519669241570106
llm_goals_449,test,7,0.0056046171824915,0.0031269987549636
llm_goals_449,test,8,0.4524205580452488,0.2974090419757364
llm_goals_449,test,9,0.033362502954134,0.0925536782452943
llm_goals_449,test,10,0.0424244123837647,0.4386853694122202
llm_goals_449,test,11,0.0057265965453231,0.0063782741293255
llm_goals_449,test,12,0.0164553082726881,0.0714949969968408
llm_goals_449,test,13,0.033362502954134,0.0227751515807358
llm_goals_449,test,14,0.0377303816794924,0.3195753835685478
llm_goals_449,test,15,0.3929103217797158,0.2420638006790782
llm_goals_449,test,16,0.0377303816794924,0.0953277975239941
llm_goals_449,test,17,0.1648128551188873,0.5835221517250182
llm_goals_449,test,18,0.0377303816794924,0.1603112674891041
llm_goals_449,test,19,0.0672539165472731,0.6833613521345718
llm_goals_449,test,20,0.3929103217797158,0.4549636770044163
llm_goals_449,test,21,0.033362502954134,0.1579551412473356
llm_goals_449,test,22,0.0179707288335267,0.4400750405221786
llm_goals_449,test,23,0.0965475237955836,0.0251530775884869
llm_goals_449,test,24,0.0640522620126655,0.2695772384712642
llm_goals_449,test,25,0.0320702264639532,0.4519585097229938
llm_goals_449,test,26,0.0098760429723072,0.1123650856049343
llm_goals_449,test,27,0.0056717697453615,0.4873581137262729
llm_goals_449,test,28,0.0527904568201065,0.1751834751469549
llm_goals_449,test,29,0.0318478788815457,0.5804994670396382
llm_goals_449,test,30,0.3014946579584649,0.4626257946707522
llm_goals_449,test,31,0.035688032759858,0.093699276239858
llm_goals_449,test,32,0.1221885399547325,0.0067638379987912
llm_goals_449,test,33,0.0680797399204515,0.1681834079617312
llm_goals_449,test,34,0.3014946579584649,0.3493466516790004
llm_goals_449,test,35,0.0591786777300795,0.0068633490722964
llm_goals_449,test,36,0.3014946579584649,0.3064552348162913
llm_goals_449,test,37,0.0757827903554717,0.6652150761082033
llm_goals_449,test,38,0.1219735311293245,0.6741024889471738
llm_goals_449,test,39,0.1670135052346957,0.0101379083480811
llm_goals_449,test,40,0.082199213684588,0.0089588521989727
llm_goals_449,test,41,0.033362502954134,0.1780122280374072
llm_goals_449,test,42,0.0184825379300489,0.0051090174127486
llm_goals_449,test,43,0.035688032759858,0.2498444495344637
llm_goals_449,test,44,0.3929103217797158,0.221646438441774
llm_goals_449,test,45,0.1580097380395529,0.2094790944562388
llm_goals_449,test,46,0.0638928303931767,0.0060341568900946
llm_goals_449,test,47,0.1520903879586116,0.1241710666090617
llm_goals_449,test,48,0.0104754527863168,0.1338989075405874
llm_goals_449,test,49,0.0164553082726881,0.5982472498607049
llm_goals_93,test,0,0.0426636920225072,0.0729546648027557
llm_goals_93,test,1,0.8815204469587139,0.6981648167380458
llm_goals_93,test,2,0.9515972148445884,0.3318565449695651
llm_goals_93,test,3,0.097366020739123,0.5505450337981316
llm_goals_93,test,4,0.9706472756119192,0.9547701486411684
llm_goals_93,test,5,0.0335113156667642,0.8378989133869518
llm_goals_93,test,6,0.8307812228023245,0.8645678173925403
llm_goals_93,test,7,0.1073135505271563,0.8034776985663136
llm_goals_93,test,8,0.9392359864361162,0.9139015687588464
llm_goals_93,test,9,0.6666164297592857,0.84076714934408
llm_goals_93,test,10,0.1129182347357881,0.6739811171843284
llm_goals_93,test,11,0.9688890574402698,0.1039005746210211
llm_goals_93,test,12,0.3999482314102984,0.4267719606730696
llm_goals_93,test,13,0.9688890574402698,0.8366404177501517
llm_goals_93,test,14,0.910742818660624,0.51043302648597
llm_goals_93,test,15,0.9715423591104266,0.9305120134073452
llm_goals_93,test,16,0.910742818660624,0.3610424966705102
llm_goals_93,test,17,0.0125600399682643,0.6383014796360676
llm_goals_93,test,18,0.606306088644602,0.7718638733110297
llm_goals_93,test,19,0.1320570685347709,0.6413577201238602
llm_goals_93,test,20,0.9706472756119192,0.9315750038397262
llm_goals_93,test,21,0.8307812228023245,0.959779321458113
llm_goals_93,test,22,0.9060359024985812,0.8212707656396169
llm_goals_93,test,23,0.9622903470750708,0.0620020892855925
llm_goals_93,test,24,0.910742818660624,0.6707394124648912
llm_goals_93,test,25,0.1669873859328807,0.8513622881275814
llm_goals_93,test,26,0.4299214811349275,0.9295520797235572
llm_goals_93,test,27,0.8975709697035651,0.731125599089208
llm_goals_93,test,28,0.8975709697035651,0.6387209955509132
llm_goals_93,test,29,0.8815204469587139,0.904010833763946
llm_goals_93,test,30,0.696378105977604,0.6688304494781727
llm_goals_93,test,31,0.5776887088548034,0.7246857956085144
llm_goals_93,test,32,0.9710434667176536,0.8395389979928227
llm_goals_93,test,33,0.9318573487453734,0.4902935277900161
llm_goals_93,test,34,0.0502040827449859,0.5478889802411547
llm_goals_93,test,35,0.1779745652597602,0.8178324059837278
llm_goals_93,test,36,0.8792646582658749,0.8865698576591567
llm_goals_93,test,37,0.2493038936578456,0.9194802654649477
llm_goals_93,test,38,0.2318551112352574,0.8798558779688433
llm_goals_93,test,39,0.856287723280563,0.2399301633758412
llm_goals_93,test,40,0.0303528114124786,0.946265162703226
llm_goals_93,test,41,0.7812671062189973,0.8435175392494392
llm_goals_93,test,42,0.0668360918752532,0.260949780916787
llm_goals_93,test,43,0.8307812228023245,0.8190814792570137
llm_goals_93,test,44,0.910742818660624,0.951412738003951
llm_goals_93,test,45,0.6095091773111799,0.5085180485155563
llm_goals_93,test,46,0.8612556424658604,0.946404217454057
llm_goals_93,test,47,0.9060359024985812,0.5778150570910173
llm_goals_93,test,48,0.910742818660624,0.6859809771933842
llm_goals_93,test,49,0.0148001342101651,0.6187362092588319
llm_goals_358,test,0,0.8862895992627853,0.9198604804287828
llm_goals_358,test,1,0.6496964624809618,0.8623428941495346
llm_goals_358,test,2,0.9105174572947344,0.8146633538972576
llm_goals_358,test,3,0.8909326173012295,0.6635203414505186
llm_goals_358,test,4,0.8847048284084934,0.9873765704706148
llm_goals_358,test,5,0.91599506392778,0.8085697334742067
llm_goals_358,test,6,0.9258835350644146,0.8449593731392603
llm_goals_358,test,7,0.9105174572947344,0.7802023295414534
llm_goals_358,test,8,0.9594003549902568,0.5598487865057791
llm_goals_358,test,9,0.8160151800598606,0.7689259718491731
llm_goals_358,test,10,0.7427057069869437,0.4090564458803354
llm_goals_358,test,11,0.923280534594948,0.7281676519766522
llm_goals_358,test,12,0.7465694018308758,0.781706684015145
llm_goals_358,test,13,0.8533648229666596,0.6175350663762746
llm_goals_358,test,14,0.1095177143196853,0.1259366314847969
llm_goals_358,test,15,0.9867305163934316,0.9665391433681092
llm_goals_358,test,16,0.673011711690823,0.0977212357476949
llm_goals_358,test,17,0.5040878547351685,0.839291034278836
llm_goals_358,test,18,0.8189191165037518,0.0422931239637008
llm_goals_358,test,19,0.6274226353756172,0.3805861792548485
llm_goals_358,test,20,0.987455964400792,0.972559035375534
llm_goals_358,test,21,0.8533648229666596,0.7844216881478699
llm_goals_358,test,22,0.8189191165037518,0.8432835924874589
llm_goals_358,test,23,0.1975316506481061,0.5831400725193898
llm_goals_358,test,24,0.1095177143196853,0.4717356494812245
llm_goals_358,test,25,0.0287550849782554,0.5591997574513735
llm_goals_358,test,26,0.4094259949204003,0.2416094818565881
llm_goals_358,test,27,0.8653954219334247,0.8557277309389357
llm_goals_358,test,28,0.8909326173012295,0.7784201381020285
llm_goals_358,test,29,0.5618304680525681,0.9848793746115032
llm_goals_358,test,30,0.1651701336237502,0.6211451382223804
llm_goals_358,test,31,0.8533648229666596,0.3507967043222499
llm_goals_358,test,32,0.1491359814727031,0.670993868258675
llm_goals_358,test,33,0.673011711690823,0.0563775762088827
llm_goals_358,test,34,0.1542949739466754,0.4923522105012786
llm_goals_358,test,35,0.9105174572947344,0.8157534628947803
llm_goals_358,test,36,0.0141346750233268,0.7491294702469764
llm_goals_358,test,37,0.0429859253621814,0.5478990059483921
llm_goals_358,test,38,0.2078923051785218,0.9873113036659013
llm_goals_358,test,39,0.7465694018308758,0.6807296173615788
llm_goals_358,test,40,0.8189191165037518,0.6446558925323718
llm_goals_358,test,41,0.1892427479012722,0.3360622093964198
llm_goals_358,test,42,0.8407836619464183,0.6737437200032999
llm_goals_358,test,43,0.8533648229666596,0.453765234769123
llm_goals_358,test,44,0.7243406662597518,0.921309112250278
llm_goals_358,test,45,0.7243406662597518,0.5133269325272689
llm_goals_358,test,46,0.7555418027658395,0.7619134214235583
llm_goals_358,test,47,0.8987152012602471,0.5260478340890856
llm_goals_358,test,48,0.1095177143196853,0.0910570466126295
llm_goals_358,test,49,0.8653954219334247,0.4710935988277175
