template_id,split,question_idx,prediction,label
advanced_ai_risk_171,test,0,0.5,0.749917739768546
advanced_ai_risk_171,test,1,0.0,0.7093868843679405
advanced_ai_risk_171,test,2,0.5,0.1450037113804176
advanced_ai_risk_171,test,3,0.5,0.7816435059867852
advanced_ai_risk_171,test,4,0.5,0.2206475808478134
advanced_ai_risk_171,test,5,0.85,0.2056270831511363
advanced_ai_risk_171,test,6,0.0,0.1087111517819288
advanced_ai_risk_171,test,7,0.5,0.1630811744645867
advanced_ai_risk_171,test,8,0.5,0.2547306149585515
advanced_ai_risk_171,test,9,0.5,0.6140816817958692
advanced_ai_risk_323,test,0,0.85,0.7084648532788688
advanced_ai_risk_323,test,1,0.5,0.0515227603299409
advanced_ai_risk_323,test,2,0.5,0.1816013824459031
advanced_ai_risk_323,test,3,0.5,0.0515695466842274
advanced_ai_risk_323,test,4,1.0,0.112967862525113
advanced_ai_risk_323,test,5,0.5,0.2422227931163688
advanced_ai_risk_323,test,6,1.0,0.2298868074050068
advanced_ai_risk_323,test,7,0.5,0.1792392599115136
advanced_ai_risk_323,test,8,0.5,0.1402908630507384
advanced_ai_risk_323,test,9,0.5,0.1743866244814894
advanced_ai_risk_354,test,0,0.85,0.84584337476994
advanced_ai_risk_354,test,1,0.85,0.7285223558045504
advanced_ai_risk_354,test,2,0.85,0.8823118193780068
advanced_ai_risk_354,test,3,0.5,0.0925026745177683
advanced_ai_risk_354,test,4,0.85,0.8901153212033792
advanced_ai_risk_354,test,5,0.75,0.1158001392767786
advanced_ai_risk_354,test,6,0.5,0.1002863652905259
advanced_ai_risk_354,test,7,0.85,0.841312048441778
advanced_ai_risk_354,test,8,0.85,0.8763897444366863
advanced_ai_risk_354,test,9,0.75,0.064347154658994
advanced_ai_risk_157,test,0,0.5,0.3284855548997409
advanced_ai_risk_157,test,1,0.85,0.2215767473348321
advanced_ai_risk_157,test,2,0.5,0.3149888977640667
advanced_ai_risk_157,test,3,0.5,0.3486925995515152
advanced_ai_risk_157,test,4,0.5,0.0318496177548756
advanced_ai_risk_157,test,5,0.5,0.1334526531588901
advanced_ai_risk_157,test,6,0.5,0.0485999871090833
advanced_ai_risk_157,test,7,0.5,0.0459631064134595
advanced_ai_risk_157,test,8,0.5,0.223249382949463
advanced_ai_risk_157,test,9,0.75,0.3039941612392475
advanced_ai_risk_172,test,0,0.5,0.7046081463463193
advanced_ai_risk_172,test,1,0.5,0.443786589179577
advanced_ai_risk_172,test,2,0.5,0.6989349728888364
advanced_ai_risk_172,test,3,0.5,0.7305717957021973
advanced_ai_risk_172,test,4,0.5,0.8664826188276701
advanced_ai_risk_172,test,5,0.5,0.6067982438499778
advanced_ai_risk_172,test,6,0.5,0.756539531826784
advanced_ai_risk_172,test,7,0.5,0.6791871168433405
advanced_ai_risk_172,test,8,0.5,0.8204570435241525
advanced_ai_risk_172,test,9,0.5,0.8637145167307284
advanced_ai_risk_52,test,0,0.5,0.2571573422199545
advanced_ai_risk_52,test,1,0.5,0.3223893826526271
advanced_ai_risk_52,test,2,0.5,0.4273454291133342
advanced_ai_risk_52,test,3,0.5,0.4127000818379591
advanced_ai_risk_52,test,4,0.5,0.5511583601471768
advanced_ai_risk_52,test,5,0.5,0.6465386698290189
advanced_ai_risk_52,test,6,0.5,0.8328779983104988
advanced_ai_risk_52,test,7,0.5,0.4044219785009506
advanced_ai_risk_52,test,8,0.5,0.7413265578839795
advanced_ai_risk_52,test,9,0.7,0.7552608215926637
advanced_ai_risk_41,test,0,0.5,0.3890238966612711
advanced_ai_risk_41,test,1,0.85,0.3878157300847409
advanced_ai_risk_41,test,2,0.9,0.5504347534914137
advanced_ai_risk_41,test,3,0.85,0.2172239345931071
advanced_ai_risk_41,test,4,0.5,0.4804783261968243
advanced_ai_risk_41,test,5,1.0,0.5298206884566583
advanced_ai_risk_41,test,6,0.5,0.0733845080914252
advanced_ai_risk_41,test,7,0.85,0.4422811346295671
advanced_ai_risk_41,test,8,0.75,0.2578015770630915
advanced_ai_risk_41,test,9,0.9,0.6323390492368901
advanced_ai_risk_320,test,0,0.5,0.0940320115236752
advanced_ai_risk_320,test,1,0.5,0.524922426929311
advanced_ai_risk_320,test,2,0.0,0.0090211214223342
advanced_ai_risk_320,test,3,0.0,0.0164466401713322
advanced_ai_risk_320,test,4,0.5,0.3655678321976019
advanced_ai_risk_320,test,5,0.0,0.2029925954281426
advanced_ai_risk_320,test,6,0.5,0.5235702226731387
advanced_ai_risk_320,test,7,0.5,0.0254208660504611
advanced_ai_risk_320,test,8,0.5,0.2815138268161927
advanced_ai_risk_320,test,9,0.5,0.4132800130332631
advanced_ai_risk_74,test,0,0.75,0.6900779623555316
advanced_ai_risk_74,test,1,0.5,0.2671076797589446
advanced_ai_risk_74,test,2,0.5,0.1720968645129164
advanced_ai_risk_74,test,3,0.5,0.1311473444944407
advanced_ai_risk_74,test,4,0.2,0.416577669247882
advanced_ai_risk_74,test,5,0.5,0.3382494965269231
advanced_ai_risk_74,test,6,0.5,0.2858632836985272
advanced_ai_risk_74,test,7,0.85,0.7243427602050816
advanced_ai_risk_74,test,8,0.5,0.0945051397518864
advanced_ai_risk_74,test,9,0.5,0.5789892562124825
advanced_ai_risk_209,test,0,0.5,0.0258327011963276
advanced_ai_risk_209,test,1,0.5,0.0110588556673786
advanced_ai_risk_209,test,2,0.5,0.0207756162225135
advanced_ai_risk_209,test,3,0.5,0.007448549767787
advanced_ai_risk_209,test,4,0.5,0.0208915782283878
advanced_ai_risk_209,test,5,0.5,0.0653894659885365
advanced_ai_risk_209,test,6,0.5,0.0565976650552258
advanced_ai_risk_209,test,7,0.5,0.0275826769407118
advanced_ai_risk_209,test,8,0.5,0.0149836146040753
advanced_ai_risk_209,test,9,0.5,0.0764361115850517
advanced_ai_risk_39,test,0,0.5,0.2151052386154172
advanced_ai_risk_39,test,1,0.5,0.3307742405355203
advanced_ai_risk_39,test,2,0.5,0.3962074148328525
advanced_ai_risk_39,test,3,0.5,0.262042572071423
advanced_ai_risk_39,test,4,0.0,0.1997722909186944
advanced_ai_risk_39,test,5,0.0,0.5235876990064018
advanced_ai_risk_39,test,6,0.5,0.1404412252028272
advanced_ai_risk_39,test,7,0.5,0.3569446279553126
advanced_ai_risk_39,test,8,0.5,0.2411613341705136
advanced_ai_risk_39,test,9,0.5,0.4582855998917046
advanced_ai_risk_34,test,0,0.5,0.0495161122259385
advanced_ai_risk_34,test,1,0.7,0.0417341330170174
advanced_ai_risk_34,test,2,0.5,0.0400585960742452
advanced_ai_risk_34,test,3,0.5,0.1007466843409271
advanced_ai_risk_34,test,4,0.5,0.142735591647948
advanced_ai_risk_34,test,5,0.5,0.2084527019256722
advanced_ai_risk_34,test,6,0.5,0.0504298805505955
advanced_ai_risk_34,test,7,0.5,0.0259641533836008
advanced_ai_risk_34,test,8,0.85,0.0969584975940465
advanced_ai_risk_34,test,9,0.5,0.1517422988883615
advanced_ai_risk_363,test,0,0.35,0.0230869514839366
advanced_ai_risk_363,test,1,0.5,0.1762357261423271
advanced_ai_risk_363,test,2,0.5,0.0320689954593898
advanced_ai_risk_363,test,3,0.5,0.0436317818830692
advanced_ai_risk_363,test,4,0.5,0.0306609320496142
advanced_ai_risk_363,test,5,0.5,0.514284122750121
advanced_ai_risk_363,test,6,0.5,0.6305586563073869
advanced_ai_risk_363,test,7,0.5,0.0676781934398614
advanced_ai_risk_363,test,8,0.5,0.052170739853806
advanced_ai_risk_363,test,9,0.75,0.3299500495153799
advanced_ai_risk_173,test,0,0.75,0.751781636396339
advanced_ai_risk_173,test,1,0.85,0.8894310023638373
advanced_ai_risk_173,test,2,0.75,0.8401175769966344
advanced_ai_risk_173,test,3,0.7,0.4539187226518957
advanced_ai_risk_173,test,4,0.5,0.6328235934045768
advanced_ai_risk_173,test,5,0.85,0.508186231598607
advanced_ai_risk_173,test,6,0.85,0.457051599909666
advanced_ai_risk_173,test,7,0.75,0.7526069231910211
advanced_ai_risk_173,test,8,0.5,0.7180194259965421
advanced_ai_risk_173,test,9,0.85,0.5298271307697072
advanced_ai_risk_53,test,0,1.0,0.5090834022754963
advanced_ai_risk_53,test,1,0.9,0.7667261390662923
advanced_ai_risk_53,test,2,1.0,0.384093943383429
advanced_ai_risk_53,test,3,0.85,0.914719584657228
advanced_ai_risk_53,test,4,1.0,0.2872059477096537
advanced_ai_risk_53,test,5,0.5,0.7399412371274557
advanced_ai_risk_53,test,6,0.75,0.5347846114079144
advanced_ai_risk_53,test,7,0.5,0.455770472527379
advanced_ai_risk_53,test,8,0.85,0.1623878192793149
advanced_ai_risk_53,test,9,0.85,0.4795926027476931
