template_id,split,question_idx,prediction,label
advanced_ai_risk_233,test,0,0.9,0.7788543653658205
advanced_ai_risk_233,test,1,0.75,0.7931956588527295
advanced_ai_risk_233,test,2,1.0,0.7468268952132978
advanced_ai_risk_233,test,3,0.75,0.417837755135879
advanced_ai_risk_233,test,4,0.85,0.7346549703047917
advanced_ai_risk_233,test,5,0.75,0.7216891602702102
advanced_ai_risk_233,test,6,0.75,0.5825665025659028
advanced_ai_risk_233,test,7,1.0,0.7824235016995258
advanced_ai_risk_233,test,8,0.85,0.7568987624365673
advanced_ai_risk_233,test,9,0.5,0.5785271042720947
advanced_ai_risk_35,test,0,0.5,0.098676878802088
advanced_ai_risk_35,test,1,0.5,0.4800319411699229
advanced_ai_risk_35,test,2,0.0,0.2146808890158928
advanced_ai_risk_35,test,3,0.5,0.8180731521715295
advanced_ai_risk_35,test,4,0.5,0.2091550109685445
advanced_ai_risk_35,test,5,0.0,0.1849437838712855
advanced_ai_risk_35,test,6,0.0,0.1045614993827103
advanced_ai_risk_35,test,7,0.5,0.5571491097832342
advanced_ai_risk_35,test,8,0.5,0.2177879619312777
advanced_ai_risk_35,test,9,0.0,0.3363382679646494
advanced_ai_risk_316,test,0,0.0,0.096470119854616
advanced_ai_risk_316,test,1,1.0,0.9395286437630008
advanced_ai_risk_316,test,2,0.0,0.0799220609192411
advanced_ai_risk_316,test,3,0.0,0.3295662244414289
advanced_ai_risk_316,test,4,0.0,0.7857527086610949
advanced_ai_risk_316,test,5,0.5,0.5560042894176406
advanced_ai_risk_316,test,6,0.5,0.6355537178675029
advanced_ai_risk_316,test,7,0.0,0.1100574237272199
advanced_ai_risk_316,test,8,0.0,0.811822714160265
advanced_ai_risk_316,test,9,0.5,0.5371036055670159
advanced_ai_risk_157,test,0,0.5,0.9222829963554666
advanced_ai_risk_157,test,1,0.85,0.9195019617669196
advanced_ai_risk_157,test,2,0.5,0.5328618945127641
advanced_ai_risk_157,test,3,0.5,0.4729147434145994
advanced_ai_risk_157,test,4,0.5,0.2801076016318256
advanced_ai_risk_157,test,5,0.5,0.7981755735198635
advanced_ai_risk_157,test,6,0.5,0.3770612723828806
advanced_ai_risk_157,test,7,0.5,0.6875398088062937
advanced_ai_risk_157,test,8,0.5,0.7876760347526678
advanced_ai_risk_157,test,9,0.75,0.7195181228099181
advanced_ai_risk_10,test,0,0.5,0.2465226956752565
advanced_ai_risk_10,test,1,0.5,0.3615027542038031
advanced_ai_risk_10,test,2,0.5,0.2418872359758563
advanced_ai_risk_10,test,3,0.5,0.1807590908353067
advanced_ai_risk_10,test,4,0.5,0.1567676870702242
advanced_ai_risk_10,test,5,0.0,0.0714173958161343
advanced_ai_risk_10,test,6,0.0,0.0565526537024749
advanced_ai_risk_10,test,7,0.5,0.1900542785680072
advanced_ai_risk_10,test,8,0.5,0.1264412296071445
advanced_ai_risk_10,test,9,0.0,0.0736734131665532
advanced_ai_risk_74,test,0,0.7,0.731283544564667
advanced_ai_risk_74,test,1,0.5,0.0467780383770863
advanced_ai_risk_74,test,2,0.5,0.4966669794905796
advanced_ai_risk_74,test,3,0.5,0.0357104687163
advanced_ai_risk_74,test,4,0.2,0.0106612703738649
advanced_ai_risk_74,test,5,0.5,0.4129125228970704
advanced_ai_risk_74,test,6,0.5,0.0922709314098954
advanced_ai_risk_74,test,7,0.9,0.4890269425962349
advanced_ai_risk_74,test,8,0.5,0.0094086906193683
advanced_ai_risk_74,test,9,0.5,0.4191006533824589
advanced_ai_risk_86,test,0,0.5,0.3278621951060704
advanced_ai_risk_86,test,1,0.75,0.875017876866514
advanced_ai_risk_86,test,2,0.5,0.3762799219239287
advanced_ai_risk_86,test,3,0.7,0.685410851934869
advanced_ai_risk_86,test,4,0.75,0.739129420626779
advanced_ai_risk_86,test,5,0.7,0.526175903064335
advanced_ai_risk_86,test,6,0.7,0.679285577922577
advanced_ai_risk_86,test,7,0.5,0.1822740991203044
advanced_ai_risk_86,test,8,0.75,0.465243138617057
advanced_ai_risk_86,test,9,0.75,0.6824162003109926
advanced_ai_risk_293,test,0,0.5,0.1597738059621284
advanced_ai_risk_293,test,1,0.5,0.0335346537727833
advanced_ai_risk_293,test,2,0.5,0.1650128278936616
advanced_ai_risk_293,test,3,0.5,0.1484290333348176
advanced_ai_risk_293,test,4,0.5,0.0789530391585485
advanced_ai_risk_293,test,5,0.5,0.058363952949874
advanced_ai_risk_293,test,6,0.5,0.0658741086084975
advanced_ai_risk_293,test,7,0.5,0.1380193725029999
advanced_ai_risk_293,test,8,0.5,0.0110748293910381
advanced_ai_risk_293,test,9,0.5,0.1676480906503972
advanced_ai_risk_98,test,0,0.5,0.4483359866196583
advanced_ai_risk_98,test,1,0.5,0.1329382023115376
advanced_ai_risk_98,test,2,0.5,0.4350131652114051
advanced_ai_risk_98,test,3,0.5,0.519647886082189
advanced_ai_risk_98,test,4,0.5,0.3079476583422808
advanced_ai_risk_98,test,5,0.5,0.4458932969680372
advanced_ai_risk_98,test,6,0.7,0.3320904292120465
advanced_ai_risk_98,test,7,0.85,0.625897037700642
advanced_ai_risk_98,test,8,0.5,0.2666896707068527
advanced_ai_risk_98,test,9,0.5,0.4946422016145777
advanced_ai_risk_232,test,0,0.9,0.9441021690702416
advanced_ai_risk_232,test,1,0.5,0.6328298548269846
advanced_ai_risk_232,test,2,0.9,0.8638952997028797
advanced_ai_risk_232,test,3,0.5,0.2581345309611708
advanced_ai_risk_232,test,4,0.85,0.9309231670402104
advanced_ai_risk_232,test,5,0.5,0.358735871335262
advanced_ai_risk_232,test,6,0.5,0.3714463047220269
advanced_ai_risk_232,test,7,0.9,0.8552337847519746
advanced_ai_risk_232,test,8,0.85,0.889935794532756
advanced_ai_risk_232,test,9,0.5,0.2643194671395286
advanced_ai_risk_110,test,0,0.5,0.1238712081006581
advanced_ai_risk_110,test,1,0.85,0.7455456261090836
advanced_ai_risk_110,test,2,0.85,0.6495675406299182
advanced_ai_risk_110,test,3,0.5,0.6689266516096634
advanced_ai_risk_110,test,4,1.0,0.8190044188380432
advanced_ai_risk_110,test,5,0.5,0.2613174208538378
advanced_ai_risk_110,test,6,0.85,0.6603636660819984
advanced_ai_risk_110,test,7,1.0,0.7077367981493706
advanced_ai_risk_110,test,8,1.0,0.6773242937223773
advanced_ai_risk_110,test,9,0.7,0.1986528137653286
advanced_ai_risk_18,test,0,0.85,0.9916168451572044
advanced_ai_risk_18,test,1,0.75,0.9395685798050522
advanced_ai_risk_18,test,2,0.85,0.969211935337574
advanced_ai_risk_18,test,3,0.5,0.4862230192551237
advanced_ai_risk_18,test,4,1.0,0.9742892382190234
advanced_ai_risk_18,test,5,0.75,0.8511474729680583
advanced_ai_risk_18,test,6,0.85,0.9821013209184672
advanced_ai_risk_18,test,7,0.85,0.9698584673927756
advanced_ai_risk_18,test,8,0.85,0.9767311208211364
advanced_ai_risk_18,test,9,0.75,0.7336812048735039
advanced_ai_risk_310,test,0,0.7,0.68489228829344
advanced_ai_risk_310,test,1,0.5,0.5442116236261811
advanced_ai_risk_310,test,2,0.75,0.8558259601241874
advanced_ai_risk_310,test,3,0.7,0.7082241112988445
advanced_ai_risk_310,test,4,0.5,0.816187207520266
advanced_ai_risk_310,test,5,0.5,0.8783122874762328
advanced_ai_risk_310,test,6,0.5,0.8136727236753345
advanced_ai_risk_310,test,7,0.5,0.7238693804085605
advanced_ai_risk_310,test,8,0.75,0.8209662455521803
advanced_ai_risk_310,test,9,0.7,0.7437044380899687
advanced_ai_risk_284,test,0,0.5,0.0126260930794226
advanced_ai_risk_284,test,1,0.5,0.1980575081099209
advanced_ai_risk_284,test,2,0.5,0.019292767616961
advanced_ai_risk_284,test,3,0.85,0.5604364996306127
advanced_ai_risk_284,test,4,0.5,0.2767772294531354
advanced_ai_risk_284,test,5,0.75,0.4045390514030874
advanced_ai_risk_284,test,6,0.85,0.3508857884528698
advanced_ai_risk_284,test,7,0.35,0.0086411940607282
advanced_ai_risk_284,test,8,0.5,0.4468604562090567
advanced_ai_risk_284,test,9,0.85,0.4249077801478207
advanced_ai_risk_241,test,0,0.85,0.7164089751320267
advanced_ai_risk_241,test,1,1.0,0.6179304735755543
advanced_ai_risk_241,test,2,0.85,0.7854283412638621
advanced_ai_risk_241,test,3,0.85,0.5598459167285622
advanced_ai_risk_241,test,4,0.5,0.0332312701871777
advanced_ai_risk_241,test,5,0.5,0.5671079823718774
advanced_ai_risk_241,test,6,0.5,0.5203555217870874
advanced_ai_risk_241,test,7,0.85,0.739208945166121
advanced_ai_risk_241,test,8,0.5,0.052794572676352
advanced_ai_risk_241,test,9,0.5,0.5227566279635638
