template_id,split,question_idx,prediction,label
advanced_ai_risk_171,test,0,0.589,0.749917739768546
advanced_ai_risk_171,test,1,0.785,0.7093868843679405
advanced_ai_risk_171,test,2,0.21,0.1450037113804176
advanced_ai_risk_171,test,3,0.125,0.7816435059867852
advanced_ai_risk_171,test,4,0.105,0.2206475808478134
advanced_ai_risk_323,test,0,0.612,0.7084648532788688
advanced_ai_risk_323,test,1,0.652,0.0515227603299409
advanced_ai_risk_323,test,2,0.72,0.1816013824459031
advanced_ai_risk_323,test,3,0.652,0.0515695466842274
advanced_ai_risk_323,test,4,0.543,0.112967862525113
advanced_ai_risk_354,test,0,0.612,0.84584337476994
advanced_ai_risk_354,test,1,0.685,0.7285223558045504
advanced_ai_risk_354,test,2,0.895,0.8823118193780068
advanced_ai_risk_354,test,3,0.145,0.0925026745177683
advanced_ai_risk_354,test,4,0.847,0.8901153212033792
advanced_ai_risk_157,test,0,0.287,0.3284855548997409
advanced_ai_risk_157,test,1,0.365,0.2215767473348321
advanced_ai_risk_157,test,2,0.412,0.3149888977640667
advanced_ai_risk_157,test,3,0.392,0.3486925995515152
advanced_ai_risk_157,test,4,0.372,0.0318496177548756
advanced_ai_risk_172,test,0,0.752,0.7046081463463193
advanced_ai_risk_172,test,1,0.612,0.443786589179577
advanced_ai_risk_172,test,2,0.673,0.6989349728888364
advanced_ai_risk_172,test,3,0.712,0.7305717957021973
advanced_ai_risk_172,test,4,0.723,0.8664826188276701
advanced_ai_risk_52,test,0,0.345,0.2571573422199545
advanced_ai_risk_52,test,1,0.15,0.3223893826526271
advanced_ai_risk_52,test,2,0.215,0.4273454291133342
advanced_ai_risk_52,test,3,0.375,0.4127000818379591
advanced_ai_risk_52,test,4,0.215,0.5511583601471768
advanced_ai_risk_41,test,0,0.215,0.3890238966612711
advanced_ai_risk_41,test,1,0.35,0.3878157300847409
advanced_ai_risk_41,test,2,0.489,0.5504347534914137
advanced_ai_risk_41,test,3,0.365,0.2172239345931071
advanced_ai_risk_41,test,4,0.512,0.4804783261968243
advanced_ai_risk_320,test,0,0.145,0.0940320115236752
advanced_ai_risk_320,test,1,0.265,0.524922426929311
advanced_ai_risk_320,test,2,0.089,0.0090211214223342
advanced_ai_risk_320,test,3,0.025,0.0164466401713322
advanced_ai_risk_320,test,4,0.152,0.3655678321976019
advanced_ai_risk_74,test,0,0.412,0.6900779623555316
advanced_ai_risk_74,test,1,0.172,0.2671076797589446
advanced_ai_risk_74,test,2,0.052,0.1720968645129164
advanced_ai_risk_74,test,3,0.142,0.1311473444944407
advanced_ai_risk_74,test,4,0.089,0.416577669247882
advanced_ai_risk_209,test,0,0.035,0.0258327011963276
advanced_ai_risk_209,test,1,0.081,0.0110588556673786
advanced_ai_risk_209,test,2,0.089,0.0207756162225135
advanced_ai_risk_209,test,3,0.035,0.007448549767787
advanced_ai_risk_209,test,4,0.028,0.0208915782283878
advanced_ai_risk_39,test,0,0.275,0.2151052386154172
advanced_ai_risk_39,test,1,0.295,0.3307742405355203
advanced_ai_risk_39,test,2,0.365,0.3962074148328525
advanced_ai_risk_39,test,3,0.312,0.262042572071423
advanced_ai_risk_39,test,4,0.213,0.1997722909186944
advanced_ai_risk_34,test,0,0.083,0.0495161122259385
advanced_ai_risk_34,test,1,0.062,0.0417341330170174
advanced_ai_risk_34,test,2,0.041,0.0400585960742452
advanced_ai_risk_34,test,3,0.052,0.1007466843409271
advanced_ai_risk_34,test,4,0.025,0.142735591647948
advanced_ai_risk_363,test,0,0.024,0.0230869514839366
advanced_ai_risk_363,test,1,0.071,0.1762357261423271
advanced_ai_risk_363,test,2,0.065,0.0320689954593898
advanced_ai_risk_363,test,3,0.112,0.0436317818830692
advanced_ai_risk_363,test,4,0.28,0.0306609320496142
advanced_ai_risk_173,test,0,0.456,0.751781636396339
advanced_ai_risk_173,test,1,0.512,0.8894310023638373
advanced_ai_risk_173,test,2,0.51,0.8401175769966344
advanced_ai_risk_173,test,3,0.512,0.4539187226518957
advanced_ai_risk_173,test,4,0.552,0.6328235934045768
advanced_ai_risk_53,test,0,0.612,0.5090834022754963
advanced_ai_risk_53,test,1,0.782,0.7667261390662923
advanced_ai_risk_53,test,2,0.621,0.384093943383429
advanced_ai_risk_53,test,3,0.732,0.914719584657228
advanced_ai_risk_53,test,4,0.552,0.2872059477096537
