Model,Prompt_Type,Forecasting_CoT,Forecasting_Debate,ChangeMyView_CoT,ChangeMyView_Debate,OpenReview_CoT,OpenReview_Debate
GPT-4o (May 7),No Prompt,0.0018,-0.0439,0.0671,0.038,0.073,0.154
GPT-4o (May 7),CT Prompt,0.0156,-0.012,0.066,0.120,0.103,0.131
GPT-4o (May 7),CF Prompt,0.090,-0.0227,0.146,0.268,-0.086,0.237
GPT-4o (Apr 30),No Prompt,0.016,0.017,0.070,0.078,,
GPT-4o (Apr 30),CT Prompt,,,,,,
GPT-4o (Apr 30),CF Prompt,0.080,0.017,0.139,0.154,,
deepseek_r1,No Prompt,0.0207,0.0559,0.0502,0.0845,0.0676,0.0366
deepseek_r1,CT Prompt,0.0119,0.0121,0.0511,-0.0622,0.0595,0.1860
deepseek_r1,CF Prompt,0.0450,0.0487,0.0526,0.0961,0.0689,0.0299
gemini_2_0_flash,No Prompt,0.0764,-0.0196,0.1209,0.0969,0.1012,0.0882
gemini_2_0_flash,CT Prompt,0.0067,-0.0012,0.1203,0.0642,0.0817,0.1263
gemini_2_0_flash,CF Prompt,0.0335,-0.0368,0.1052,0.0295,0.0849,0.0646
deepseek_v3,No Prompt,0.0335,-0.0929,0.1155,0.0739,0.1028,0.1337
deepseek_v3,CT Prompt,0.0348,-0.0064,0.0990,0.0179,0.0865,0.0743
deepseek_v3,CF Prompt,0.0763,-0.0216,0.0879,0.0511,-0.1493,0.2113
llama_4_scout,No Prompt,0.0350,0.0078,0.1420,0.0900,0.0890,0.1168
llama_4_scout,CT Prompt,0.0125,-0.0395,0.1146,0.0238,0.1028,0.1729
llama_4_scout,CF Prompt,0.0740,-0.0114,0.1372,0.0003,-0.0253,0.1929
llama_4_maverick,No Prompt,0.0178,0.0103,0.1038,0.1100,0.0823,0.1749
llama_4_maverick,CT Prompt,0.0282,0.0132,0.1161,0.1185,0.0909,0.2521
llama_4_maverick,CF Prompt,0.0523,-0.0128,0.1435,0.1608,0.0951,0.1724
claude_3_5_haiku,No Prompt,0.0320,-0.0283,0.1218,0.0230,,
claude_3_5_haiku,CT Prompt,0.0133,0.0348,0.1083,0.0587,,
claude_3_5_haiku,CF Prompt,0.0563,-0.0151,0.0890,,,