problem_id,correctness,coarse_grained_novelty
2023_AMC_8_Problems_14,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2018_USAJMO_Problems_2,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2009_AMC_12A_Problems_24,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2017_USAMO_Problems_3,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2008_AIME_I_Problems_10,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2011_USAMO_Problems_1,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2022_USAJMO_Problems_1,"{'claude-3-7-sonnet-20250219': 'UNCLEAR', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2008_AMC_10A_Problems_9,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2011_USAJMO_Problems_2,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2014_AMC_10B_Problems_18,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2016_USAJMO_Problems_4,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2012_USAMO_Problems_4,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2020_USAJMO_Problems_2,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2012_USAJMO_Problems_6,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
1981_USAMO_Problems_1,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
1987_AIME_Problems_11,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2022_AMC_10A_Problems_9,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2011_AIME_II_Problems_9,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2006_AIME_II_Problems_11,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
1987_USAMO_Problems_1,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
1987_AIME_Problems_7,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
1992_IMO_Problems_3,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
1998_AIME_Problems_13,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2011_AIME_I_Problems_12,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2023_USAJMO_Problems_1,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2011_USAJMO_Problems_6,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2001_AMC_10_Problems_20,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2015_USAJMO_Problems_3,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
2015_USAJMO_Problems_5,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
1990_USAMO_Problems_1,"{'claude-3-7-sonnet-20250219': 'NO', 'final_decision': 'NO'}",{'final_decision': 'NO'}
