#!/usr/bin/env python3
"""Search for benchmark scores of a fixed list of models and print CSV rows.

The script passes a hard-coded list of model-name strings and benchmark
names to ``scoresearch_string`` and prints the returned table. It then
prints one comma-separated line per row, intended for pasting into a
hard-coded CSV.
"""
import logging
import os
import sys

# The directory containing this script must be on sys.path *before* the
# project import below, so this statement has to stay above it.
sys.path.append(os.path.dirname(os.path.abspath(__file__)))

# NOTE(review): the name `scoresearch_string` is kept exactly as found;
# confirm it matches the function exported by eval/scripts/db_utils.py.
from eval.scripts.db_utils import scoresearch_string  # noqa: E402

# Configure logging
logging.basicConfig(level=logging.INFO)

# Define the benchmarks we need
benchmarks = [
    "AIME24_accuracy_avg",
    "AMC23_accuracy_avg",
    "MATH500_accuracy",
    "JEEBench_accuracy_avg",
    "GPQADiamond_accuracy_avg",
    # NOTE(review): "veCodeBench" looks like a truncated "LiveCodeBench"
    # (the matching output column is 'LCBv2'). Left unchanged because the
    # expected key is defined outside this file -- confirm before renaming.
    "veCodeBench_accuracy_avg",
    "CodeElo_accuracy_avg",
    "CodeForces_accuracy_avg",
]

# Search for all missing models
missing_models = [
    # Math answer sampling (c1): 0.3k, 1k, 3k, 10k
    "c1_math_0d_16s_0.3k",
    "c1_math_0d_16s_1k",
    "c1_math_0d_16s_3k",
    "c1_math_0d_16s_10k",
    # Code mix (b1): 1k
    "b1_code_top_2_1k",
    # Code source (a1): 10k
    "a1_code_code_golf_10k",
    # Science mix (b1): 1k, 10k
    "b1_science_top_2_1k",
    "b1_science_top_2_10k",
    # Science source (a1): 10k
    "a1_science_stackexchange_physics_10k",
]

# Size markers are tested in this order with a substring match. "0.3k" must
# come before "3k" because every name containing "0.3k" also contains "3k".
_SIZE_MARKERS = (
    ("0.3k", 316.0),
    ("1k", 1000.0),
    ("3k", 3160.0),
    ("10k", 10000.0),
)

# Score columns emitted after "Experiments,Domain,size", in output order.
_SCORE_COLUMNS = (
    "AvgAll",
    "AIME24",
    "AMC23",
    "MATH500",
    "AvgMath",
    "JEEBench",
    "GPQAD",
    "AvgSci",
    "LCBv2",
    "CodeElo",
    "CodeForces",
    "AvgCode",
)


def _infer_dataset_size(experiment):
    """Return the dataset size implied by a size marker in *experiment*.

    Returns the float paired with the first marker of ``_SIZE_MARKERS``
    found in the name, or the string ``'Unknown'`` when none is present.
    """
    for marker, size in _SIZE_MARKERS:
        if marker in experiment:
            return size
    return 'Unknown'


def _format_entry(row):
    """Build one comma-separated line for the hard-coded CSV from *row*.

    *row* must support lookup by the 'Experiments' and 'Domain' keys and by
    every name in ``_SCORE_COLUMNS``.
    """
    experiment = row['Experiments']
    fields = [experiment, row['Domain'], _infer_dataset_size(experiment)]
    fields.extend(row[column] for column in _SCORE_COLUMNS)
    # f-string formatting keeps the rendering identical to the original
    # single f-string that interpolated every field.
    return ",".join(f"{field}" for field in fields)


class Args:
    """Minimal options object passed to ``scoresearch_string`` as ``args``."""

    def __init__(self):
        # NOTE(review): `comma_separated_bstrings` may be a truncated
        # `comma_separated_substrings`; kept as found because the attribute
        # is read outside this file -- confirm against db_utils.
        self.comma_separated_bstrings = True
        self.output = "all_missing_models"


args = Args()

print("Searching for all missing models...")
results, csv_file = scoresearch_string(missing_models, benchmarks=benchmarks, args=args)

if not results.empty:
    print("\nFound results:")
    print(results.to_string())
    print(f"\nResults saved to: {csv_file}")

    # Print formatted entries for easy copy-paste
    print("\n=== Formatted entries for hardcoded CSV ===")
    for _, row in results.iterrows():
        print(_format_entry(row))
else:
    print("No results found for the missing models")