#!/usr/bin/env python3
"""Look up benchmark scores for the ``b1_science_top_2_10k`` experiment.

Calls ``scoresearch_string`` for a single target model, prints the returned
table, and then prints, for every row, a field-by-field breakdown followed by
the same fields joined with commas.
"""
import logging
import os
import sys

# The directory containing this script is appended to sys.path before the
# project import below, so the import has to stay after this statement.
sys.path.append(os.path.dirname(os.path.abspath(__file__)))

from eval.scripts.db_utils import scoresearch_string  # noqa: E402

# Configure logging
logging.basicConfig(level=logging.INFO)

# Define the benchmarks we need
benchmarks = [
    "AIME24_accuracy_avg",
    "AMC23_accuracy_avg",
    "MATH500_accuracy",
    "JEEBench_accuracy_avg",
    "GPQADiamond_accuracy_avg",
    # NOTE(review): possibly a truncated "LiveCodeBench_accuracy_avg" (the
    # report below reads an "LCBv2" column) -- confirm against the database
    # before changing; the key is kept exactly as it was.
    "veCodeBench_accuracy_avg",
    "CodeElo_accuracy_avg",
    "CodeForces_accuracy_avg",
]

# Search specifically for b1_science_top_2_10k
target_model = ["b1_science_top_2_10k"]

# Columns read from every result row. This single tuple drives both the
# per-field printout and the comma-joined entry, so the two cannot drift
# apart. The first column is only used in the section header.
REPORT_COLUMNS = (
    "Experiments",
    "Domain",
    "DatasetSize",
    "AvgAll",
    "AIME24",
    "AMC23",
    "MATH500",
    "AvgMath",
    "JEEBench",
    "GPQAD",
    "AvgSci",
    "LCBv2",
    "CodeElo",
    "CodeForces",
    "AvgCode",
)


class Args:
    """Options object handed to ``scoresearch_string`` as ``args``."""

    def __init__(self):
        self.comma_separated_bstrings = True
        self.output = "check_b1_science_10k"


def _report_row(row):
    """Print the detailed breakdown and the comma-joined entry for one row.

    Args:
        row: Mapping-like object indexable by every name in
            ``REPORT_COLUMNS`` (here, a row yielded by ``iterrows()``).

    Raises:
        KeyError: If ``row`` lacks one of ``REPORT_COLUMNS``. All values are
            formatted before anything is printed, so no partial output is
            emitted for that row.
    """
    # f-string formatting (not str()) is deliberate: it is what the report
    # has always used, and the two can differ for some numeric scalar types.
    formatted = {column: f"{row[column]}" for column in REPORT_COLUMNS}

    print(f"\n=== Detailed relts for {formatted['Experiments']} ===")
    for column in REPORT_COLUMNS[1:]:
        print(f"{column}: {formatted[column]}")

    # Formatted entry for CSV. Values are joined as-is; no CSV quoting or
    # escaping is applied.
    print("\nFormatted CSV entry:")
    print(",".join(formatted.values()))


args = Args()

print("Searching specifically for b1_science_top_2_10k...")
relts, csv_file = scoresearch_string(target_model, benchmarks=benchmarks, args=args)

if relts.empty:
    print("No relts found for b1_science_top_2_10k")
else:
    print("\nFound relts:")
    print(relts.to_string())

    # Print the specific row details
    for _, row in relts.iterrows():
        _report_row(row)