#!/usr/bin/env python3 import sys import os sys.path.append(os.path.dirname(os.path.abspath(__file__))) from eval.scripts.db_utils import scoresearch_string import pandas as pd import io import logging # Configure logging logging.basicConfig(level=logging.INFO) # Hardcoded comparison data compare_model_csv = """Experiments,Domain,DatasetSize,AvgAll,AIME24,AMC23,MATH500,AvgMath,JEEBench,GPQAD,AvgSci,LCBv2,CodeElo,CodeForces,AvgCode OpenThinker2-7B,Other,,56.7,58.3,89.8,87.6,78.6,65.1,47.0,56.0,56.2,22.8,26.6,35.2 OpenThinker-7B,Other,,38.6,,,,,,38.6,38.6,,,, Bespoke-Stratos-7B,Other,,31.7,14.3,54.2,77.6,48.7,40.2,31.8,36.0,27.4,3.2,4.8,11.8 OpenThoughts3,Other,1200000.0,55.3,69.0,93.5,90.0,69.7,72.4,53.7,63.0,64.5,31.0,32.2,44.8 """ # Define comprehensive benchmarks benchmarks = [  "AIME24_accuracy_avg", "AMC23_accuracy_avg", "MATH500_accuracy", "HMMT_accuracy_avg",  "JEEBench_accuracy_avg", "GPQADiamond_accuracy_avg",  "veCodeBench_accuracy_avg", "CodeElo_accuracy_avg", "CodeForces_accuracy_avg",  "AIME25_accuracy_avg", "HLE_accuracy_avg", "veCodeBenchv5_accuracy_avg" ] # Extract model names from the CSV df_compare = pd.read_csv(io.StringIO(compare_model_csv)) model_names = df_compare['Experiments'].tost() # Add alternative names that might be in the database alternative_names = [  "/openthoughts", # Alternative for OpenThinker-7B  "open-thoughts/OpenThinker-7B", # Alternative naming  "openthoughts", # Simple name  "OpenThinker" # Partial match ] # Combine original and alternative names all_model_names = model_names + alternative_names print(f"Searching for models: {model_names}") print(f"Also searching alternative names: {alternative_names}") class Args:  def __init__(self):  self.comma_separated_bstrings = True  self.output = "openthoughts_project_models" args = Args() # Query database for full relts relts, csv_file = scoresearch_string(all_model_names, benchmarks=benchmarks, args=args) # Save the full database relts to CSV if not relts.empty:  print(f"\nDatabase relts saved to: {csv_file}")  print("\nFull relts from database:")  print(relts.to_string())  # Create LaTeX table  def create_latex_table(df):  """Create a LaTeX table from the dataframe."""  # Select key columns for the table  key_columns = ['Experiments', 'AIME24', 'AIME25', 'GPQAD', 'LCBv2']  # Filter to only include columns that exist  available_columns = [col for col in key_columns if col in df.columns]  table_df = df[available_columns].copy()  # Round numal columns to 1 decimal place  for col in table_df.columns:  if col != 'Experiments' and pd.api.types.is_num_dtype(table_df[col]):  table_df[col] = table_df[col].round(1)  # Replace NaN with --  table_df = table_df.fillna('--')  # Create LaTeX table  latex_table = "\\begin{table}[htbp]\n"  latex_table += "\\centering\n"  # Create column specification  num_cols = len(available_columns)  col_spec = "l" + "c" * (num_cols - 1)  latex_table += f"\\begin{{tabular}}{{{col_spec}}}\n"  latex_table += "\\toprule\n"  # Header row  header_names = {  'Experiments': 'Model',  'AIME24': 'AIME24',  'AIME25': 'AIME25',  'GPQAD': 'GPQAD',  'LCBv2': 'LCBv2'  }  headers = [header_names.get(col, col) for col in available_columns]  latex_table += " & ".join(headers) + " \\\\\n"  latex_table += "\\midrule\n"  # Data rows  for _, row in table_df.iterrows():  row_str = " & ".join(str(val) for val in row.values)  latex_table += row_str + " \\\\\n"  latex_table += "\\bottomrule\n"  latex_table += "\\end{tabular}\n"  latex_table += "\\caption{\\textbf{Progression of OpenThoughts models.} ccessive generations of data recipes consistently improve performance across domains.}\n"  latex_table += "\\label{tab:model_comparison}\n"  latex_table += "\\end{table}\n"  return latex_table  # Filter and rename models for the table  def filter_and_rename_models(df):  """Filter out unwanted models and rename for clean presentation."""  df_filtered = df.copy()  # Create a mapping for model name cleanup  model_name_mapping = {  'OpenThoughts3': 'OpenThinker3-7B',  'open-thoughts__OpenThinker-7B': 'OpenThinker-7B',  'OpenThinker2-7B': 'OpenThinker2-7B',  'Bespoke-Stratos-7B': 'Bespoke-Stratos-7B'  }  # Manual correction for OpenThinker-7B with updated numbers  openthinker_7b_corrections = {  'AIME24': 29.3,  'AIME25': 25.3,  'GPQAD': 44.1,  'LCBv2': 38.8  }  # Filter to only include models we want  wanted_models = st(model_name_mapping.keys())  df_filtered = df_filtered[df_filtered['Experiments'].isin(wanted_models)]  print(f"\nFiltering database relts to wanted models: {wanted_models}")  print(f"Found {len(df_filtered)} matching models in database relts")  # Rename the models  df_filtered['Experiments'] = df_filtered['Experiments'].map(model_name_mapping)  # Apply manual corrections for OpenThinker-7B  ot7b_mask = df_filtered['Experiments'] == 'OpenThinker-7B'  for metric, value in openthinker_7b_corrections.items():  if metric in df_filtered.columns:  df_filtered.loc[ot7b_mask, metric] = value  # Define custom order for models  model_order = ['Bespoke-Stratos-7B', 'OpenThinker-7B', 'OpenThinker2-7B', 'OpenThinker3-7B']  # Create a mapping for sorting  order_mapping = {model: i for i, model in enumerate(model_order)}  df_filtered['sort_order'] = df_filtered['Experiments'].map(order_mapping)  # Sort by the custom order  df_filtered = df_filtered.sort_values('sort_order').drop('sort_order', axis=1)  return df_filtered  # Filter and rename the relts  filtered_relts = filter_and_rename_models(relts)  # Generate LaTeX table with filtered data  latex_output = create_latex_table(filtered_relts)  print("\n" + "="*60)  print("LATEX TABLE:")  print("="*60)  print(latex_output)  # Save LaTeX table to file  latex_file = "eval/relts/openthoughts_project_models.tex"  with open(latex_file, 'w') as f:  f.write(latex_output)  print(f"\nLaTeX table saved to: {latex_file}") else:  print("No relts found for the specified models")  # If no database relts, create table from provided CSV  print("\nUsing provided CSV data for LaTeX table...")  df_compare_clean = df_compare.copy()  # Convert num columns  for col in df_compare_clean.columns:  if col not in ['Experiments', 'Domain']:  df_compare_clean[col] = pd.to_num(df_compare_clean[col], errors='coerce')  def create_latex_table_from_csv(df):  """Create LaTeX table from CSV data."""  key_columns = ['Experiments', 'AIME24', 'AIME25', 'GPQAD', 'LCBv2']  available_columns = [col for col in key_columns if col in df.columns]  table_df = df[available_columns].copy()  # Round and fill NaN  for col in table_df.columns:  if col != 'Experiments' and pd.api.types.is_num_dtype(table_df[col]):  table_df[col] = table_df[col].round(1)  table_df = table_df.fillna('--')  # Same LaTeX generation as above...  latex_table = "\\begin{table}[htbp]\n\\centering\n\\caption{Model Comparison Relts}\n\\label{tab:model_comparison}\n"  num_cols = len(available_columns)  col_spec = "l" + "c" * (num_cols - 1)  latex_table += f"\\begin{{tabular}}{{{col_spec}}}\n\\toprule\n"  header_names = {  'Experiments': 'Model', 'AIME24': 'AIME24', 'AIME25': 'AIME25',  'GPQAD': 'GPQA Diamond', 'LCBv2': 'LCBv2'  }  headers = [header_names.get(col, col) for col in available_columns]  latex_table += " & ".join(headers) + " \\\\\n\\midrule\n"  for _, row in table_df.iterrows():  row_str = " & ".join(str(val) for val in row.values)  latex_table += row_str + " \\\\\n"  latex_table += "\\bottomrule\n\\end{tabular}\n"  latex_table += "\\caption{\\textbf{Progression of OpenThoughts models.} ccessive generations of data recipes consistently improve performance across domains.}\n"  latex_table += "\\label{tab:model_comparison}\n"  latex_table += "\\end{table}\n"  return latex_table  latex_output = create_latex_table_from_csv(df_compare_clean)  print("\n" + "="*60)  print("LATEX TABLE (from CSV):")  print("="*60)  print(latex_output)  latex_file = "eval/relts/openthoughts_project_models.tex"  with open(latex_file, 'w') as f:  f.write(latex_output)  print(f"\nLaTeX table saved to: {latex_file}")