#!/usr/bin/env python3
"""Look up HMMT scores for a fixed list of target models.

Reads the HMMT CSV, keeps the rows that have both a score and an experiment
name, prints every row whose name loosely matches a target model, and then
prints one resolved HMMT score per target model.
"""
import io
from typing import Dict, Iterable, List, Tuple

import pandas as pd

# NOTE(review): "relts" looks like a garbled "results"; the path is kept
# exactly as found -- confirm against the directory layout on disk.
HMMT_CSV_PATH = "eval/relts/hmmt_all_variants.csv"

# Original model names from simple_all_benchmarks.py
TARGET_MODELS = [
    "openthoughts3", "openthoughts3_300k", "openthoughts3_100k", "openthoughts3_30k",
    "openthoughts3_10k", "openthoughts3_3k", "openthoughts3_1k", "openthoughts3_0.3k",
    "s1", "s1_0.3k", "mo", "mo_0.3k", "am", "am_100k", "am_300k", "am_30k",
    "am_10k", "am_3k", "am_1k", "am_0.3k", "nemo_nano_1000k", "nemo_nano_300k",
    "nemo_nano_100k", "nemo_nano_30k", "nemo_nano_10k", "nemo_nano_3k",
    "nemo_nano_1k", "nemo_nano_0.3k",
]


def filter_scored_rows(hmmt_df: pd.DataFrame) -> pd.DataFrame:
    """Return the rows that have a non-empty HMMT score and an experiment name.

    Rows whose ``Experiments`` cell is missing are dropped as well, because
    every later step lower-cases the name and a NaN name would raise.
    """
    has_score = hmmt_df["HMMT"].notna() & (hmmt_df["HMMT"] != "")
    has_name = hmmt_df["Experiments"].notna()
    return hmmt_df[has_score & has_name]


def load_hmmt_scores(csv_path=HMMT_CSV_PATH) -> pd.DataFrame:
    """Read the HMMT CSV and keep only the usable rows.

    Args:
        csv_path: Anything ``pandas.read_csv`` accepts (path or file-like).

    Returns:
        The rows that pass ``filter_scored_rows``.
    """
    return filter_scored_rows(pd.read_csv(csv_path))


def find_candidate_models(
    scored_df: pd.DataFrame, targets: Iterable[str]
) -> List[Tuple[object, object, object]]:
    """List rows whose experiment name loosely matches any target model.

    A row matches when a target is a substring of the lower-cased experiment
    name, or the lower-cased name is a substring of a target. Each row is
    reported once, even when several targets match it.

    Returns:
        ``(experiment name, HMMT score, dataset size)`` tuples in row order.
    """
    lowered_targets = [target.lower() for target in targets]
    candidates = []
    columns = zip(
        scored_df["Experiments"], scored_df["HMMT"], scored_df["DatasetSize"]
    )
    for name, score, size in columns:
        lowered_name = str(name).lower()
        if any(t in lowered_name or lowered_name in t for t in lowered_targets):
            candidates.append((name, score, size))
    return candidates


def find_target_scores(
    scored_df: pd.DataFrame, targets: Iterable[str]
) -> Dict[str, object]:
    """Resolve one HMMT score per target model.

    Matching is literal and case-insensitive; the "." in names such as
    "am_0.3k" is not a wildcard. A row whose name equals the target wins.
    Only when no such row exists does the lookup fall back to rows whose
    name contains the target. Without that preference a short target such
    as "mo" would take its score from an unrelated "nemo_nano_*" row.
    When several rows qualify, the last one in file order is used.

    Returns:
        Mapping of target name to HMMT score; targets with no match are
        omitted.
    """
    rows = [
        (str(name).lower(), score)
        for name, score in zip(scored_df["Experiments"], scored_df["HMMT"])
    ]
    resolved = {}
    for target in targets:
        needle = target.lower()
        hits = [score for name, score in rows if name == needle]
        if not hits:
            # No identically named experiment: fall back to substring matches.
            hits = [score for name, score in rows if needle in name]
        if hits:
            resolved[target] = hits[-1]
    return resolved


def main() -> None:
    """Print the candidate rows and the resolved per-target HMMT scores."""
    # Read the HMMT results
    scored = load_hmmt_scores()

    print("Looking for HMMT scores for target models...")
    print("Available models with HMMT scores:")
    for name, score, size in find_candidate_models(scored, TARGET_MODELS):
        print(f" {name}: HMMT={score}, DatasetSize={size}")

    print("\nExact matches found:")
    exact_matches = find_target_scores(scored, TARGET_MODELS)
    for target, score in exact_matches.items():
        print(f" {target}: {score}")

    print(f"\nFound HMMT scores for {len(exact_matches)} out of {len(TARGET_MODELS)} target models")
    print("Exact matches dictionary:")
    print(exact_matches)


if __name__ == "__main__":
    main()