# Multi-Seed Baseline Comparison Experiment Configuration
# Compare MoltenFlow vs baselines with statistical rigor across multiple seeds

experiment:
  name: "multi_seed_comparison_latest_finetune_hpo"
  description: "Statistical comparison of optimization methods with multiple seeds"

  # Methods to compare
  methods:
    - "moltenflow"
    - "gradient_ascent"
    - "bo_mogp"
    - "bo_2gp"

  # Random seeds for statistical comparison
  # Recommendation: 5 seeds minimum, 10 for publication
  seeds: [42, 123, 456, 789, 1000]

# Inherit most settings from base budgeted_optimization config
# This section overrides or specifies experiment-specific settings

# Optimization parameters
optimization:
  budget: 100  # Total oracle calls per run
  n_init: 10   # Initial dataset size
  batch_size: 1  # Proposals per iteration

# Initialization method
init:
  method: "random"  # or "near_pareto"
  pool_size: null
  k_neighbors: 5

# Reference point for hypervolume (QED, -SA)
hypervolume:
  ref_point: [0.0, -10.0]
  sense: ["max", "max"]

# Data configuration (inherits from base config)
data:
  parquet_path: "data/processed/zinc250k_qed_sas.parquet"
  smiles_col: "smiles"
  max_len: 128
  max_molecules: null
  vocab_path: "experiments/exp_f1b68b38/20260127_161530/finetune/vocab.json"
  representation: "selfies"

# VAE configuration (must match trained model)
vae:
  checkpoint_path: "experiments/exp_f1b68b38/20260127_161530/finetune/vae_best.pt"
  d_model: 128
  nhead: 8
  enc_layers: 6
  dec_layers: 6
  dim_ff: 1024
  dropout: 0.1
  K: 8
  latent_dim: 128

# Flow configuration (must match trained model)
flow:
  checkpoint_path: "experiments/exp_f1b68b38/20260127_161530/flow/flow_best.pt"
  d_model: 256
  nhead: 8
  layers: 10
  dim_ff: 512
  dropout: 0.1
  time_dim: 128

# Surrogate configuration
surrogate:
  out_dim: 2
  hidden_dim: 1024
  aggregation: "mean"
  dropout: 0.1
  cond_dim: 0
  output_bounds:
    qed: [0.0, 1.0]
    sas: [1.0, 10.0]

# MoltenFlow proposer configuration
moltenflow:
  gamma: 36.0686
  sigma: 0.804543
  steps: 12
  t_start: 0.887901
  seed_selection: "diversity_weighted"
  clip_norm: 5.0
  normalize_gradient: true
  use_flow: true
  step_size: null  # Defaults to gamma/steps
  # Diversity parameters
  diversity_threshold: 0.7
  diversity_penalty: 2.0
  diversity_window: 10
  pareto_weight: 2.0

# Gradient ascent configuration (no flow, pure gradient optimization)
gradient_ascent:
  step_size: 0.3  # Smaller than moltenflow's gamma, gradient ascent is more sensitive
  sigma: 0.2
  steps: 10
  seed_selection: "diversity_weighted"
  clip_norm: null
  normalize_gradient: true
  # Diversity parameters
  diversity_threshold: 0.7
  diversity_penalty: 2.0
  diversity_window: 10
  pareto_weight: 2.0

# BO proposer configuration
bo:
  num_restarts: 10
  raw_samples: 512
  latent_aggregation: "flatten"

# Plotting configuration for multi-seed analysis
plotting:
  confidence: 0.90  # Confidence level for CIs
  n_bootstrap: 1000  # Bootstrap samples for CI estimation
  # CI band type: "bootstrap" (rigorous), "se" (mean +/- SE, tighter), "se2" (mean +/- 2*SE)
  ci_type: "bootstrap"  # Use SE bands for tighter visualization

  # Pareto density plot
  density_grid_resolution: 50  # Grid resolution for KDE

  # Example runs selection
  example_runs:
    n_best: 2   # Number of best runs to show
    n_worst: 2  # Number of worst runs to show

  # Molecule gallery
  molecules_per_method: 4  # Molecules to show per method
  sample_across_seeds: true  # Sample from multiple seeds

# Output configuration
output:
  dir: "experiments/multi_seed_comparison_latest_finetune_hpo"
  pareto_snapshot_interval: 25

# Base seed for reproducibility
seed: 42
