# file: configs/experiment/hpo_architecture.yaml
# ============================================================
# HPO STUDY 1: ARCHITECTURE SEARCH
# ============================================================
# Objective: Find the optimal model architecture (capacity, style, etc.)
# for the given dataset, while keeping loss and optimizer settings fixed.
# This helps isolate the impact of architectural choices from the training dynamics.

study_name: "prism_hpo_architecture_search"
directions: ["maximize", "maximize", "maximize"] # probe_gap, observer_acc, neg_info_loss
n_trials: 100

base_config: "configs/base.yaml"

sampler:
  type: "TPESampler"
  seed: 42

search_space:
  # --- Tier 1: Latent Space Dimensions ---
  model.latent_space.latent_dim:
    type: "categorical"
    choices: [64, 128, 256]

  model.latent_space.target_dim:
    type: "int"
    low: 16
    high: 128 # NOTE: The HPO script must dynamically cap this value to latent_dim / 2
    step: 16

  # --- Tier 2: Core Backbone Construction (Encoder/Decoder) ---
  model.architecture.conv.depth:
    type: "int"
    low: 1
    high: 2

  model.architecture.conv.start_channels:
    type: "categorical"
    choices: [16, 32, 64]

  model.architecture.conv.block_repeats_per_layer:
    type: "int"
    low: 1
    high: 2

  # --- Tier 3: Style and Operation Choices ---
  model.architecture.activation_type: # For Encoder, Generator, Classifier
    type: "categorical"
    choices: [ 'relu', 'leaky_relu', 'swish', 'gelu' ]

  model.architecture.conv.encoder.style:
    type: "categorical"
    choices: ['vgg', 'residual']

  model.architecture.conv.decoder.style:
    type: "categorical"
    choices: ['vgg', 'residual']

  model.architecture.conv.encoder.downsampling_method:
    type: "categorical"
    choices: ['maxpool', 'avgpool', 'conv']

  model.architecture.conv.decoder.upsampling_method:
    type: "categorical"
    choices: ['pixelshuffle', 'convtranspose', 'nearest']

  model.architecture.use_bn:
    type: "categorical"
    choices: [true, false]

  # --- Tier 4: MLP Bottleneck/Preprocessor Dimensions (for 'conv' type) ---
  model.architecture.conv.encoder.mlp_h_units_depth:
    type: "int"
    low: 1
    high: 3

  model.architecture.conv.encoder.mlp_h_units_size:
    type: "categorical"
    choices: [128, 256, 512]

  # --- Tier 5: Discriminator Architecture (Independent Search) ---
  discriminator_q.type:
    type: "categorical"
    choices: ['conv', 'mlp']

  discriminator_q.architecture.activation_type:
    type: "categorical"
    choices: ['leaky_relu', 'relu', 'swish', 'gelu']

  # --- CONV-specific options for Discriminator ---
  discriminator_q.architecture.conv.encoder.depth:
    type: "int"
    low: 1
    high: 2

  discriminator_q.architecture.conv.encoder.start_channels:
    type: "categorical"
    choices: [32, 64, 128]

  discriminator_q.architecture.conv.encoder.block_repeats_per_layer:
    type: "int"
    low: 1
    high: 2

  discriminator_q.architecture.conv.encoder.style:
    type: "categorical"
    choices: ['vgg', 'residual']

  discriminator_q.architecture.conv.encoder.use_bn:
    type: "categorical"
    choices: [true, false]

  # --- MLP-specific options for Discriminator ---
  discriminator_q.architecture.mlp.depth:
    type: "int"
    low: 2
    high: 5

  discriminator_q.architecture.mlp.width:
    type: "categorical"
    choices: [128, 256, 512]