# Figure Generation Configuration
# Usage: uv run python experiments/figure_generation/run.py run_id=<your_run_id>

# MLflow run settings (required)
run_id: "<run-id>"  # Replace with your MLflow run ID
experiment_id: "<experiment-id>"  # Replace with your MLflow experiment ID


# MLflow tracking settings - update for your environment
tracking_uri: "${oc.env:MLFLOW_TRACKING_URI,local}"
registry_uri: "${oc.env:MLFLOW_REGISTRY_URI,local}"

# Device override (optional): set to "cuda" to run analysis on GPU
# CLI override: `+device=cuda`
# device: cuda

# Layer selection
# null = auto-select last layer
# Examples: "L0.resid.post", "L3.resid.post", "Lcat"
layer: "L3.resid.post"

# Ground truth reference line for dims@95 plot
# Set to the sum of factor dimensions for your generative process
# Example: 3 mess3 factors (3 dims each) + 2 tom_quantum factors (5 dims each) = 3*3 + 2*5 = 19
gt_dims95: 10

# Step filtering for plots
# Set to limit the x-axis range of plots
cev_max_step: 10000  # Max step for CEV curves plot
dims_max_step: 15000  # Max step for panel (c) intrinsic dimension
rmse_max_step: 100000  # Max step for panel (d) dims+RMSE
log_scale: true  # Use log scale for x-axis on panels (c) and (d)

# Metric keys
loss_metric_key: loss/step  # Metric key for training loss

# Checkpoint selection for belief regression visualization
# null = use latest checkpoint
checkpoint_step: null

# CEV recomputation settings
# Set recompute_cev=true if CEV history is not logged to MLflow
recompute_cev: true
cev_n_checkpoints: 200  # Use all available checkpoints up to cev_max_step
cev_batch_size: 1000  # Batch size for sequence generation

# dims@95 recomputation settings
# Set recompute_dims95=true to get finer resolution than MLflow logging
recompute_dims95: true
dims95_n_checkpoints: 50  # More checkpoints for smoother curve

# RMSE recomputation settings
# Set recompute_rmse=true to get RMSE at early checkpoints
recompute_rmse: true
rmse_n_checkpoints: 200  # Use all available checkpoints up to cev_max_step

# BOS token handling
# Set to true to skip BOS-only prefixes in analysis (recommended when BOS token is used)
skip_bos: true

# Prefix length filtering
# Set to limit analysis to early token positions (e.g., 10 for first 10 positions)
max_prefix_length: 10

# Output settings
# ICML column width: 3.25in, full width: 6.75in
output_path: figure_icml.png
supplemental_path: figure_icml_supplemental.png  # Set to null to skip supplemental
output_format: png  # png, pdf, svg
dpi: 300  # High DPI for good quality
figsize:
  - 6.75  # ICML full page width (inches)
  - 4.0   # Main figure height (2 rows)
supplemental_figsize:
  - 6.75  # ICML full page width
  - 2.5   # Supplemental figure height (1 row)

# Caching - set use_cache=false to force recomputation
use_cache: true
cache_dir: .cache
