# @package _global_

# usage: +experiment=celeba/sm/northern_resonance

defaults:
    - override /ae_arch: artifact
    - override /ds: celeba/gender_smiling
    - override /labeller: gt
    - override /split: celeba/artifact/base
    - override /disc_arch: set
    - override /scorer: celeba/sm
    - _self_

seed: 0
dm:
    batch_size_tr: 4
    batch_size_te: 64
    num_samples_per_group_per_bag: 1

alg:
    steps: 20000
    ga_steps: 4
    num_disc_updates: 1
    twoway_disc_loss: false
    prior_loss_w: 0
    log_freq: ${alg.steps} # only log on the final iteration
    val_freq: 0.2
    pred_y_loss_w: 0
    pred_s_loss_w: 0
    warmup_steps: 0
    max_grad_norm: 5
    disc_loss_w: 0.01

ae_arch:
    artifact_name: ${split.artifact_name}_in_vqgan_pt
    version: null # defaults to 'latest'

ae:
    recon_loss: l1
    lr: 0.0000018348295456200725
    zs_transform: none
    optimizer_cls: ADAM
    weight_decay: 0
    zs_dim: 1

disc:
    lr: 0.000027080358427157673
    criterion: LOGISTIC_NS
    optimizer_cls: ADAM

disc_arch:
    hidden_dim_pre: null
    hidden_dim_post: null
    num_hidden_pre: 1
    num_hidden_post: ${disc_arch.num_hidden_pre}
    agg_input_dim: null
    input_norm: true
    final_bias: true

    head_dim: 64
    num_heads: 1
    num_blocks: 4
    mean_query: true

eval:
    batch_size: 12
    balanced_sampling: true
    steps: 10000
    num_hidden: 1
    hidden_dim: null
    opt:
        lr: 1.e-4
        scheduler_cls: torch.optim.lr_scheduler.CosineAnnealingLR
        scheduler_kwargs:
            T_max: ${ eval.steps }
            eta_min: 5e-7

wandb:
    group: ${split.artifact_name}_winter_pine
