project: ddflow_rm_cres_v0.1
program: train_sweep.py
method: grid
metric:
  name: valid_loss_cmin_dl0
  goal: minimize
parameters:
  default_configs:
    value: "configs/defaults/rm_cres.yaml"

  # opt
  lr:
    values: [0.001, 0.003, 0.01, 0.03]
  wd:
    values: [1.0e-3, 1.0e-2, 1.0e-1]
  bs:
    values: [256]
  opt:
    value: "adamax"
  scheduler:
    value: "steplr"

  seed:
    values: [3000, 3001, 3002, 3003, 3004, 3005, 3006, 3007, 3008, 3009]

  # flow params
  hidden_units:
    values: [[64, 64]]
  num_layers:
    values: [3]
  num_bins:
    values: [16]
  flow_type:
    value: "unconstrained_rational_quadratic"
  activation:
    value: "swish"
  shuffle:
    value: True
  actnorm:
    value: True

  # training
  epochs:
    values: [25]
  main_stage_epochs:
    values: [25]
  grad_clip:
    value: 0.0

  # experiment setup
  default_param:
    values: [0.99, 0.9, 0.75, 0.5]
  opt_params:
    value: True
  init_default_param:
    value: null
  fine_tune:
    value: False
  alternating:
    value: "lam"
  alternating_steps:
    values: [4]
  lam_stage_epochs:
    values: [100]
  retain_lr:
    value: true
  lam_lr:
    values: [0.03, 0.1, 0.3]
  lam_wd:
    value: 0.0
