# Sweep header: target project, the script to launch, the search method,
# and the metric the sweep is scored on.
# NOTE(review): layout matches a Weights & Biases sweep config - confirm.
project: 'ddflow_rm_cres_v0.3'
program: 'train_sweep.py'
method: grid
# Lower values of the named metric are better.
metric:
  goal: minimize
  name: valid_loss_cmin_dl0
parameters:
  # Fixed path handed to the program as `default_configs`.
  # NOTE(review): presumably the base config the entries below override -
  # confirm against train_sweep.py.
  default_configs:
    value: 'configs/defaults/rm_cres.yaml'

  # opt
  # Optimizer group: `lr` (4 candidates) and `wd` (3 candidates) are the
  # only multi-valued entries; the rest are pinned to a single setting.
  lr:
    values:
      - 0.001
      - 0.003
      - 0.01
      - 0.03
  wd:
    values:
      - 1.0e-3
      - 1.0e-2
      - 1.0e-1
  bs:
    values:
      - 256
  opt:
    value: 'adamax'
  scheduler:
    value: 'steplr'

  # Ten consecutive seeds, 3000 through 3009.
  seed:
    values:
      - 3000
      - 3001
      - 3002
      - 3003
      - 3004
      - 3005
      - 3006
      - 3007
      - 3008
      - 3009

  # flow params
  # Every entry in this group has exactly one candidate, so the group is
  # effectively fixed for the whole sweep.
  hidden_units:
    # A single candidate whose value is itself the list [64, 64].
    values:
      - [64, 64]
  num_layers:
    values:
      - 3
  num_bins:
    values:
      - 16
  flow_type:
    value: 'unconstrained_rational_quadratic'
  activation:
    value: 'swish'
  # Booleans use canonical lowercase so they parse the same way under
  # YAML 1.1 and 1.2 loaders and pass yamllint's `truthy` rule.
  shuffle:
    value: true
  actnorm:
    value: true

  # training
  # Both entries are fixed: a single epoch count and a single clip value.
  epochs:
    values:
      - 100
  # NOTE(review): 0.0 presumably means "no gradient clipping" - confirm
  # against how train_sweep.py interprets grad_clip.
  grad_clip:
    value: 0.0

  # experiment setup
  # `default_param` is the only multi-valued entry in this group:
  # 13 candidates listed in descending order from 1.0 down to 0.1.
  default_param:
    values:
      - 1.0
      - 0.99
      - 0.975
      - 0.95
      - 0.9
      - 0.825
      - 0.75
      - 0.625
      - 0.5
      - 0.4
      - 0.33
      - 0.25
      - 0.1
  # Booleans use canonical lowercase so they parse the same way under
  # YAML 1.1 and 1.2 loaders and pass yamllint's `truthy` rule.
  opt_params:
    value: false
  # Explicit null rather than an omitted key.
  # NOTE(review): presumably "no separate initial value" - confirm.
  init_default_param:
    value: null
  fine_tune:
    value: false

  # Fixed flag; written as canonical lowercase `true` so it parses the
  # same way under YAML 1.1 and 1.2 loaders (yamllint `truthy`).
  check_param_fit:
    value: true
