# ==============================================================================
# TRAINING
# ==============================================================================
epochs: 2000  # 1000
lr: 1.0E-4
sizes: {bs: 64, k: 1}


# ----------- LOSS -----------
kl_factor: 1
kl_end_warmup: 1


# ==============================================================================
# JOINT MODEL
# ==============================================================================
learn_prior: False
stoc_dim: {x1: [16, 16, 16, 16, 100], x2: [8, 100]}
stoc_dist: 'normal'


# ==============================================================================
# VAE: X1
# ==============================================================================
x1_input_shape: [3, 64, 64]


# ----------- DETERMINISTIC LAYER -----------
x1_det_specs_bu: [[
  { t: 'dconv', c: 128, downsample: True, residual: False, f: 0.5 },
  { t: 'dconv', c: 128, downsample: True, residual: False, f: 0.5 },
],[
  { t: 'dconv', c: 128, downsample: True, residual: True, f: 0.5 },
],[
  { t: 'dconv', c: 128, downsample: True, residual: True, f: 0.5 },
],[
  { t: 'dconv', c: 128, downsample: True, residual: True, f: 0.5 },
],[
  { t: 'dense', out: 512 },
]]

x1_det_specs_td:  [[
  { t: 'dconv', c: 128, residual: True, f: 0.5 },
  { t: 'usd' },
  { t: 'dconv', c: 128, residual: True, f: 0.5 },
  { t: 'usd' },
],[
  { t: 'dconv', c: 128, residual: True, f: 0.5 },
  { t: 'usd' },
],[
  { t: 'dconv', c: 128, residual: True, f: 0.5 },
  { t: 'usd' },
],[
  { t: 'usd' },
  { t: 'dconv', c: 128, residual: True, f: 0.5 },
],[
  { t: 'dense', 'out': 512, 'reshape': [ 128, 2, 2 ]},
]]



# ----------- STOCHASTIC LAYER -----------
x1_stoc_specs: [{t: 'conv'}, {t: 'conv'}, {t: 'conv'}, {t: 'conv'}, {t: 'dense'}]
x1_stoc_upsampling: [{t: 'conv'}, {t: 'conv'}, {t: 'conv'}, {t: 'conv'}, {t: 'dense', reshape: [512]}]
x1_merge_layer: {t: 'conv'}

# ----------- RECONSTRUCTION LAYER -----------
x1_rec_specs: {t: 'conv', k: 3}
x1_rec_dist: 'sigmoid'
x1_rec_factor: 1


# ----------- GENERIC LAYER -----------
x1_nonlin: gelu


# ==============================================================================
# VAE: X2
# ==============================================================================
x2_input_shape: [1024,]


# ----------- DETERMINISTIC LAYER -----------
x2_det_specs_bu: [[
  {t: 'dense', out: 1024}, {t: 'dense', out: 768}
],[
  {t: 'dense', out: 768}, {t: 'dense', out: 768}
]]
x2_det_specs_td: [ [
  { t: 'dense', out: 1024 }, { t: 'dense', out: 1024 }
],[
  { t: 'dense', out: 768 }, { t: 'dense', out: 768 }
]]


# ----------- STOCHASTIC LAYER -----------
x2_stoc_specs: [{t: 'dense'}, {t: 'dense'}]
x2_stoc_upsampling: [{t: 'dense', reshape: [768]}, {t: 'dense', reshape: [768]}]
x2_merge_layer: {t: 'dense'}
x2_prior_layer: {t: 'dense'}


# ----------- RECONSTRUCTION LAYER -----------
x2_rec_specs: {t: 'dense'}
x2_rec_dist: 'normal'
x2_rec_factor: 1


# ----------- GENERIC LAYER -----------
x2_nonlin: leaky_relu


# ==============================================================================
# MISC
# ==============================================================================
n_modalities: 2
eval_bs: 1
exp_name: 'hierarchical_new'
trial: 'trial'
seed: 23