# Dataset selection.
# NOTE(review): `n_subj` is presumably the number of subjects/recordings
# loaded from the dataset — confirm against the consuming code.
data:
  dataset: mass
  n_subj: 60
# Policy shape settings.
# NOTE(review): presumably the number of subpolicies kept per fold and the
# number of operations chained in each subpolicy — confirm with the consumer.
policy:
  policy_size_per_fold: 5
  subpolicies_length: 2
# Settings for the `diff` method.
# NOTE(review): presumably a differentiable search with separate epoch
# budgets for the search and assessment phases — confirm with the consumer.
diff:
  search_epochs: 50
  assess_epochs: 300
  eval_step: 2
# Settings for the `discrete` method.
# NOTE(review): presumably a trial-based search (`n_trials` candidates, each
# trained for `epochs`) — confirm with the consumer.
discrete:
  n_trials: 200
  eval_step: 5
  epochs: 300
# Data splitting and loading settings.
# The night counts in the inline comments match 60 subjects: 5 folds leave
# 12 for test, and the remaining 48 are divided 24/24 between train and valid.
split:
  train_size_over_valid: 0.5  # corresponds to 24 train/valid nights
  data_ratio: 1.0
  batch_size: 16
  random_state: 29
  n_folds: 5  # corresponds to 12 test nights
  grouped_subset: true
# Training loop settings.
training:
  # lr: 0.001
  early_stop: true
