# Dataset selection.
# NOTE(review): `mass` is presumably a dataset identifier resolved by the data
# loader, and `n_subj` the number of subjects to use — confirm against the
# code that reads this section.
data:
  dataset: mass
  n_subj: 60
# Policy sizing parameters.
# NOTE(review): presumably each fold gets a policy made of 5 subpolicies, each
# of length 2 — confirm against the code that reads this section.
policy:
  policy_size_per_fold: 5
  subpolicies_length: 2
# Settings for the `diff` mode: separate epoch budgets for the search phase
# and the assessment phase.
# NOTE(review): `diff` presumably refers to a differentiable/gradient-based
# search — confirm against the consumer.
diff:
  search_epochs: 50
  assess_epochs: 300
  # NOTE(review): presumably the interval (in epochs) between evaluations —
  # confirm the unit.
  eval_step: 5
# Settings for the `discrete` mode: a trial budget plus a per-trial epoch count.
# NOTE(review): presumably a discrete (trial-based) search — confirm against
# the consumer.
discrete:
  n_trials: 200
  # Note: differs from `diff.eval_step` (5).
  eval_step: 10
  epochs: 300
# Data-splitting and batching settings.
split:
  # With 5-fold, corresponds to 1-47 nights (train-val).
  # NOTE(review): 0.0208 is approximately 1/48, i.e. presumably 1 training
  # night out of the 48 non-test nights left by a 5-fold split of 60 subjects,
  # with the remaining 47 used for validation — confirm against the splitter.
  train_size_over_valid: 0.0208
  # Written as an explicit float (`1.0`) rather than the bare-dot form `1.`.
  data_ratio: 1.0
  batch_size: 16
  random_state: 29
  n_folds: 5
  # Canonical lowercase boolean.
  grouped_subset: true
# Optimizer and stopping settings used during training.
training:
  lr: 0.001
  # Canonical lowercase boolean.
  early_stop: true
