---
# Settings for the `linear_simulation` entry.
linear_simulation:
    seed: 42
    # Written without a `_` digit separator: YAML 1.2 core-schema parsers do
    # not resolve `2_048` as an integer and would load it as a string.
    n_samples: 2048
    kernel_dim: -1          # bases of null(f) to construct DA. Set to 0 or -1 for random or full respectively.
    n_experiments: 32
    sweep_samples: 8
    # Method names selected for this entry.
    # NOTE(review): presumably matched verbatim by the consumer -- keep spelling exact.
    methods:
        - ERM
        - DA+ERM
        - DA+IVL-CV
        - DA+IVL-LCV
        - DA+IVL-CC
        - DA+IV
        - IRM
        - ICP
        - DRO
        - RICE
        - V-REx
        - MM-REx
        - L1Janzing
        - L2Janzing
        - 'Kania&Wit'       # quoted because `&` is the YAML anchor indicator; value is unchanged
    augmentations:
        - translate

# Settings for the `optical_device` entry.
optical_device:
    seed: 42
    # Written without a `_` digit separator: YAML 1.2 core-schema parsers do
    # not resolve `1_000` as an integer and would load it as a string.
    n_samples: 1000
    # Method names selected for this entry.
    # NOTE(review): presumably matched verbatim by the consumer -- keep spelling exact.
    methods:
        - ERM
        - DA+ERM
        - DA+IVL-CV
        - DA+IVL-LCV
        - DA+IVL-CC
        - DA+IV
        - IRM
        - ICP
        - DRO
        - RICE
        - V-REx
        - MM-REx
        - L1Janzing
        - L2Janzing
        - 'Kania&Wit'       # quoted because `&` is the YAML anchor indicator; value is unchanged
    augmentations:
        - gaussian-noise

# Settings for the `colored_mnist` entry.
colored_mnist:
    seed: 42
    # NOTE(review): how `num_seeds` relates to `seed` is not visible in this file -- confirm with the loader.
    num_seeds: 10
    # Written without a `_` digit separator: YAML 1.2 core-schema parsers do
    # not resolve `60_000` as an integer and would load it as a string.
    n_samples: 60000
    # Method names selected for this entry (a shorter list than the other entries in this file).
    methods:
        - ERM
        - DA+ERM
        - DA+IVL-CV
        - DA+IVL-LCV
        - DA+IV
        - IRM
        - DRO
        - RICE
        - V-REx
        - MM-REx
    augmentations:
        # Quoted because the value contains the `>` indicator; the string itself is unchanged.
        # NOTE(review): presumably the consumer splits on `>` to chain augmentations -- confirm.
        - 'jitter > translate'

# Hyperparameters kept separate from the per-entry sections above.
hyperparameters:
    # Stochastic gradient descent settings.
    sgd:
        lr: 0.01            # learning rate for stochastic gradient descent
        batch: 256          # batch size
        epochs: 16          # number of epochs
    # Cross-validation and random-search settings.
    cv:
        folds: 5            # k-fold CV number of folds
        frac: 0.2           # vanilla CV test set fraction
        samples: 10         # number of samples for random search
        n_jobs: 1          # number of jobs to run in parallel for hyperparam search
