# Network to load for this run: architecture name plus checkpoint file.
model:
  name: MadryCNN_no_maxpool_tiny  # Architecture name. This model is defined in model_defs.py; add your own model definitions there.
  path: models/bab_attack/MadryCNN_no_maxpool_tiny.pt  # Path to the PyTorch checkpoint for the architecture named above.
# Dataset and the index range of examples to process.
data:
  dataset: MNIST  # Dataset name. Presumably resolved by the "load_verification_dataset()" function in utils.py - TODO confirm.
  start: 110  # Index of the first example to verify in the dataset.
  end: 111  # End index of the examples to verify. With start: 110 this selects a single example if the end index is exclusive - TODO confirm.
# Perturbation set: norm type and radius.
specification:
  norm: .inf  # Linf norm (can also be 2 or 1). Unquoted `.inf` is parsed by YAML as floating-point infinity.
  epsilon: 0.3  # Perturbation radius, epsilon=0.3. NOTE(review): presumably relative to inputs scaled to [0, 1] - confirm.
attack:  # Currently attack is only implemented for Linf norm.
  pgd_steps: 200 # Increase for a stronger attack. A PGD attack is run before verification to filter out non-robust examples.
  pgd_restarts: 200  # Number of PGD restarts. Increase for a stronger attack.
  # NOTE(review): presumably selects the PGD variant used for the attack - confirm against the tool's documentation.
  attack_mode: diverse_pgd
  # NOTE(review): presumably schedules the PGD attack before verification, as described for pgd_steps - confirm.
  pgd_order: before
# Bound-computation settings: batch size, alpha-CROWN, beta-CROWN and MIP options.
solver:
  batch_size: 8192 # Number of subdomains to compute in parallel in beta-CROWN. Decrease if you run out of memory.
  alpha-crown:
    iteration: 100   # Number of iterations for alpha-CROWN optimization. Alpha-CROWN is used to compute all intermediate layer bounds before branch and bound starts.
    lr_alpha: 0.1    # Learning rate for alpha in alpha-CROWN. The default (0.1) is typically ok.
  beta-crown:
    lr_alpha: 0.01  # Learning rate for optimizing the alpha parameters. The default (0.01) is typically ok, but tuning it may give a better lower bound.
    lr_beta: 0.05  # Learning rate for optimizing the beta parameters. The default (0.05) is typically ok, but tuning it may give a better lower bound.
    iteration: 50  # Number of iterations for beta-CROWN optimization. 20 is often sufficient; 50 or 100 can also be used.
  # NOTE(review): presumably the number of MIP solver instances run in parallel and the threads given to each - confirm.
  mip:
    parallel_solvers: 8
    solver_threads: 1
# Branch-and-bound (BaB) settings, including the BaB-Attack and branching heuristic options.
bab:
  timeout: 600 # Timeout threshold for branch and bound. Increase for verifying more points.
  max_domains: 5000000
  get_upper_bound: true  # Needed for BaB-Attack.
  # BaB-Attack options. NOTE(review): the individual keys below are not documented in this file;
  # the names suggest beam-search, diving and MIP-attack tuning - confirm against the tool's parameter reference before changing.
  attack:
    enabled: true
    beam_candidates: 32
    beam_depth: 8
    max_dive_fix_ratio: 0.5
    min_local_free_ratio: 0.4
    mip_timeout: 30
    mip_start_iteration: 2
    refined_mip_attacker: false
  branching:  # Parameters for branching heuristics.
    reduceop: min  # Reduction function for the branching heuristic scores, min or max. Using max can be better on some models.
    method: kfsb  # babsr is fast but less accurate; fsb is slow but most accurate; kfsb is usually a balance between the two.
    candidates: 3  # Number of candidates to consider in fsb and kfsb. More candidates give slower but better branching; 3 is typically good enough.
