# Hyperparameter sweep configuration for the `addmul_ff` task.
# NOTE(review): the layout (program/command/method/metric/parameters and the
# ${env}/${program}/${args} macros) matches the Weights & Biases sweep
# format - confirm against the launcher actually used.
---
program: main.py

# Command template for each run; the ${...} placeholders are substituted by
# the sweep launcher before execution.
command:
  - ${env}
  - python3
  - ${program}
  - ${args}

# Grid search: one run per combination of the multi-valued parameters below
# (2 layer_sizes x 25 mask_loss_weight x 10 sweep ids = 500 runs).
method: grid
metric:
  name: validation/mean_accuracy
  goal: maximize

parameters:
  # --- Fixed settings (single `value`, identical in every run) ---
  name:
    value: addmul_ff_alpha_analysis
  log:
    value: wandb
  task:
    value: addmul_ff
  stop_after:
    value: 20000
  n_digits:
    value: 2
  mask_lr:
    # Written as a decimal on purpose: YAML 1.1 loaders (e.g. PyYAML) resolve
    # `1e-2` (no decimal point) to the string "1e-2", not a float.
    value: 0.01
  step_per_mask:
    value: 20000
  bias_no_mask:
    value: 1

  # --- Swept settings (every listed value is visited by the grid) ---
  # Comma-separated sizes, quoted so they stay a single string.
  layer_sizes:
    distribution: categorical
    values:
      - "800,800,800,800"
      - "2000,2000,2000,2000"
  # 25 distinct weights from 1e-5 to 1e-3. Keep the entries unique: a value
  # listed twice (e.g. 0.00010 next to 0.0001) is the same float and would be
  # run twice by the grid.
  mask_loss_weight:
    distribution: categorical
    values:
      - 0.00001
      - 0.000015
      - 0.00002
      - 0.00003
      - 0.00004
      - 0.00005
      - 0.00006
      - 0.00007
      - 0.00008
      - 0.00009
      - 0.0001
      - 0.00011
      - 0.000125
      - 0.00015
      - 0.000175
      - 0.0002
      - 0.00025
      - 0.0003
      - 0.0004
      - 0.0005
      - 0.0006
      - 0.0007
      - 0.0008
      - 0.0009
      - 0.001
  # NOTE(review): presumably a repeat index so that each configuration is run
  # 10 times - confirm how main.py consumes this value.
  sweep_id_for_grid_search:
    distribution: categorical
    values:
      - 1
      - 2
      - 3
      - 4
      - 5
      - 6
      - 7
      - 8
      - 9
      - 10

