# Grid sweep over batch size and scaled peak learning rate, with the AdamW
# b2 coefficient held at 0.95 for every run.
# NOTE(review): the key layout and the ${env}/${interpreter}/${program}/
# ${args_no_hyphens} macros look like a Weights & Biases sweep config --
# confirm against the launcher that consumes this file.
name: fig10_fixed_b2_2
method: grid
program: main.py

# Swept axes: 7 batch sizes x 9 learning rates = 63 grid points in total.
parameters:
  opt.batch_size:
    # 7 values, each double the previous one.
    values:
      - 16
      - 32
      - 64
      - 128
      - 256
      - 512
      - 1024
  opt.peak_lr_scaled:
    # 9 values: doubling from 5.0e-5 up to 3.2e-3, then 5.0e-3 and 1.0e-2.
    values:
      - 5.0e-5
      - 1.0e-4
      - 2.0e-4
      - 4.0e-4
      - 8.0e-4
      - 1.6e-3
      - 3.2e-3
      - 5.0e-3
      - 1.0e-2

# Launch command shared by every run. Item order is significant.
command:
  - '${env}'
  - '${interpreter}'
  - '${program}'
  # Fixed model and dataset selection.
  # NOTE(review): the "+key=value" form looks like Hydra overrides -- confirm.
  - +model=lm19m
  - +dataset=c4_t5all
  # Optimizer settings that stay constant across the whole grid.
  - "opt.optimizer='adamw'"
  - opt.b1=0.9
  - opt.b2=0.95
  - opt.weight_decay=0.1
  # Same number as the smallest swept batch size (16).
  - opt.max_microbatch_size=16
  # Scaling expressed as pow(batch_size, 0.5). The `pow` resolver is defined
  # outside this file; presumably it yields sqrt(batch size) -- TODO confirm.
  - "opt.peak_lr_scaling='${pow:${opt.batch_size},0.5}'"
  # Presumably expands to the swept parameters as key=value arguments.
  - '${args_no_hyphens}'
