# Grid search over batch size and scaled peak learning rate.
# Grid size: 7 batch sizes x 10 learning rates = 70 configurations.
name: fig10_fixed_t2_3
method: grid
parameters:
  # Batch sizes: powers of two from 16 through 1024 (7 values).
  opt.batch_size:
    values:
      - 16
      - 32
      - 64
      - 128
      - 256
      - 512
      - 1024
  # Scaled peak learning rates (10 values). Each entry doubles the previous
  # one, except the last, which is 1.3e-2 rather than an exact 1.28e-2.
  opt.peak_lr_scaled:
    values:
      - 2.5e-5
      - 5.0e-5
      - 1.0e-4
      - 2.0e-4
      - 4.0e-4
      - 8.0e-4
      - 1.6e-3
      - 3.2e-3
      - 6.4e-3
      - 1.3e-2
# Script to launch for each grid point; referenced below via ${program}.
program: main.py
# Argument list used to start each run. The colon-free ${...} entries look
# like launcher-side placeholders (this file resembles a Weights & Biases
# sweep config -- TODO confirm); the remaining entries are presumably handed
# to the program as written.
command:
  - ${env}
  - ${interpreter}
  - ${program}
  # Fixed settings shared by every run in the grid. The key=value and
  # +group=name forms resemble Hydra command-line overrides -- TODO confirm
  # against main.py.
  - +model=lm19m
  - +dataset=c4_t5all
  - opt.optimizer='adamw'
  - opt.b1=0.9
  - opt.t2=10_000_000
  - opt.weight_decay=0.1
  # Same value as the smallest swept batch size (16).
  - opt.max_microbatch_size=16
  # Scaling factor tied to the swept batch size: presumably batch_size raised
  # to the power 0.4, assuming `pow` is a resolver registered by the program
  # -- verify.
  - opt.peak_lr_scaling='${pow:${opt.batch_size},0.4}'
  # Presumably expands to the swept parameters as key=value pairs without a
  # leading "--" -- confirm against the sweep launcher's documentation.
  - ${args_no_hyphens}
