---
# Experiment configuration: shared run settings at the top level, followed
# by one entry per algorithm under `configs`.
# NOTE(review): units and exact semantics of the values below are defined by
# the consuming code, which is not visible from this file — confirm before
# relying on any interpretation given in these comments.

experiment_name: gpt2_config_example

# Presumably the simulated-time budget and the number of metric evaluations
# performed during the run — TODO confirm units and meaning.
sim_time: 30000
metric_check_num: 50

# Presumably timing parameters for worker computation and communication
# (single value vs. [low, high] pair) — TODO confirm how lists are read.
times_to_calculate: [1, 10]
times_to_communicate: [0]

# Top-level training settings; no entry in `configs` overrides them.
batch_size: 32
optimizer: adamw
num_workers: 8

# One entry per algorithm to run. Every entry names an `algorithm` and a
# two-element `step_size_range`.
# NOTE(review): the range bounds are negative integers, so they look like
# exponents of a step-size grid — confirm the base and whether the upper
# bound is inclusive.
configs:
  # Only entry without `server_params`.
  - algorithm: synchronized_sgd
    step_size_range: [-11, -10]

  # The next three entries sweep the same `num_grads_list` values.
  - algorithm: ringmaster_sgd
    step_size_range: [-10, -7]
    server_params:
      num_grads_list: [16, 32, 64]

  - algorithm: rennala_sgd
    step_size_range: [-10, -7]
    server_params:
      num_grads_list: [16, 32, 64]

  - algorithm: local_sgd
    step_size_range: [-10, -7]
    server_params:
      num_grads_list: [16, 32, 64]

  # Only entry with `worker_params`; it also uses a narrower step-size range
  # than the other non-synchronized entries.
  - algorithm: ringmaster_sgd_compcomm
    step_size_range: [-10, -9]
    server_params:
      num_grads_list: [16, 32, 64]
    worker_params:
      # Explicit null: the key is present but carries no value.
      # NOTE(review): presumably this disables or defaults the ratio —
      # verify against the consumer.
      target_communicate_compute_ratio: null
      min_local_steps_list: [2, 4]
      local_step_size_multiplier_list: [1]
