# Top-level experiment settings: the environment to use, a tag labelling this
# experiment, and the number of runs.
# env_name matches the `TrafficJunction` key under `env_configs` in this file.
# NOTE(review): num_runs presumably counts independent repetitions (e.g. one
# per seed) — confirm against the experiment launcher.
env_name: TrafficJunction
experiment_tag: paper_tj_adaptive
num_runs: 5

# Training and communication settings grouped under `common_config`.
# NOTE(review): presumably applied to every run of this experiment,
# independent of the environment — confirm against the config loader.
# NOTE(review): list-valued entries (msg_sizes, comm_channel_size,
# force_random_msg_size_selection) look like sweep axes with one run per
# listed value — confirm before changing their nesting.
common_config:
  learning_rate: 0.001
  num_iterations: 2000
  num_episodes: 1
  # Chosen to improve training stability.
  # NOTE(review): the original note sat directly above the gradient-clipping
  # norm; whether it also covers msg_loss_weight is not stated — confirm.
  gradient_clip_max_norm: 0.1
  msg_loss_weight: 0.1

  # Message / communication-channel settings.
  # Booleans use canonical lowercase `true`/`false` so they resolve to real
  # booleans under every YAML 1.1 / 1.2 schema.
  softmax_msg_size_selection: true
  message_mode: PseudoGradient
  msg_sizes: [[0, 32, 128]]
  comm_channel_type: StochasticSpacing
  comm_channel_size: [512]
  force_random_msg_size_selection: [false, true]

# Per-environment settings, keyed by environment name (the key below matches
# the top-level `env_name` value in this file).
env_configs:
  TrafficJunction:
    # Chosen to improve training stability.
    # NOTE(review): presumably num_envs is the number of environment instances
    # run in parallel — confirm against the environment wrapper.
    num_envs: 128
    mode: easy
    # Canonical lowercase boolean; parses the same as the previous `True`
    # under YAML 1.1 and the YAML 1.2 core schema.
    train_curriculum: true