{
    "args": {
        "seed": [1],
        "agent_rl_algo": ["ppo"],
        "n_total_updates": [30000],
        "train_runner": ["paired"],
        "n_devices": [1],
        "student_model_name": ["default_student_actor_cnn"],
        "student_critic_model_name": ["default_student_critic_cnn"],
        "env_name": ["Overcooked"],
        "verbose": [false],
        "is_multi_agent": [true],
        "log_dir": ["~/logs/minimax"],
        "log_interval": [10],
        "from_last_checkpoint": [false],
        "checkpoint_interval": [1000],
        "archive_interval": [0],
        "archive_init_checkpoint": [false],
        "test_interval": [100],
        "n_students": [2],
        "n_parallel": [32],
        "n_eval": [1],
        "n_rollout_steps": [400],
        "lr": [3e-4],
        "lr_anneal_steps": [0],
        "max_grad_norm": [0.5],
        "adam_eps": [1e-05],
        "track_env_metrics": [true],
        "discount": [0.999],
        "n_unroll_rollout": [10],
        "render": [false],
        "ued_score": ["relative_regret"],
        "student_gae_lambda": [0.98],
        "teacher_discount": [0.999],
        "teacher_lr_anneal_steps": [0],
        "teacher_gae_lambda": [0.98],
        "student_entropy_coef": [0.01],
        "student_value_loss_coef": [0.5],
        "student_n_unroll_update": [5],
        "student_ppo_n_epochs": [8],
        "student_ppo_n_minibatches": [4],
        "student_ppo_clip_eps": [0.2],
        "student_ppo_clip_value_loss": [true],
        "teacher_entropy_coef": [0.01],
        "teacher_value_loss_coef": [0.5],
        "teacher_n_unroll_update": [5],
        "teacher_ppo_n_epochs": [8],
        "teacher_ppo_n_minibatches": [4],
        "teacher_ppo_clip_eps": [0.2],
        "teacher_ppo_clip_value_loss": [true],
        "student_recurrent_arch": ["lstm"],
        "student_recurrent_hidden_dim": [64],
        "student_hidden_dim": [64],
        "student_n_hidden_layers": [2],
        "student_is_soft_moe": [true],
        "student_soft_moe_num_experts": [4],
        "student_soft_moe_num_slots": [32],
        "student_n_conv_layers": [3],
        "student_n_conv_filters": [32],
        "student_n_scalar_embeddings": [4],
        "student_scalar_embed_dim": [5],
        "student_agent_kind": ["mappo"],
        "teacher_model_name": ["default_teacher_cnn"],
        "teacher_recurrent_arch": ["lstm"],
        "teacher_recurrent_hidden_dim": [64],
        "teacher_hidden_dim": [64],
        "teacher_n_hidden_layers": [1],
        "teacher_n_conv_filters": [128],
        "teacher_scalar_embed_dim": [10],
        "overcooked_height": [6],
        "overcooked_width": [9],
        "overcooked_n_walls": [5],
        "overcooked_normalize_obs": [true],
        "overcooked_max_steps": [400],
        "overcooked_random_reset": [false],
        "overcooked_ued_replace_wall_pos": [true],
        "overcooked_ued_fixed_n_wall_steps": [false],
        "overcooked_ued_first_wall_pos_sets_budget": [true],
        "overcooked_ued_noise_dim": [50],
        "overcooked_ued_n_walls": [15],
        "overcooked_ued_normalize_obs": [true],
        "n_shaped_reward_updates": [30000],
        "test_n_episodes": [10],
        "test_env_names": [
            "Overcooked-CoordRing6_9,Overcooked-ForcedCoord6_9,Overcooked-CounterCircuit6_9,Overcooked-AsymmAdvantages6_9,Overcooked-CrampedRoom6_9"
        ],
        "overcooked_test_normalize_obs": [true]
    }
}