# Environment selection. `env_args` groups the environment's own settings
# (presumably passed to the environment constructor -- confirm in loader).
env: 'mt_grid_mpe'

env_args:
  n_agents: 3
  n_landmarks: 6
  # Two-element size; presumably [width, height] in grid cells -- TODO confirm.
  field_size: [15, 15]
  sight: 14
  episode_limit: 70
  reach_range: 2
  task_id: 0

# Run settings: test/log/save intervals, training length and noise options.
# Booleans are written in canonical lowercase form (`true`/`false`).
test_greedy: true
test_nepisode: 32
test_interval: 500
log_interval: 500
runner_log_interval: 500
learner_log_interval: 500
save_model_interval: 10000
t_max: 40000  # 40000 training gradient steps
noise_scale: 0.05
use_obs_attack: false

# Size/limit constants. NOTE(review): presumably upper bounds used to size
# fixed-length inputs across tasks -- confirm against the consuming code.
id_length: 2
max_agent: 3
max_ally_num: 6
max_enemy_num: 6
max_step_num: 100

# Offline dataset settings; used only for single-task offline runs.
offline_data_folder: 'dataset'
# Empty list: no dataset entries are configured in this file.
offline_data_ls: []
offline_data_quality: 'expert'
offline_max_buffer_size: 4000
offline_data_shuffle: false
offline_data_type: 'h5'