# env config for the grid mpe task: Spread

# Environment selector plus the arguments stored under `env_args`.
# NOTE(review): per-key notes below are read off the key names only;
# confirm them against the grid_mpe environment implementation.
env: "grid_mpe"

env_args:
  # Plain scalar; loads as the string "cn-2".
  map_name: cn-2
  n_agents: 2
  # Two-element list; presumably the grid dimensions -- TODO confirm order.
  field_size: [6, 6]
  sight: 5
  # Presumably the maximum number of steps per episode -- TODO confirm.
  episode_limit: 50
  reach_range: 2
  default_task: true

# Evaluation settings.
# NOTE(review): presumably greedy action selection over 40 test episodes;
# confirm against the runner that reads these keys.
test_greedy: true
test_nepisode: 40

# offline dataset
# NOTE(review): how folder, name and quality are combined into a dataset
# location is not visible in this file -- confirm in the data loader.
offline_data_folder: "dataset"
# Explicit empty string (a bare `key:` would load as null instead).
offline_data_name: ""
offline_data_quality: "expert"
offline_data_size: 2000
offline_data_shuffle: false
# NOTE(review): twice offline_data_size; confirm the intended relation.
offline_max_buffer_size: 4000

# Training switches; all three are disabled in this config.
tune_all: false
standardise_returns: false
standardise_rewards: false

# NOTE(review): hard-coded device string; presumably needs overriding on
# hosts without a CUDA device -- confirm how the consumer handles this.
data_device: "cuda"

# --- Alg settings for COMAD ---
# NOTE(review): the semantics of these keys are defined by the learner code,
# which is not visible here; the notes below are hedged accordingly.
n_reuse_heads: 2
delta_m_thres: 1
# Loads as the integer 1, not the float 1.0 -- confirm the consumer does not
# depend on the numeric type.
ebm_noise_scale: 1
# stage1_steps, cont_train_steps and t_max all share the value 20000.
# NOTE(review): presumably step budgets; confirm whether they are meant to
# stay tied together when one of them is changed.
stage1_steps: 20000
cont_train_steps: 20000
t_max: 20000

# Evaluation / logging cadence: all four intervals are set to 250.
# NOTE(review): presumably counted in the same unit as t_max -- confirm.
test_interval: 250
log_interval: 250
runner_log_interval: 250
learner_log_interval: 250
