# Environment key for this configuration.
env: sc2_v2

# Settings nested under env_args.
# NOTE(review): presumably forwarded to the environment constructor - confirm against the loader.
env_args:
  continuing_episode: false
  difficulty: '7'  # quoted, so it loads as a string rather than an integer
  game_version: null
  # `task` is one of the names listed in train_task_ls / total_task_ls in this file.
  task: 'terran_5_vs_5_meta1'
  map_name: '10gen_terran'
  move_amount: 2

  # Observation switches (obs_* keys).
  obs_all_health: true
  obs_instead_of_state: false
  obs_last_action: false
  obs_own_health: true
  obs_pathing_grid: false
  obs_terrain_height: false
  obs_timestep_number: false

  # Reward settings (reward_* keys).
  reward_death_value: 10
  reward_defeat: 0
  reward_negative_scale: 0.5
  reward_only_positive: true
  reward_scale: true
  reward_scale_rate: 20
  reward_sparse: false
  reward_win: 200

  # Replay output location and file prefix; both are empty strings here.
  replay_dir: ''
  replay_prefix: ''

  # Field-of-view, range and own-position options.
  conic_fov: false
  use_unit_ranges: true
  min_attack_range: 2
  obs_own_pos: true
  num_fov_actions: 12

  # Global-state switches (state_* keys).
  state_last_action: true
  state_timestep_number: false

  # Remaining options; seed is left unset (null).
  step_mul: 8
  seed: null
  heuristic_ai: false
  heuristic_rest: false
  debug: false
  prob_obs_enemy: 1.0
  action_mask: true

# Evaluation settings (test_* keys).
test_greedy: true
test_nepisode: 32
test_interval: 500

# Logging and checkpoint intervals.
# NOTE(review): the unit of these intervals is not stated here - confirm whether they count the same steps as t_max.
log_interval: 500
runner_log_interval: 500
learner_log_interval: 500
save_model_interval: 10000

# Run length.
t_max: 40000  # 40000 training gradient steps
encoder_train_episode: 20000

# Size limits.
# NOTE(review): presumably upper bounds used to pad inputs across tasks of different sizes - confirm against the consumer.
id_length: 5
max_agent: 20
max_ally_num: 20
max_enemy_num: 23
max_step_num: 200
# Weights for the loss terms named by each key (reward / own / ally / enemy).
# NOTE(review): how these terms are combined is not visible in this file - confirm in the learner code.
reward_loss_weight: 0.1
own_loss_weight: 0.01
ally_loss_weight: 1.0
enemy_loss_weight: 1.0
# NOTE(review): presumably a reward scaling factor applied on the encoder side - confirm.
encoder_reward_scale: 0.1

# Checkpoint identifiers.
# NOTE(review): -1 looks like a "none selected" sentinel - confirm against the loader.
pretrain_id: -1
vae_id: -1

# Role-encoder switches.
prior_role_use_history: true
separate_role_encoding: true

# Task counts: num_tasks equals the length of total_task_ls (17) and
# num_train_tasks equals the length of train_task_ls (5).
num_tasks: 17
num_train_tasks: 5

# Tasks in the training split.
train_task_ls:
  - 'terran_5_vs_5_meta1'
  - 'terran_5_vs_5_meta2'
  - 'terran_10_vs_10_meta3'
  - 'terran_10_vs_11_meta1'
  - 'terran_10_vs_11_meta2'

# Tasks in the test split.
test_task_ls:
  - 'terran_5_vs_5_test1'
  - 'terran_5_vs_5_test2'
  - 'terran_5_vs_5_test3'
  - 'terran_10_vs_10_test1'
  - 'terran_10_vs_10_test2'
  - 'terran_10_vs_10_test3'
  - 'terran_10_vs_11_test1'
  - 'terran_10_vs_11_test2'
  - 'terran_10_vs_11_test3'
  - 'terran_20_vs_20_test1'
  - 'terran_20_vs_20_test2'
  - 'terran_20_vs_20_test3'

# Every training and test task, grouped by scenario size.
total_task_ls:
  - 'terran_5_vs_5_meta1'
  - 'terran_5_vs_5_meta2'
  - 'terran_5_vs_5_test1'
  - 'terran_5_vs_5_test2'
  - 'terran_5_vs_5_test3'
  - 'terran_10_vs_10_meta3'
  - 'terran_10_vs_10_test1'
  - 'terran_10_vs_10_test2'
  - 'terran_10_vs_10_test3'
  - 'terran_10_vs_11_meta1'
  - 'terran_10_vs_11_meta2'
  - 'terran_10_vs_11_test1'
  - 'terran_10_vs_11_test2'
  - 'terran_10_vs_11_test3'
  - 'terran_20_vs_20_test1'
  - 'terran_20_vs_20_test2'
  - 'terran_20_vs_20_test3'

# Role identifiers.
role_ls: [0, 1, 2, 3, 4, 5]

# One list of training tasks per entry of role_ls (six lists for six roles).
# NOTE(review): presumably the i-th list belongs to role i - confirm against the consumer.
role2task:
  - ['terran_5_vs_5_meta1', 'terran_10_vs_10_meta3', 'terran_10_vs_11_meta1', 'terran_10_vs_11_meta2']
  - ['terran_5_vs_5_meta1', 'terran_5_vs_5_meta2', 'terran_10_vs_11_meta2']
  - ['terran_5_vs_5_meta2', 'terran_10_vs_11_meta2']
  - ['terran_10_vs_10_meta3']
  - ['terran_10_vs_11_meta1']
  - ['terran_10_vs_10_meta3', 'terran_10_vs_11_meta1']

# Path lists for saved components; every list is empty in this configuration.
# NOTE(review): presumably filled in when resuming from or evaluating saved models - confirm.
vae_path_ls: []
policy_path_ls: []
role_encoder_path_ls: []
prior_role_encoder_path_ls: []
encoder_path_ls: []
pretrain_path_ls: []


# Offline dataset settings; used only for single-task offline runs.
offline_data_folder: 'dataset'
role_data_root: ''
offline_data_ls: []
offline_bottom_data_path: ''
offline_data_quality: 'expert'

# Buffer sizes; the commented-out line keeps an alternative value for reference.
# offline_max_buffer_size: 4000
offline_max_buffer_size: 8000
offline_max_buffer_size_test: 100

offline_data_shuffle: false
offline_data_type: 'h5'