# @package _global_
# Training-loop settings (logging, total budget, gradient handling,
# checkpointing).
# NOTE(review): the units of each value are defined by the consuming trainer
# code, which is not visible in this file — confirm before tuning.
trainer:
  log_freq: 5
  # Exponent floats are written with an explicit mantissa dot and a signed
  # exponent so that YAML 1.1 loaders (e.g. PyYAML) also resolve them as
  # floats; the bare form `1e11` is read as a string by such loaders.
  total_samples: 1.0e+11
  # NOTE(review): presumably large enough that the time budget never binds —
  # confirm.
  train_time_budget: 1.0e+30
  # NOTE(review): written as a float; confirm the trainer does not expect an
  # integer accumulation count here.
  gradient_acc: 1.0
  clip: 1.0
  chkpt_freq: 5.0e+5

# Optimizer and learning-rate schedule settings.
optimizer:
  lr: 0.0005
  optim_warmup_steps: 1000
  # NOTE(review): presumably the final learning rate expressed as a fraction
  # of `lr` — confirm against the scheduler implementation.
  lr_end_fraction: 0.1
  scheduler_type: cosine
  weight_decay: 0.1
  type: adamw

# Dataset selection and data-loading settings.
# NOTE(review): `network.obs_frame_stack` interpolates `data.obs_frame_stack`,
# which is not defined in this file; it has to come from elsewhere (e.g.
# another composed config or a command-line override) — confirm.
data:
  dataset_name: nld-aa-monk-5
  batch_size: 4
  unroll_length: 8192
  workers: 30
  env: NetHackChallenge-v0
  # The same flag also appears as `network.use_inventory` (both true here).
  # NOTE(review): presumably the two must agree — confirm.
  use_inventory: true
  dataset_type: parquet
  # Disabled game-id split file.
  # NOTE(review): the path names "monk-4" while `dataset_name` is
  # "nld-aa-monk-5" — check the path before re-enabling.
  # train_gameids: datasets/nld-aa-monk-4_split_1.npy

# Model architecture settings: embedding sizes, sequence core, and the
# per-input encoders.
network:
  # general hidden dimension
  hdim: 1024
  inv_hdim: 256
  inv_edim: 32
  core_mode: llama
  tf_num_layers: 8
  tf_num_heads: 16

  # embedding dimensions (`*_edim`) for the individual input features
  char_edim: 16
  color_edim: 8
  glyph_edim: 16
  group_edim: 4
  level_edim: 4
  difficulty_edim: 4
  weight_edim: 4
  speed_edim: 4
  corpse_edim: 2
  sacrifice_edim: 2
  use_true_blstats: false

  glyph_embed_with_linear: true

  # sequence model
  # NOTE(review): `core_mode` above is `llama`; presumably `mamba_num_layers`
  # is only read when a mamba core is selected — confirm.
  mamba_num_layers: 24
  llama_use_fp16: true

  # top encoding
  msg_hdim: 64

  # bottom encoding
  blstats_hdim: 512
  add_raw_time_encoding: false
  add_log_time_encoding: false
  add_emb_time_encoding: false
  add_layernorm_in_blstats_conv: false

  # misc
  fc_after_cnn_hdim: 512
  add_char_color: false
  # The same flag also appears as `data.use_inventory` (both true here).
  use_inventory: true
  use_message: true
  use_observation: true
  use_crop: true
  add_norm_after_linear: true
  fix_initialization: false

  # observation encoding
  include_top_and_bottom: false
  obs_kernel_size: 3
  obs_conv_blocks: 2
  # Interpolated from the `data` section. `data.obs_frame_stack` is not
  # defined in this file, so it has to be provided elsewhere (e.g. another
  # composed config or an override) — NOTE(review): confirm.
  obs_frame_stack: ${data.obs_frame_stack}
  resnet_num_blocks: 2
  resnet_num_layers: 2
  resnet_num_fc_layers: 2
  resnet_hdim: 512

  # policy
  policy_num_fc_layers: 2

# Hardware and experiment-tracking settings.
setup:
  disable_cuda: false
  num_gpus: 8
  use_amp: true

  # NOTE(review): the run name appears to encode "h1024" (consistent with
  # `network.hdim: 1024`) and "l12", but `network.tf_num_layers` is 8 —
  # confirm the name matches the intended configuration.
  wandb_name: scale_tf_xl_h1024_l12_15k
  wandb_mode: disabled
