# @package _global_
# Trainer settings.
trainer:
  # One billion. Written with an explicit mantissa dot and exponent sign so
  # that YAML 1.1 loaders (e.g. stock PyYAML) also resolve it as a float
  # instead of the string "1e9"; loaders that already accepted "1e9" as a
  # float get the same value.
  total_samples: 1.0e+9
  # NOTE(review): presumably the gradient-clipping threshold - confirm against
  # the trainer code.
  clip: 1.0

# Data settings: batch size, unroll length, and which dataset to read.
data:
  batch_size: 4
  # Same value as network.tf_mem_len (2000) in this file.
  # NOTE(review): presumably the two are meant to stay in sync - confirm.
  unroll_length: 2000
  dataset_name: nld-aa-monk
  # NOTE(review): presumably selects the on-disk format / reader - confirm.
  dataset_type: parquet

# Network settings: core sizes, per-feature embedding sizes, feature toggles.
network:
  # tf_num_heads * tf_head_dim = 4 * 128 = 512, which equals hdim.
  # NOTE(review): presumably intentional - confirm before changing one alone.
  hdim: 512
  # NOTE(review): both mamba_* and tf_* layer counts are set here; which of
  # them is actually read depends on code outside this file - confirm.
  mamba_num_layers: 12
  # Same value as data.unroll_length (2000) in this file.
  tf_mem_len: 2000
  tf_num_layers: 6
  tf_num_heads: 4
  tf_head_dim: 128

  # The *_edim keys below are all set to 16.
  # NOTE(review): "edim" presumably means embedding dimension - confirm.
  glyph_edim: 16
  group_edim: 16
  level_edim: 16
  difficulty_edim: 16
  weight_edim: 16
  speed_edim: 16

  # Boolean feature toggles; their effect is defined by the model code.
  glyph_embed_with_linear: false
  add_char_color: true
  use_inventory: true

# Run setup: experiment-tracking name and mode, and GPU count.
setup:
  wandb_name: glyphs_2k_tf_xl
  # NOTE(review): presumably passed to Weights & Biases as its run mode
  # ("offline" keeps logs local for a later sync) - confirm.
  wandb_mode: offline
  num_gpus: 2