# @package _global_

# Hydra defaults list: this config is composed on top of `_default`.
# NOTE(review): `_default` is presumably a sibling config file -- confirm.
defaults:
  - _default
dataset:
  # Dataset selectors, one entry per dataset family.
  # NOTE(review): the trailing `.*` suggests each entry is matched as a
  # pattern against dataset names -- confirm against the dataset loader.
  datasets:
    - 'mc_maze.*'
    - 'dyer_co.*'
    - 'gallego_co.*'
    - 'churchland_misc.*'
  # Disabled override, kept for reference:
  # scale_limit: 4000
train:
  # Per-step batch size. The original note ties this value to "80G"
  # (NOTE(review): presumably an 80 GB accelerator -- confirm).
  batch_size: 512
  # 512 samples x 4 accumulated batches -> effective batch size of 2048.
  accumulate_batches: 4
  # NOTE(review): presumably disabled so the fixed batch size above is
  # used as written -- confirm against the training code.
  autoscale_batch_size: false
model:
  transformer:
    # Sets model.transformer.n_layers to 12.
    # NOTE(review): presumably the number of transformer layers -- confirm.
    n_layers: 12