# @package _global_
# Settings under the `trainer` key.
trainer:
  # Written with an explicit decimal point and a signed exponent so that
  # YAML 1.1 loaders (e.g. PyYAML) resolve it as a float; the bare form `1e9`
  # is read as the string "1e9" by those loaders. The value is still the
  # float 1e9, not an integer.
  # NOTE(review): presumably the total number of training samples — confirm
  # against the trainer, and confirm it casts to int where one is required.
  total_samples: 1.0e+9

# Settings under the `data` key.
data:
  # NOTE(review): presumably samples per batch — confirm whether this is
  # per-device or global.
  batch_size: 104
  # NOTE(review): presumably the number of timesteps per training sequence —
  # confirm against the data loader.
  unroll_length: 80

# Settings under the `network` key.
network:
  # NOTE(review): presumably the hidden (feature) dimension — confirm against
  # the model definition.
  hdim: 512
  # NOTE(review): presumably the number of stacked Mamba layers — confirm
  # against the model definition.
  mamba_num_layers: 12

# Settings under the `optimizer` key.
optimizer:
  # Equal to 5e-5.
  lr: 0.00005
  # Written with an explicit decimal point and a signed exponent so that
  # YAML 1.1 loaders (e.g. PyYAML) resolve it as a float; the bare form `2e3`
  # is read as the string "2e3" by those loaders. The value is still the
  # float 2000.0, not an integer.
  # NOTE(review): confirm the scheduler casts this to int where a step count
  # is required.
  optim_warmup_steps: 2.0e+3
  # NOTE(review): presumably the final learning rate expressed as a fraction
  # of `lr` — confirm against the scheduler implementation.
  lr_end_fraction: 0.1
  scheduler_type: cosine

# Settings under the `setup` key.
setup:
  # NOTE(review): presumably the Weights & Biases run name — confirm.
  wandb_name: il_feature_lr_cosine
  # NOTE(review): presumably the Weights & Biases logging mode — confirm
  # which values the consumer accepts.
  wandb_mode: online
