# configs/models/attn_next_k_from_0_8heads.yaml

# run setup
# NOTE(review): presumably the RNG seed and the compute device string —
# confirm against the config loader.
seed: 0
device: cuda

# training
train_mode: rollout_next_k_from_0
# NOTE(review): this is the only hyphenated key in the file; every other key
# is snake_case. Confirm the loader really reads `num-epochs` and not
# `num_epochs` before relying on this value.
num-epochs: 100000
kernel_bw2: 0.5  # presumably what the "0.5blur" wandb tag refers to — confirm

# evaluation / simulation
eval_mode: forecast
train_fraction: 0.5  # presumably the share of data used for training — confirm
dt_sim: 0.1  # units are not stated in this file

substeps_per_dt: 1
verlet: v  # NOTE(review): single-letter option; valid values live in the consumer

loss_type: geom_sinkhorn
vel: bundle

# Written with a decimal point and a signed exponent so that YAML 1.1 loaders
# (e.g. PyYAML) resolve it as a float; a bare `1e-4` would load as a string.
lr: 1.0e-4

# friction
friction: 0.00
# NOTE(review): with learnable_friction set to false, friction_lr is
# presumably unused — confirm against the trainer.
learnable_friction: false
friction_lr: 1.0e-2

# data features
# NOTE(review): boolean feature toggles; "com" / "ema" presumably stand for
# centre of mass / exponential moving average — confirm against the data code.
use_com: false
use_ema: true

# logging / outputs
gif_frame_skip: 1
gif_fps: 5
# NOTE(review): the *_every cadences are presumably counted in epochs
# (num-epochs is 100000 in this file) — confirm the unit in the trainer.
ckpt_every: 10000
gif_every: 10000
eval_every: 2000

# model
arch: attn_flow
dropout: 0.0
# Nested mapping of architecture options.
# NOTE(review): presumably forwarded to the constructor of the `arch` chosen
# above — confirm which keys that constructor accepts.
arch_kwargs:
  attn_heads: 8  # agrees with the "8heads" suffix in the file name and tag
  attn_hidden_dim: 64
  attn_layers: 4
  use_time: false

# experiment tracking
wandb_project: boids
# This is one plain string ("0.5blur,8heads"), not a YAML sequence.
# NOTE(review): presumably the consumer splits it on commas — confirm.
wandb_tags: 0.5blur,8heads
