# configs/models/attn_single_cell_default.yaml
#
# Default config for the attention-based model (arch: attn_flow) with EMA support.
# Sweep parameters (overridden via CLI):
#   - arch_kwargs.attn_heads (1-3)
#   - holdout-marginal (1-3)
#   - seed (0-2)

# Compute device and training schedule.
# The default targets a CUDA device.
# NOTE(review): whether the consumer falls back to CPU when CUDA is
# unavailable is not visible from this file — confirm.
device: cuda

# NOTE(review): `train_mode` is an opaque mode name resolved by the training
# code; presumably "roll out the next k steps starting from frame 0" — confirm.
train_mode: rollout_next_k_from_0
# Number of training epochs requested for the run.
num_epochs: 100000

# Simulation / time-integration settings.
# NOTE(review): presumably each simulation step of size `dt_sim` is divided
# into `substeps_per_dt` integrator sub-steps (1 = no sub-stepping) — confirm
# against the integrator implementation.
substeps_per_dt: 1
dt_sim: 0.2
# NOTE(review): `v` is an opaque integrator identifier defined by the consuming
# code; its meaning cannot be determined from this file.
integrator: v

# Loss and optimizer settings.
# NOTE(review): `geom_sinkhorn` presumably selects a Sinkhorn
# (optimal-transport) loss — confirm which implementation backs it.
loss_type: geom_sinkhorn
# NOTE(review): `bundle` is an opaque option name for `vel`; its semantics are
# defined by the consuming code and are not visible here.
vel: bundle

# Base learning rate. Keep the decimal point and the signed exponent: YAML 1.1
# loaders such as PyYAML only resolve this form to a float (a bare `1e-4`
# would be loaded as a string).
lr: 1.0e-4

# Friction
# Friction coefficient. Because `learnable_friction` is true, this is
# presumably only the initial value of a trainable parameter — confirm.
friction: 1.00
learnable_friction: true
# Dedicated learning rate for friction: 100x the base `lr` (1.0e-2 vs 1.0e-4).
# NOTE(review): presumably ignored when `learnable_friction` is false — confirm.
friction_lr: 1.0e-2

# Data features
# Optional input feature, disabled by default.
# NOTE(review): `com` presumably stands for "center of mass" — confirm against
# the data-loading code.
use_com: false

# Logging / outputs
# GIF rendering options.
# NOTE(review): presumably a frame skip of 1 keeps every frame, and playback
# is one frame per second — confirm.
gif_frame_skip: 1
gif_fps: 1
# Periodic actions. Evaluation (every 500) runs 20x more often than
# checkpointing and GIF export (every 10000).
# NOTE(review): the unit of these intervals (epochs vs. optimizer steps) is not
# visible from this file — confirm.
ckpt_every: 10000
eval_every: 500
gif_every: 10000

# Model architecture
# `arch` names the model variant; `dropout` is the dropout probability.
arch: attn_flow
dropout: 0.1

# Architecture kwargs (attn_heads can be overridden via --set)
# These are plain top-level keys in this file, not nested under a mapping.
# NOTE(review): the file header lists the sweep key as `arch_kwargs.attn_heads`
# with range 1-3, while the default here is the top-level key `attn_heads: 4`,
# which lies outside that range — confirm the intended key path and default.
attn_heads: 4
attn_hidden_dim: 64
attn_layers: 4
# NOTE(review): presumably feeds the time variable to the model as an input
# feature — confirm.
use_time: true

# W&B
# NOTE(review): the project name says "2heads", but `attn_heads` defaults to 4
# and the tags below say "4head" — confirm which one is intended. As written,
# both values are static strings and do not follow a CLI override of
# `attn_heads`.
wandb_project: wlf_2heads_0.1_dropout
# Tags are a single comma-separated string scalar, not a YAML sequence.
# NOTE(review): presumably split on "," by the consuming code — confirm before
# converting this to a list.
wandb_tags: interpolate,ema,4head,dropout_0.1