# Training configuration

# Target device for the run: `cuda` or `cpu`.
device: cuda
# Seed value; presumably used for RNG initialisation — confirm against the
# training script.
seed: 42

# Dataset locations and loading options
data:
  # NOTE(review): train_path and val_path point at the same location.
  # Confirm this is intentional (e.g. one directory holding both splits);
  # otherwise validation would be evaluated on the training data.
  train_path: '/data/toy_offline_bav_rho1_data'
  val_path: '/data/toy_offline_bav_rho1_data'
  # Presumably the number of data-loading worker processes — confirm against
  # the loader code.
  num_workers: 4

# Optimizer configuration
optimizer:
  name: adam
  # Learning rate. Written with an explicit decimal point on purpose:
  # YAML 1.1 loaders such as PyYAML resolve a bare `1e-4` as the *string*
  # "1e-4", not a float. `1.0e-4` is a float under both YAML 1.1 and 1.2.
  lr: 1.0e-4
  # Two-element coefficient list passed through as-is to the optimizer.
  betas: [0.9, 0.999]
  # 0.0 means no weight decay is applied.
  weight_decay: 0.0

# Learning-rate schedule settings
scheduler:
  # Master switch for the scheduler.
  use_scheduler: true
  # Supported names: cosine, cosine_with_warmup
  name: cosine_with_warmup
  # Fraction of the total steps spent in warmup (0.1 = 10%).
  warmup_ratio: 0.1

# Training loop configuration
training:
  # Epoch count; reduced for testing with validation.
  num_epochs: 32
  grad_clip: 1.0
  compile_model: true
  # `eager` backend: per the original note it was picked because it works on
  # CPU.
  # NOTE(review): the top-level `device` is `cuda` — confirm this backend is
  # still the intended choice for GPU runs.
  compile_backend: eager
  use_amp: false
  # bfloat16 works on CPU with recent PyTorch. Presumably only consulted when
  # `use_amp` is true — confirm against the training script.
  amp_dtype: bfloat16
  # Run validation every 2 epochs.
  val_interval: 2
