# FedSSM Configuration

data:
  data_dir: "/root/autodl-tmp/vqa_v2"
  annotations_dir: "/root/autodl-tmp/vqa_v2/annotations"
  images_dir: "/root/autodl-tmp/vqa_v2/images"

model:
  pretrained_model: "unc-nlp/lxmert-base-uncased"
  max_seq_length: 20
  num_visual_features: 36
  visual_feat_dim: 2048
  visual_pos_dim: 4

lora:
  enabled: true
  rank: 8
  alpha: 16
  dropout: 0.1
  target_modules: ["query", "value"]
  bias: "none"

federated:
  num_clients: 20
  num_rounds: 8
  data_partition_strategy: "non_iid"
  non_iid_alpha: 0.5
  client_test_ratio: 0.2
  min_samples_per_client: 100

training:
  batch_size: 256
  local_epochs: 2
  learning_rate: 0.0001
  weight_decay: 0.01
  max_grad_norm: 1.0
  device: "cuda"
  num_workers: 2

optimizer:
  type: "adamw"
  betas: [0.9, 0.999]
  eps: 1e-8

output:
  output_dir: "outputs/fedssm"
  checkpoint_dir: "checkpoints/fedssm"
  log_dir: "logs/fedssm"
  run_name: "fedssm_vqa"

env:
  seed: 42
  fp16: true

evaluation:
  eval_every_n_rounds: 1
  batch_size: 512

# FedSSM specific
fedssm:
  enabled: true
  state_dim: 32
  action_dim: 16
  beta_macro: 0.9
  n_min: 4
  n_max: 8
  kappa: 2.0
  threshold_quantile: 0.5
  tau: 2.0
  beta_variance: 1.0
  beta_staleness: 0.5
  beta_loss_align: 1.0
  beta_grad_align: 0.5
  trust_eta: 1.0
  min_trust: 0.1
  max_trust: 1.0
  eta_decay: 0.99
  eta_min: 0.1
  outlier_threshold: 3.0
