# Path to the dataset configuration file used by this experiment.
# NOTE(review): presumably resolved relative to the project root — confirm.
dataset: config/datasets/cifar_100.yaml

# Training-run settings: optimizer, per-pattern parameter groups, learning-rate
# schedule, and data-loading options.
training:
  # Base optimizer settings.
  optimizer:
    name: AdamW
    lr: 1.0e-3
    weight_decay: 5.0e-4
  # Per-pattern parameter groups.
  # NOTE(review): presumably `pattern` is matched against parameter/module
  # names and `cfg` overrides the optimizer settings for that group — confirm
  # against the training code.
  param_groups:
    # weight_decay here is the same value as the optimizer-level setting above.
    - pattern: relation_graph
      cfg:
        weight_decay: 5.0e-4
    # No `cfg` is given for this group.
    # NOTE(review): presumably it falls back to the optimizer settings — confirm.
    - pattern: matcher
  # NOTE(review): presumably drops the final incomplete batch — confirm.
  drop_remain: true

  lr_schedule:
    name: cosine_annealing
    # T_max has the same value as train_epochs below.
    # NOTE(review): presumably both are counted in epochs and should be changed
    # together — confirm.
    T_max: 50
    eta_min: 1.0e-5
  train_epochs: 50
  # NOTE(review): units of the two intervals below (iterations vs. epochs) are
  # not visible in this file — confirm.
  print_interval: 20
  val_interval: 500
  batch_size: 64
  num_workers: 8

# Relation-graph model settings: pre-exported backbone/codebook artifacts,
# matcher, GNN dimensions, and IR-atlas options.
relation_graph:
  # Both artifacts are read from the same run directory
  # (run/cifar_100/codebook/deit_tiny-l9-1024_all/jit/).
  backbone_jit: run/cifar_100/codebook/deit_tiny-l9-1024_all/jit/backbone-jit.pth
  codebook_jit: run/cifar_100/codebook/deit_tiny-l9-1024_all/jit/codebook-jit.pth
  matcher:
    similarity: inner_product
  gnn:
    embed_dim: 256
    num_layers: 2
  ir_atlas:
    dist_alpha: 1
    dist_pow: 2
    # NOTE(review): presumably the spatial size of the backbone feature map —
    # confirm it matches the exported backbone.
    feat_h: 14
    feat_w: 14
    # NOTE(review): presumably a negative value disables clamping — confirm.
    clamp_vertex_attn: -1.0
    clamp_edge_attn: -1.0
    remove_self_loop: false
    prune_node_threshold: 0.01
    apply_normalize: true
  # This path is rooted at `run_kg/`, unlike the `run/` artifacts above.
  initial_state_fp: run_kg/cifar_100/init_IR_atlas-deit_tiny-l9-1024_all.pth

# Validation data-loading settings; both values equal the ones under
# `training` in this file.
validation:
  batch_size: 64
  num_workers: 8

# Loss selection and per-term weights.
loss:
  name: dkg_loss
  # One weight per named loss term.
  # NOTE(review): presumably each term is scaled by its weight and the results
  # are summed — confirm against the dkg_loss implementation.
  weight_dict:
    cls: 1.0
    re_entropy_vertex: 0.5
    re_entropy_edge: 0.75
