out_dir: results
metric_best: accuracy
repeat: 10
wandb:
  use: False
  project: malnet
  entity: expand-gnns
dataset:
  format: PyG-MalNetTiny
  name: LocalDegreeProfile
  task: graph
  task_type: classification
  transductive: False
  node_encoder: True
  node_encoder_name: LinearNode #+RWSE
  edge_encoder: True
  edge_encoder_name: DummyEdge
  edge_encoder_bn: False
posenc_ERN:
  enable: False
  model: Linear
  dim_pe: 8
  layers: 2
#posenc_RWSE:
#  enable: True
#  kernel:
#    times_func: range(1,17)
#  model: Linear
#  dim_pe: 20
#  raw_norm_type: BatchNorm
train:
  mode: custom
  batch_size: 64 #64
  eval_period: 1
  ckpt_period: 100
model:
  type: MultiModel
  loss_fun: cross_entropy
  edge_decoding: dot
  graph_pooling: max
gt:
  layer_type: CustomGatedGCN+Primphormer_lm # some other options: Exphormer, GINE+Exphormer, GINE, GINE__exp
  layers: 5 # 5
  n_heads: 1
  dim_hidden: 84 # 84  # `gt.dim_hidden` must match `gnn.dim_inner`
  dropout: 0.15 #0.12
  attn_dropout: 0.5
  layer_norm: False
  batch_norm: True
  primphormer:
    low_rank: 50
    vns: 50
gnn:
  head: default
  layers_pre_mp: 1 # 1
  layers_post_mp: 2 #3  # Not used when `gnn.head: san_graph`
  dim_inner: 84 # 84  # `gt.dim_hidden` must match `gnn.dim_inner`
  batchnorm: True
  act: relu
  dropout: 0.15
  agg: mean
  normalize_adj: False
optim:
  clip_grad_norm: True
  optimizer: adamW
  weight_decay: 1e-3 #1e-3
  base_lr: 0.001 #0.001
  max_epoch: 300
  scheduler: cosine_with_warmup
  num_warmup_epochs: 5 #10
  patience: 0
  eta: 1.0 # 0.01 # weight for KSVD loss
#optim:
#  optimizer: adam
#  weight_decay: 0.0
#  base_lr: 0.0005
#  max_epoch: 300
#  scheduler: reduce_on_plateau
#  reduce_factor: 0.5
#  schedule_patience: 20
#  min_lr: 1e-5
