# Top-level run settings.
# NOTE(review): presumably the directory run outputs are written to — confirm
# against the training entry point.
out_dir: results
# NOTE(review): presumably the metric used to pick the "best" epoch (compare
# train.ckpt_best below) — confirm.
metric_best: accuracy
# Weights & Biases logging settings.
wandb:
  use: true
  # `project` and `entity` hold placeholder values; since `use` is true they
  # presumably need to be replaced with real W&B names before running.
  project: your-project
  entity: your-wandb-profile
  # Run label; appears to describe the `posenc_RPE.epnn.keep: 3` setting
  # in this file.
  name: epnn keep lowest 3
# Dataset selection and input-encoder settings for the BREC dataset.
dataset:
  # Note: plain `none` is the string "none", not YAML null.
  split_mode: none  # Currently has no effect for BREC
  format: Custom
  name: BREC
  task: graph  # Has no effect
  # NOTE(review): the original author believed this has no effect — confirm.
  task_type: classification
  transductive: false
  # Node encoder is enabled; its name chains two encoders with `+`.
  node_encoder: true
  node_encoder_name: LinearNode+RPETransformerBias
  node_encoder_bn: false
  # Edge encoder is disabled; the two edge_encoder_* values below are
  # presumably ignored while `edge_encoder` is false — TODO confirm.
  edge_encoder: false
  edge_encoder_name: LinearEdge
  edge_encoder_bn: false
# RPE positional-encoding settings.
# NOTE(review): presumably consumed by the `RPETransformerBias` encoder named
# in dataset.node_encoder_name — confirm.
posenc_RPE:
  enable: true
  encode: deepsets
  num_in_degrees: 64
  num_out_degrees: 64
  # Nested EPNN sub-configuration.
  epnn:
    enable: true
    num_layers: 2
    hidden_dim: 64
    output_dim: 1
    # The W&B run name in this file ("epnn keep lowest 3") appears to refer
    # to this value.
    keep: 3
  num_rpes: 1
# Training-loop and checkpointing settings.
train:
  mode: BREC
  batch_size: 12  # full batch
  eval_period: 1
  # Checkpointing can be disabled to save I/O, e.g. when just benchmarking.
  enable_ckpt: true
  # WARNING: checkpointing on every epoch in which a better model is found
  # may increase I/O significantly.
  ckpt_best: true
  # Disabled option: follow a set checkpointing schedule instead.
  # ckpt_period: 100
# Model selection and loss.
# NOTE(review): `type: RPETransformer` presumably selects the model configured
# by the `rpe_transformer` section of this file — confirm.
model:
  type: RPETransformer
  loss_fun: cross_entropy
  edge_decoding: dot
  # NOTE(review): `graph_token` is used alongside `gnn.head: graphormer_graph`
  # in this file; confirm the two are meant to be paired.
  graph_pooling: graph_token
# Transformer hyperparameters.
# NOTE(review): presumably read by the model selected via
# `model.type: RPETransformer` — confirm.
rpe_transformer:
  num_layers: 8
  num_heads: 4
  num_kernels: 8
  # Same value as gnn.dim_inner (32) in this file.
  embed_dim: 32
  # `dropout` is 0.0 while attention, MLP and input dropout are each 0.1.
  dropout: 0.0
  attention_dropout: 0.1
  mlp_dropout: 0.1
  input_dropout: 0.1
  # Degree embedding is off; both additive and multiplicative biases are on.
  use_degree_embedding: false
  use_add_bias: true
  use_mult_bias: true
# Prediction-head and generic GNN settings.
gnn:
  head: graphormer_graph
  layers_pre_mp: 0
  # Original note: not used when `gnn.head: san_graph` (the head configured
  # here is `graphormer_graph`).
  layers_post_mp: 3
  # Original note: `gt.dim_hidden` must match `gnn.dim_inner`.
  # NOTE(review): this file has no `gt` section; the value equals
  # rpe_transformer.embed_dim (32), which is presumably the constraint that
  # matters here — confirm.
  dim_inner: 32
  batchnorm: true
  act: relu
  dropout: 0.0
  agg: mean
  normalize_adj: false
# Optimizer and learning-rate schedule settings.
optim:
  # Gradient-norm clipping is enabled with a threshold value of 5.0.
  clip_grad_norm: true
  clip_grad_norm_value: 5.0
  optimizer: adamW
  weight_decay: 0.01
  base_lr: 0.001
  max_epoch: 75
  # Warmup covers 5 of the 75 epochs configured above.
  scheduler: polynomial_with_warmup
  num_warmup_epochs: 5
