# Original:  zinc-GRIT-2000.yaml
out_dir: results
metric_best: mae
metric_agg: argmin
tensorboard_each_run: False  # Log to Tensorboard each run
#accelerator: "cuda:3"
#device: "cuda:3"
accelerator: "cuda:0"
mlflow:
  use: False
  project: Exp
  name: QM9
wandb:
  use: False
  project: QM9
dataset:
  format: PyG-QM9
  name: standard
  task: graph
  task_type: regression
  transductive: False
  node_encoder: True
  node_encoder_name: TypeDictNode+CAPE
  node_encoder_num_types: 5
  node_encoder_bn: False
  edge_encoder: True
  edge_encoder_name: TypeDictEdge
  edge_encoder_num_types: 4
  edge_encoder_bn: False
  max_num_nodes: 29
  remove_h: False
  half: False
  target: 2  # for \epsilon_HOMO
posenc_RWSE:
  enable: False
  kernel:
    times_func: range(1,21)
  model: Linear
  dim_pe: 16
  raw_norm_type: BatchNorm
posenc_RRWP:
  enable: False
  ksteps: 16
posenc_CAPE:
  enable: True
  type: onespace
  decouple: True
  use_signnet: False  # override other settings to use SignNet; always set to False, otherwise use posenc_SignNet
  use_laplacian: True
  normalize_matrix: False
  dim_h: 64
  dim_pe: 28
  layers: 4
  gp_layer: 'ew'
  set2set_layers: 2
  max_mult: 4
  eigen_noise: 1e-5
  use_eigenvalue: False # use eigenvalue information in Clifford NN
  use_concat: False # concatenate invariant representations of different eigenspaces for each graph, instead of pooling
  dim_reduction_method: 'learnable_project'
  eigvec_lim: 8
  restrict_grade: None
  share_weights: False
  lambda_norm: 'none'
train:
  mode: custom
  batch_size: 256
  eval_period: 1
  ckpt_period: 100
  ensemble_repeat: 1
  ensemble_mode: none
model:
  type: GPSModel
  loss_fun: l1
  edge_decoding: dot
  graph_pooling: add
gt:
  layer_type: GINE+Transformer  # CustomGatedGCN+Performer
  layers: 10
  n_heads: 4
  dim_hidden: 64  # `gt.dim_hidden` must match `gnn.dim_inner`
  dropout: 0.0
  attn_dropout: 0.2
  layer_norm: False
  batch_norm: True
gnn:
  head: san_graph
  layers_pre_mp: 0
  layers_post_mp: 3  # Not used when `gnn.head: san_graph`
  dim_inner: 64  # `gt.dim_hidden` must match `gnn.dim_inner`
  batchnorm: True
  act: elu
  dropout: 0.0
  agg: mean
  normalize_adj: False
  num_layer_MPNN: 1
  similarity_type: cos
  inference_mode: original
  mp_threshold: 0.0
  force_undirected: False
optim:
  clip_grad_norm: True
  optimizer: adamW
  weight_decay: 1e-5
  base_lr: 0.001
  max_epoch: 1000
  scheduler: cosine_with_warmup
  num_warmup_epochs: 50

