cuda_device: 'cuda'
resources:
  resource_type: dynamic
  hidden_dim_mb: 3.6
  n_message_passing_mb: 1
  combined_mb: 3.6
  base_mb: 1000
  vram: 48000
max_concurrent_trails: 14
run_name: "ogb_arxiv_grid_search_pair_sage"
search_space:
  hidden_dim: [128, 256, 512]
  dropout: [ 0.0, 0.2, 0.4, 0.6, 0.8 ]
  n_message_passings: [ 16,32,64 ]
  msg_passing_method: [ "sage"]
  model_class: [ "gcn_pair" ]
model_parameters:
  wrapper_class: "node_gnn"
  model_class: "gcn_pair"
  msg_passing_method: "gat_v2"
  #  msg_passing_method: "gcn" # Options: "gcn", "gat_v2", "sage", "gin",
  n_message_passings: 2
  hidden_dim: 32
  dropout: 0.2
  last_activation: "logsoftmax"
training_parameters:
  batch_size: 1
  epochs: 500
  learning_rate: 0.01
  loss: "nll" # Options: "mse", "crossentropy", "nll", "weighted_mse"
  optimizer: "adam" # Options: "adam", "sgd"
  lr_scheduler_params:
    scheduler: "ReduceLROnPlateau" # Options: "ReduceLROnPlateau", "CyclicLR", "OneCycleLR"
    params: # Give the parameters for the specific class you chose. Here you can find the documentation: https://pytorch.org/docs/stable/optim.html
      min_lr: 0.00001
      patience: 30
      factor: 0.5
      mode: 'min'
  weight_decay: 0.000
  balance_classes: true
  momentum: 0.1
  seed: 69
  batch_shuffle: true
  patience: 100
  validation_frequency: 5
dataset_parameters:
  class_name: "ogbn"
  name: "ogbn-arxiv"
  process: True
  transform:
    t_class: "minmax"
data_split_parameters:
  seed: 42
  n_folds: 8
evaluation_parameters:
  class_name: "classification"
  scorer_parameters:
    criterion: loss # give "loss" to use loss as criterion
    invert_crit: false # small should be good like loss
    metrics:
      accuracy:
        function: "accuracy"
        normalize: true
      f1_macro:
        function: "f1"
        average: "macro"
