# Device string for the run.
# NOTE(review): presumably handed to the ML framework as the compute device;
# confirm how the consumer interprets it.
cuda_device: "cuda"
# Resource settings for the run.
# NOTE(review): the *_mb suffixes and `vram` are presumably megabytes, with the
# *_mb entries acting as memory-estimate terms on top of `base_mb`; confirm
# against the code that reads this section.
resources:
  resource_type: "dynamic"
  hidden_dim_mb: 20
  n_message_passing_mb: 20
  combined_mb: 4
  base_mb: 200
  vram: 49000
# Upper bound on concurrently running trials (going by the key name).
# NOTE(review): "trails" looks like a typo for "trials". The key is left as-is:
# renaming it here alone would break whatever code reads it by this name.
max_concurrent_trails: 14
# Identifier for this experiment run.
# NOTE(review): the name ends in "sage_sage", while search_space.model_class
# lists "gatv2" and "sage"; confirm the name still matches what is searched.
run_name: "ogb_arxiv_grid_search_borf_sage_sage"
# Candidate values per hyperparameter.
# The key names mirror entries under model_parameters (hidden_dim, dropout,
# n_message_passings, model_class) and dataset_parameters.pre_transform
# (n_loops, batch_add, batch_remove).
# NOTE(review): presumably each trial overrides those defaults with one
# combination from these lists (run_name says "grid_search"); confirm.
search_space:
  hidden_dim: [256, 512, 1024]
  dropout: [0.0, 0.2, 0.4, 0.6, 0.8]
  n_message_passings: [2, 4, 8, 16, 32, 64]
  n_loops: [2, 3]
  batch_add: [50, 100]
  batch_remove: [50, 100]
  model_class: ["gatv2", "sage"]
# Model settings.
# hidden_dim, dropout, n_message_passings and model_class also appear as keys
# in search_space.
# NOTE(review): presumably the values here are defaults that a trial's sampled
# values replace; confirm.
model_parameters:
  wrapper_class: "graph_gnn"
  model_class: "gcn"
  n_message_passings: 2
  hidden_dim: 32
  dropout: 0.2
  # NOTE(review): "logsoftmax" here goes together with loss "nll" under
  # training_parameters (an NLL loss expects log-probabilities); keep in sync.
  last_activation: "logsoftmax"
# Optimization and training-loop settings.
training_parameters:
  batch_size: 1
  epochs: 2000
  learning_rate: 0.01
  # Loss options: "mse", "crossentropy", "nll", "weighted_mse"
  loss: "nll"
  # Optimizer options: "adam", "sgd"
  optimizer: "adam"
  lr_scheduler_params:
    # Scheduler options: "ReduceLROnPlateau", "CyclicLR", "OneCycleLR"
    scheduler: "ReduceLROnPlateau"
    # Parameters for the scheduler class chosen above. Documentation:
    # https://pytorch.org/docs/stable/optim.html
    # For ReduceLROnPlateau: the learning rate is multiplied by `factor` after
    # `patience` epochs (scheduler steps) without improvement, never going
    # below `min_lr`; mode "min" means the monitored value should decrease.
    params:
      min_lr: 0.00001
      patience: 30
      factor: 0.5
      mode: "min"
  weight_decay: 0.0
  balance_classes: true
  # NOTE(review): optimizer is "adam"; momentum is presumably only relevant
  # for "sgd" — confirm whether this value is read at all.
  momentum: 0.1
  seed: 69
  batch_shuffle: true
  # Distinct from lr_scheduler_params.params.patience above.
  # NOTE(review): presumably the early-stopping patience — confirm.
  patience: 100
  # NOTE(review): presumably "validate every N epochs" — confirm.
  validation_frequency: 3
# Dataset selection and preprocessing.
dataset_parameters:
  class_name: "ogbn"
  name: "ogbn-arxiv"
  # Canonical lowercase boolean, matching the other booleans in this file.
  process: true
  transform:
    t_class: "minmax"
  pre_transform:
    pre_t_class: "borf3"
    # n_loops, batch_add and batch_remove are also keys in search_space.
    # NOTE(review): presumably these are defaults that a trial's sampled
    # values replace; confirm.
    n_loops: 2
    batch_add: 2
    batch_remove: 2
# Data splitting settings.
# This seed is a separate value from training_parameters.seed.
# NOTE(review): n_folds suggests k-fold cross-validation — confirm.
data_split_parameters:
  seed: 42
  n_folds: 8
# Evaluation and model-scoring settings.
evaluation_parameters:
  class_name: "classification"
  scorer_parameters:
    # Set to "loss" to use the loss value as the scoring criterion.
    criterion: "loss"
    # false: smaller criterion values are better, as is the case for a loss.
    invert_crit: false
    # Each entry names a metric; `function` selects the metric and the
    # remaining keys sit alongside it as its options.
    # NOTE(review): presumably those extra keys are forwarded as keyword
    # arguments to the metric function — confirm.
    metrics:
      accuracy:
        function: "accuracy"
        normalize: true
      f1_macro:
        function: "f1"
        average: "macro"
