# Device string for the run (presumably passed to the framework as the
# compute device — confirm against the loader).
cuda_device: "cuda"
# Resource settings for the run. The "_mb" suffixes suggest amounts in
# megabytes that feed a per-trial memory estimate — TODO confirm the units
# and how the fields are combined in the consumer.
resources:
  resource_type: "dynamic"
  hidden_dim_mb: 8
  n_message_passing_mb: 40
  combined_mb: 4
  base_mb: 200
# NOTE(review): "trails" is presumably a typo for "trials". The key name is
# read by the consumer, so rename it only together with the loading code.
max_concurrent_trails: 20
# Name given to this run.
run_name: "grid_search_arxiv_sage_no_balancing"
# Candidate values per hyperparameter. Every key here also appears under
# model_parameters; presumably each combination overrides those values for
# one trial — confirm against the search driver.
search_space:
  hidden_dim: [128, 256, 512]
  dropout: [0.0, 0.2, 0.4]
  n_message_passings: [2, 4, 8, 16, 32, 64]
  model_class: ["sage"]
# Model settings. model_class, n_message_passings, hidden_dim and dropout are
# also listed in search_space; presumably the values below act as defaults
# that the search overrides — TODO confirm.
model_parameters:
  wrapper_class: "node_gnn"
  model_class: "sage"
  n_message_passings: 2
  hidden_dim: 32
  dropout: 0.2
  # "logsoftmax" here is paired with loss "nll" in training_parameters.
  last_activation: "logsoftmax"
# Optimisation and training-loop settings.
training_parameters:
  batch_size: 1
  epochs: 2000
  learning_rate: 0.003
  # Options: "mse", "crossentropy", "nll", "weighted_mse"
  loss: "nll"
  # Options: "adam", "sgd"
  optimizer: "adam"
  lr_scheduler_params:
    # Options: "ReduceLROnPlateau", "CyclicLR", "OneCycleLR"
    scheduler: "ReduceLROnPlateau"
    # Parameters for the scheduler class chosen above.
    # Documentation: https://pytorch.org/docs/stable/optim.html
    params:
      min_lr: 0.00074
      patience: 25
      factor: 0.5
      mode: "min"
  weight_decay: 0.0
  # This is the string "none", not a YAML null.
  loss_class_weighting: "none"
  # NOTE(review): presumably only used when optimizer is "sgd" — confirm.
  momentum: 0.1
  seed: 69
  batch_shuffle: true
  # Separate from lr_scheduler_params.params.patience; presumably the
  # early-stopping patience — confirm against the training loop.
  patience: 50
  validation_frequency: 3
# Dataset selection and preprocessing settings.
dataset_parameters:
  class_name: "ogbn"
  name: "ogbn-arxiv"
  # Lowercase true/false is the boolean spelling every YAML schema accepts.
  process: true
  transform:
    t_class: "minmax"
# Data split settings. This seed is distinct from training_parameters.seed.
data_split_parameters:
  seed: 42
  # Number of folds (presumably cross-validation folds — confirm).
  n_folds: 6
# Evaluation and scoring settings.
evaluation_parameters:
  class_name: "classification"
  scorer_parameters:
    # Set to "loss" to use the loss as the criterion.
    criterion: "loss"
    # false: smaller criterion values are better, as with a loss.
    invert_crit: false
    metrics:
      accuracy:
        function: "accuracy"
        normalize: true
      f1_macro:
        function: "f1"
        average: "macro"
