# Top-level run settings: compute device, resource hints, search concurrency
# and the run identifier.
# NOTE(review): the code that reads these keys is not part of this file; the
# notes below are read off the key names only — confirm against the loader.
cuda_device: 'cuda'
# Inputs for a resource estimate. The `_mb` suffix suggests megabytes, and
# `dynamic` suggests the estimate is computed per configuration — TODO confirm
# how the loader combines these terms.
resources:
  resource_type: dynamic
  hidden_dim_mb: 4
  n_message_passing_mb: 10
  combined_mb: 5
  base_mb: 500
# NOTE(review): "trails" looks like a typo for "trials". The key is left
# unchanged because the loader presumably looks it up by this exact name —
# verify before renaming.
max_concurrent_trails: 20
# Identifier for this run. The "l4" suffix presumably refers to the 4
# message-passing steps configured below — confirm.
run_name: "errica_roman-empire_sdrf_gat_l4"
# Candidate values per hyperparameter.
# hidden_dim, dropout, n_message_passings and model_class also appear with
# fixed values under model_parameters; n_loops and tau also appear under
# dataset_parameters.pre_transform.
# NOTE(review): presumably values sampled from here override those fixed
# entries — confirm the precedence in the loader.
search_space:
  hidden_dim: [32, 64, 128]
  dropout: [0.2, 0.4, 0.6, 0.8]
  n_loops: [100, 150]
  tau: [10, 100]
  # Only one candidate is listed for each of the next two keys.
  n_message_passings: [4]
  model_class: ["gatv2"]
# Fixed model settings. Several keys are also listed in search_space.
model_parameters:
  wrapper_class: "node_gnn"
  model_class: "gatv2"
  # Disabled key, kept for reference:
  #   msg_passing_method: "gcn"
  #   Options listed: "gcn", "gat_v2", "sage", "gin"
  # NOTE(review): this list spells "gat_v2" while model_class uses "gatv2".
  n_message_passings: 4
  hidden_dim: 32
  dropout: 0.2
  # NOTE(review): training_parameters.loss is "crossentropy". If that loss
  # applies its own (log-)softmax to the model output, a softmax here would
  # be applied twice — confirm against the loss implementation.
  last_activation: "softmax"
# Optimisation and early-stopping settings.
training_parameters:
  batch_size: 1
  epochs: 500
  learning_rate: 0.001
  loss: "crossentropy" # Options: "mse", "crossentropy", "nll", "weighted_mse"
  optimizer: "adam" # Options: "adam", "sgd"
  # Parses as the float 0.0.
  weight_decay: 0.000
  # NOTE(review): plain `none` parses as the string "none", not as YAML null
  # (null is written `null` or `~`). Left unchanged because the consumer may
  # compare against the string — confirm which form it expects.
  loss_class_weighting: none
  # NOTE(review): presumably only relevant when optimizer is "sgd"; with
  # "adam" selected this value may be ignored — confirm.
  momentum: 0.1
  seed: 69
  batch_shuffle: true
  # NOTE(review): the units of patience and validation_frequency (epochs vs.
  # validation rounds) are not visible here — confirm.
  patience: 30
  validation_frequency: 3
# Dataset selection and preprocessing.
dataset_parameters:
  class_name: "heterophilic"
  name: "Roman-empire"
  process: true
  # NOTE(review): presumably forces the dataset to be rebuilt on every run,
  # which can be slow when combined with a pre_transform — confirm this is
  # intended.
  force_reload: true
  # Transform applied before training. n_loops and tau here both take values
  # that also appear in the search_space candidate lists.
  # NOTE(review): "sdrf" presumably names a graph-rewiring transform —
  # confirm against the transform registry.
  pre_transform:
    pre_t_class: sdrf
    n_loops: 100
    tau: 100
# Data-splitting settings.
# NOTE(review): n_folds presumably selects k-fold cross-validation with
# k = 10 — confirm against the splitter.
data_split_parameters:
  n_folds: 10
# Evaluation settings: the selection criterion, reported metrics and
# additional representation measures.
evaluation_parameters:
  class_name: "classification"
  scorer_parameters:
    # Set to "loss" to use the loss as the selection criterion.
    criterion: loss
    # Original note: smaller values should count as better, as with a loss.
    # NOTE(review): whether `false` means "lower is better" is not visible
    # here — confirm in the scorer.
    invert_crit: false
    # Each entry names a metric; `function` selects the implementation and
    # the remaining keys are presumably passed to it as arguments — confirm.
    metrics:
      accuracy:
        function: "accuracy"
        normalize: true
      f1_macro:
        function: "f1"
        average: "macro"
  # Extra measures, each keyed by a label and selected through `function`.
  # NOTE(review): the names suggest over-smoothing measures (Dirichlet
  # energy, MAD) — confirm against the measure implementations.
  measure_params:
    dirichlet:
      function: dirichlet
      per_graph: false
      types:
      - rusch
      - cai
    # Two entries use the same function with different max_neigh_hop values.
    mad_3:
      function: mad
      max_neigh_hop: 3
    mad_1:
      function: mad
      max_neigh_hop: 1
    wu_smoothness:
      function: wu_smoothness
