defaults:
  - _self_  # Ensures that this file is self-contained

project: "TASK3_EDGE"

dataset:
  name: "traffic-anaheim-simulation" # "traffic-anaheim-simulation", "traffic-barcelona-simulation", "traffic-chicago-simulation", "traffic-winnipeg-simulation"
  splits: 20 # Number of dataset splits
  max_dim: 2 # Maximum simplex dimension
  feat_init: "random" # "zeros", "random"
  device: "cuda" # "cpu", "cuda"
  split_number: 0 # Split number - will be modified for each split, initialize to 0
  adjacencies: "TrafficSSN" # Which adjacencies to select (TrafficSSN for experiments in the paper)
  data_path: "data" # Path to store the dataset
  seed: 42

model:
  routing: False # Not implemented for edge tasks
  hidden_sizes_list: [32,32,32] # Embedding size for each simplex dimension. List with length >= max_dim
  num_layers: 9 # Number of layers in the model
  conv_type: "GCN" # Type of convolution layer (GAT, SAGE, GCN)
  dropout: 0.1 # Dropout rate 
  jumping_knowledge: null # Not implemented for edge tasks
  normalize: false # Whether to apply L2 normalization at the output of each layer
  in_aggr: mean # Aggregation function for incoming messages
  out_aggr: mean # Aggregation function for outgoing messages
  lin_res: True # Whether to use linear residual connections (skip-connections)
  bn: False # Whether to use batch normalization
  ln: False # Whether to use layer normalization
  k: 4 # Number of experts (when using routing SSN)
  loss_alpha: 1.0 # Weight for the loss on directed edges vs undirected edges

training:
  seed: 42
  n_epochs: 1500 # Number of epochs for training
  lr: 0.01 # Learning rate
  wd: 0.0 # Weight decay
  patience: 80 # Number of epochs to wait for improvement before stopping
  iterations: 1 # Number of repetitions for each experiment
  device: "cuda" # "cpu", "cuda"
  gpu_idx: 1 
  validation: 1 # Every how many epochs to perform validation
