# Global run settings.
# NOTE(review): `auto` presumably lets the code pick the device - confirm.
device: auto
# NOTE(review): presumably the directory where run outputs are written - confirm.
root_dir: output_testing
seed: 1
# NOTE(review): 0 looks like a placeholder filled in at runtime - confirm.
param_count: 0
# Dataset selection and loading options. Keys whose trailing comment names
# CSBM, Twitter or Shapes 3D are tagged as belonging to that dataset.
# NOTE: a bare `None` is loaded by YAML as the string "None", not as null.
dataset:
  root: ../Data
  name: amazoncomputers
  name_list: []  # In case we want to train with several datasets at the same time
  splits: [0.8, 0.2]
  k_fold: 1
  shuffle_train: true
  loss: ce
  scale: None
  use_weight: false
  balance: None
  d: 5  # CSBM
  directed: false  # CSBM
  eps: 0.5  # CSBM
  mu_norm: 1.0  # CSBM
  n: 1000  # CSBM
  p: 0.8  # CSBM
  q: 0.3  # CSBM
  std_dev: 1.0  # CSBM
  version: v2  # CSBM
  T: 10
  mu: 1.0
  kernel: exp
  w: 1.0
  alpha: 0.1
  username: user_name_1  # Twitter
  # Dates stay quoted so they are loaded as strings rather than date objects.
  start_date: '2000-01-01'  # Twitter
  end_date: '2023-01-01'  # Twitter
  use_cache: true  # Twitter: scrape data
  use_local: true  # Twitter: use local data or DB
  include_likes: false  # Twitter
  download: false  # Shapes 3D
  load_from_numpy: true  # Shapes 3D
  percentage: 100  # Shapes 3D
  percentage_list: []
  include_idx: false  # Shapes 3D
  single_split: None
  size: 64
  num_samples: 1000
  is_dense: false
  max_nodes: 150
  add_noise: false
# Model architecture and training-objective options.
# NOTE: a bare `None` is loaded by YAML as the string "None", not as null.
model:
  name: gnn
  layer_name: gatv1
  dim_inner: 64
  dim_latent: 0
  num_layers_pre: 1
  num_layers: 4
  num_layers_post: 1
  stage_type: skipsum
  # Spelled `normal`; NOTE(review): confirm this matches the name the code expects.
  distr_z: normal
  act: relu
  dropout: 0.0
  has_bn: false
  has_l2_norm: false
  num_iter_inner: 0
  r1_weight: 0.0
  max_num_points: 0
  use_only_batch_idx: -1
  load_inr: None
  pooling: None
  init: None
  plot: true
  eps_clip: 0.9
  gamma: 0.9
  coeff_mse: 0.0
  coeff_entropy: 0.0
  n_steps: 10
  warm_up_epochs: 0
  num_samples: 1
  ppo_steps: 1
  ratio: 0.5
  min_score: 0.0
  hard_pooling: false
  num_blocks: 1
  additional_losses: false
  # Same value as dataset.max_nodes (150); presumably meant to stay in sync - confirm.
  max_nodes: 150
  margin: 1.0
# Per-layer options for the graph layers.
# NOTE(review): many keys presumably only apply to specific layer types - confirm.
layer:
  eps: 0.0
  train_eps: false
  negative_slope: 0.2
  add_self_loops: false
  heads: 1
  heads_aggr: concat
  bias: true
  mode: gat
  att_mode: gatv1
  share_weights_score: true
  share_weights_value: true
  share_weights: false
  aggr: mean
  use_ansatz: false
  use_partial_ansatz: false
  w: 1.0
  w0_initial: 30.0
  num_layers_flow: 2
  aggregators: [sum, mean, min, max, std]
  scalers: [identity, amplification, attenuation, linear, inverse_linear]
  towers: 1
  pre_layers: 1
  post_layers: 1
  residual: gated
  parity: false
# Input encoding options; both values are zero in this file.
# NOTE(review): zero presumably disables the encoding - confirm.
encoding:
  num_frequencies: 0
  std_dev: 0.0
# Layer sizes for the function representation (a single entry of 32 here).
fn_representation:
  layer_sizes: [32]
# Layer sizes for the hypernetwork (a single entry of 32 here).
hypernetwork:
  layer_sizes: [32]
# PointConv options. The three `*_list` settings each hold 9 entries;
# NOTE(review): presumably one entry per layer, so keep lengths equal - confirm.
pointconv:
  out_channels_list: [64, 0, 128, 0, 256, 0, 512, 0, 1]
  num_output_points_list: [4096, 1024, 1024, 256, 256, 64, 64, 16, 1]
  num_neighbors_list: [9, 9, 9, 9, 9, 9, 9, 9, 16]
  mid_channels: [16, 16]
  linear_layer_sizes: []
  act: lrelu__0_2
  add_sigmoid: true
  norm_order: 2.0
  add_batchnorm: false
  add_weightnet_batchnorm: false
  deterministic: false
  same_coordinates: false
# Reward configuration, selected by `name`.
# NOTE(review): which lambda_*/k_* terms are used presumably depends on `name` - confirm.
reward:
  name: ratio_ub_entropy_diff
  desired_ratio: 0.5
  # Bare `None` is loaded by YAML as the string "None", not as null.
  lambda_: None
  lambda_1: 0.2
  lambda_2: 0.2
  lambda_3: 0.2
  k_1: 1.0
  k_2: 1.0
  k_3: 1.0
# Environment configuration, selected by `name`.
env:
  name: graph_one
  penalty_size: 0.0
  use_intrinsic_reward: false
  max_episode_length: 100000
  action_refers_to: node
# Training loop options.
# NOTE: a bare `None` is loaded by YAML as the string "None", not as null;
# every "unset" value in this section uses that same spelling.
train:
  max_epochs: 100
  batch_size: 64
  num_workers: 0
  limit_train_batches: None
  limit_val_batches: None
  auto_scale_batch_size: false
  auto_lr_find: false
  profiler: None  # None, simple, advanced
  enable_progress_bar: true
  max_time: None
  model_checkpoint: true
  inference_mode: true
# Early-stopping options.
# NOTE(review): the other keys presumably only matter when `activate` is true - confirm.
early_stopping:
  activate: false
  min_delta: 0.0
  patience: 3
  verbose: false
# Optimizer and learning-rate scheduler settings.
# The values are identical to those in `optim_2` in this file.
optim:
  optimizer: adam
  base_lr: 0.01
  beta_1: 0.9
  beta_2: 0.999
  momentum: 0.0
  weight_decay: 0.0
  scheduler: exp
  # NOTE(review): the keys below presumably apply only to some scheduler choices - confirm.
  gamma: 0.99
  step_size: 100
  mode: min
  factor: 0.1
  patience: 10
  cooldown: 0
# Second optimizer/scheduler configuration, with the same keys and values as `optim`.
# NOTE(review): presumably drives a second set of parameters - confirm which.
optim_2:
  optimizer: adam
  base_lr: 0.01
  beta_1: 0.9
  beta_2: 0.999
  momentum: 0.0
  weight_decay: 0.0
  scheduler: exp
  # NOTE(review): the keys below presumably apply only to some scheduler choices - confirm.
  gamma: 0.99
  step_size: 100
  mode: min
  factor: 0.1
  patience: 10
  cooldown: 0