# Telegram Bot
# telegram_config_file: telegram_config.yml

# Dataset and splits
# NOTE(review): dataset_class looks like a dotted import path into project
# code, and data_root / data_splits_file look like relative paths — confirm
# what they are resolved against.
data_root: DATA
dataset_class: dataset.OGBGmolpcbaFeatureMap
dataset_name: ogbg-molpcba
data_splits_file: DATA_SPLITS/CHEMICAL/ogbg_molpcba/ogbg_molpcba_outer1_inner1.splits


# Hardware
# NOTE(review): max_cpus / max_gpus / gpus_per_task presumably bound the
# resources the experiment launcher may allocate — confirm with the consumer.
device: cuda
max_cpus: 20
max_gpus: 8
gpus_per_task: 1

# Data loading
dataset_getter: pydgn.data.provider.DataProvider
data_loader:
  class_name: torch_geometric.loader.DataLoader
  # NOTE(review): presumably forwarded as keyword arguments to class_name —
  # confirm against the consumer.
  args:
    num_workers: 1
    pin_memory: True


# Reproducibility
# NOTE(review): presumably seeds the random number generators used by the
# run — confirm which libraries the consumer actually seeds.
seed: 42


# Experiment
result_folder: GSPN_RESULTS/UNSUPERVISED
exp_name: unsupervised_embedding_generation_categorical
experiment: unsupervised_embedding_generation.EmbeddingTask
# NOTE(review): this flag says higher scores are better, but the early
# stopper under grid.unsupervised_config monitors validation_main_score with
# `mode: min`. Confirm in which direction metric.GSPNNodeLogLikelihood should
# be optimized and align the two settings.
higher_results_are_better: True
evaluate_every: 1
final_training_runs: 1

# Hyper-parameter grid.
# NOTE(review): list-valued entries under unsupervised_config presumably
# enumerate alternatives to be tried, while scalar entries are fixed —
# confirm against the consumer's grid semantics.
grid:
  unsupervised_config:
    model: model.GSPN
    checkpoint: True
    shuffle: True
    batch_size: 1024
    epochs: 100


    # Model specific arguments #

    embeddings_folder: 'UNSUP_GSPN_EMBEDDINGS_BASIC/'

    convolution_class: model.GSPNBaseConv
    emission_class: model.GSPNMultiCategoricalEmission

    # One entry per categorical feature (nine in total).
    # NOTE(review): each value is presumably the number of categories of that
    # feature — confirm against the emission class.
    dim_categorical_features:
      feat1: 44
      feat2: 3
      feat3: 7
      feat4: 8
      feat5: 6
      feat6: 5
      feat7: 6
      feat8: 2
      feat9: 2

    # Short leaf lists are written in flow style; order is kept as-is.
    num_mixtures: [10, 5, 20]

    num_hidden_neurons: 0  # not used at the moment
    num_layers: [5, 10, 20]

    avg_parameters_across_layers: [True, False]

    # ------------------------ #

    # Optimizer
    # A single candidate: the PyDGN Optimizer wrapper configured with
    # torch.optim.Adam at lr 0.1.
    optimizer:
      - class_name: pydgn.training.callback.optimizer.Optimizer
        args:
          optimizer_class_name: torch.optim.Adam
          lr: 0.1
          accumulate_gradients: False  # do/do not accumulate gradient across mini-batches

    # Scheduler (null here, so none is configured)
    scheduler: null

    # Loss metric
    # The same class is also used as the main scorer below.
    loss: metric.GSPNNodeLogLikelihood

    # Score metric
    # MultiScore wrapper with metric.GSPNNodeLogLikelihood as its main scorer;
    # no additional scorers are listed.
    scorer:
      - class_name: pydgn.training.callback.metric.MultiScore
        args:
          main_scorer: metric.GSPNNodeLogLikelihood

    # Readout (optional); null here, so none is configured
    readout: null

    # Training engine
    engine: pydgn.training.engine.TrainingEngine

    # Gradient clipper (optional); null here, so none is configured
    gradient_clipper: null

    # Early stopper
    # Patience of 50 against the 100 configured epochs, monitoring the
    # validation main score.
    # NOTE(review): `mode: min` treats lower validation_main_score as better,
    # while the top-level `higher_results_are_better: True` says the opposite.
    # Confirm in which direction metric.GSPNNodeLogLikelihood should be
    # optimized and align the two settings.
    early_stopper:
      - class_name: pydgn.training.callback.early_stopping.PatienceEarlyStopper
        args:
          patience: 50
          monitor: validation_main_score
          mode: min
          checkpoint: True

    # Plotter of metrics (a single fixed class, not a list of alternatives)
    plotter: pydgn.training.callback.plotter.Plotter
