from MegaGNN.graphgym.register import register_config
from typing import Union

@register_config('dataset_cfg')
def dataset_cfg(cfg):
    """Dataset-specific config options.
    """

    # The entity to perform the task in an heterogeneous graph dataset
    cfg.dataset.task_entity = None

    # The number of node types to expect in TypeDictNodeEncoder.
    cfg.dataset.node_encoder_num_types = 0

    # The number of edge types to expect in TypeDictEdgeEncoder.
    cfg.dataset.edge_encoder_num_types = 0

    # VOC/COCO Superpixels dataset version based on SLIC compactness parameter.
    cfg.dataset.slic_compactness = 10

    # infer-link parameters (e.g., edge prediction task)
    cfg.dataset.infer_link_label = "None"

    cfg.dataset.reverse_mp = False
    cfg.dataset.add_ports = False
    cfg.dataset.fraudgt_ports = False

    cfg.dataset.ports_as_separate_nodes = False # only used for cybersecurity dataset
    
    cfg.dataset.rand_split = False