import os.path as osp

import torch
from torch_geometric.datasets import TUDataset, MoleculeNet
from ba_multi_shapes import BAMultiShapesDataset
from torch_geometric.utils import degree
import torch_geometric.transforms as T


class NormalizedDegree(object):
    def __init__(self, mean, std):
        self.mean = mean
        self.std = std

    def __call__(self, data):
        deg = degree(data.edge_index[0], dtype=torch.float)
        deg = (deg - self.mean) / self.std
        data.x = deg.view(-1, 1)
        return data


def get_dataset(name, sparse=True, cleaned=False):
    path = osp.join(osp.dirname(osp.realpath(__file__)), '../../../../datasets/', name)
    if name == 'mutag_expl':
        import mutag_expl
        dataset = mutag_expl.Mutag(path)
    elif name == 'ba_2motifs':
        import syn_dataset
        dataset = syn_dataset.SynGraphDataset(path, name)
    elif name == 'BBBP':
        dataset = MoleculeNet(name=name, root=path)
    elif name == 'BaMultiShapes':
        dataset = BAMultiShapesDataset(root=path)
    else:
        dataset = TUDataset(path, name, use_node_attr=True, use_edge_attr=True, cleaned=cleaned)
    #dataset.data.edge_attr = None

    #print(dataset.data.x is None)
    #print(dataset.transform is None)


    if dataset.data.x is None:

        max_degree = 0
        degs = [dataset.data.x is None]
        for data in dataset:
            degs += [degree(data.edge_index[0], dtype=torch.long)]
            max_degree = max(max_degree, degs[-1].max().item())

        if max_degree < 1000:
            dataset.transform = T.OneHotDegree(max_degree)
        else:
            deg = torch.cat(degs, dim=0).to(torch.float)
            mean, std = deg.mean().item(), deg.std().item()
            dataset.transform = NormalizedDegree(mean, std)

    if not sparse:
        num_nodes = max_num_nodes = 0
        for data in dataset:
            num_nodes += data.num_nodes
            max_num_nodes = max(data.num_nodes, max_num_nodes)

        '''

        # Filter out a few really large graphs in order to apply DiffPool.
        if name == 'REDDIT-BINARY':
            num_nodes = min(int(num_nodes / len(dataset) * 1.5), max_num_nodes)
        else:
            num_nodes = min(int(num_nodes / len(dataset) * 5), max_num_nodes)

        indices = []

        for i, data in enumerate(dataset):
            if data.num_nodes <= num_nodes:
                indices.append(i)
        dataset = dataset[torch.tensor(indices)]
        dataset.data.y = dataset.data.y[torch.tensor(indices)]
        '''
        num_nodes = max_num_nodes





        if dataset.transform is None:

            dataset.transform = T.ToDense(num_nodes)
        else:
            dataset.transform = T.Compose(
                [dataset.transform, T.ToDense(num_nodes)])


    return dataset
