{
  "cells": [
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "OkbiqXqxO791"
      },
      "source": [
        "# Install Dependencies"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "4YeqnX9-8Rb4"
      },
      "outputs": [],
      "source": [
        "# Install required packages.\n",
        "import os\n",
        "import torch\n",
        "\n",
        "os.environ[\"TORCH\"] = torch.__version__\n",
        "print(torch.__version__)\n",
        "\n",
        "!pip install -q torch-scatter -f https://data.pyg.org/whl/torch-${TORCH}.html\n",
        "!pip install -q torch-sparse -f https://data.pyg.org/whl/torch-${TORCH}.html\n",
        "!pip install -q git+https://github.com/pyg-team/pytorch_geometric.git\n",
        "\n",
        "!pip install -q infomap\n",
        "\n",
        "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
        "print(\"\\n\", device)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "as4YAkAPxkpW"
      },
      "source": [
        "# Models"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "LrOKP8jlxbDF"
      },
      "outputs": [],
      "source": [
        "def _infomap():\n",
        "    from infomap import Infomap\n",
        "    from torch_geometric.utils import to_networkx\n",
        "    import networkx as nx\n",
        "\n",
        "    im = Infomap(silent=True, num_trials=100, two_level=True)\n",
        "    G = to_networkx(data)\n",
        "    im.add_networkx_graph(G)\n",
        "    im.run()\n",
        "\n",
        "    codelength = im.codelength\n",
        "    print(\"\\n Codelength: \", codelength)\n",
        "\n",
        "    labels_pred = list(dict(im.modules).values())\n",
        "    labels_true = torch.flatten(data.y).cpu().detach().numpy()\n",
        "\n",
        "    print(labels_pred)\n",
        "    print(labels_true)\n",
        "\n",
        "    from sklearn.metrics.cluster import normalized_mutual_info_score\n",
        "\n",
        "    NMI = normalized_mutual_info_score(labels_pred=labels_pred, labels_true=labels_true)\n",
        "    print(\"\\n NMI:\", NMI)\n",
        "\n",
        "    communities = {}\n",
        "    for node, community in enumerate(labels_pred):\n",
        "        if communities.get(community) == None:\n",
        "            communities[community] = set([node])\n",
        "        else:\n",
        "            communities[community].add(node)\n",
        "    communities = [v for k, v in communities.items()]\n",
        "\n",
        "    modularity = nx.community.modularity(G, communities)\n",
        "    print(\"\\n Modularity: \", modularity)\n",
        "\n",
        "    results = pd.read_csv(\"/content/drive/MyDrive/\" + dataset.name + \".csv\")\n",
        "    results.loc[len(results.index)] = [\n",
        "        dataset.name,\n",
        "        \"N/A\",\n",
        "        False,\n",
        "        False,\n",
        "        f\"{NMI:.1f}\",\n",
        "        \"N/A\",\n",
        "        f\"{modularity:.1f}\",\n",
        "        \"N/A\",\n",
        "        f\"{codelength:.1f}\",\n",
        "        \"N/A\",\n",
        "        False,\n",
        "    ]\n",
        "    results.to_csv(\"/content/drive/MyDrive/\" + dataset.name + \".csv\", index=False)\n",
        "\n",
        "    print(\"\\n\", results)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "_N0FuTxWot9K"
      },
      "outputs": [],
      "source": [
        "def neuromap(dataset, data, device, learning_rate=0.001, epochs=10000, patience=100):\n",
        "    def map_equation(S, A):\n",
        "        E = S.T @ A.matmul(S)\n",
        "\n",
        "        e1 = torch.sum(E) - torch.trace(E)\n",
        "        e2 = torch.sum(E - torch.diag(E) * torch.eye(len(E)).to(device), 1)\n",
        "        e3 = A.matmul(torch.ones(A.size(dim=1), 1).to(device))\n",
        "        e4 = torch.sum(E, 1)\n",
        "\n",
        "        e = e3.T.matmul(torch.ones(A.size(dim=1), 1).to(device))[0][0]\n",
        "\n",
        "        e1 /= e\n",
        "        e2 /= e\n",
        "        e3 /= e\n",
        "        e4 /= e\n",
        "\n",
        "        e4 += e2\n",
        "\n",
        "        e1 = torch.sum(e1 * torch.nan_to_num(torch.log2(e1), nan=0.0))\n",
        "        e2 = torch.sum(e2 * torch.nan_to_num(torch.log2(e2), nan=0.0))\n",
        "        e3 = torch.sum(e3 * torch.nan_to_num(torch.log2(e3), nan=0.0))\n",
        "        e4 = torch.sum(e4 * torch.nan_to_num(torch.log2(e4), nan=0.0))\n",
        "\n",
        "        return e1 - 2 * e2 - e3 + e4\n",
        "\n",
        "    import torch\n",
        "    from torch.nn import Linear, ReLU, SELU\n",
        "    import torch.nn.functional as F\n",
        "\n",
        "    class GNN(torch.nn.Module):\n",
        "        def __init__(self, data):\n",
        "            super().__init__()\n",
        "            # torch.manual_seed(12345)\n",
        "            self.encoder = Linear(data.num_node_features, 512)\n",
        "            self.decoder = Linear(512, 16)\n",
        "            self.skip_encoder = Linear(data.num_node_features, 512)\n",
        "            self.skip_decoder = Linear(512, 16)\n",
        "            # self.activation = ReLU()\n",
        "            self.activation = SELU()\n",
        "            self.A = data.adj_t\n",
        "\n",
        "        def forward(self, x):\n",
        "            x = self.encoder(self.A.matmul(x)) + self.skip_encoder(x)\n",
        "            x = self.activation(x)\n",
        "            x = self.decoder(self.A.matmul(x)) + self.skip_decoder(x)\n",
        "            x = F.dropout(x, p=0.5, training=self.training)\n",
        "            x = F.softmax(x, dim=1)\n",
        "            return x\n",
        "\n",
        "    from torch_geometric.transforms import Compose, GCNNorm, ToSparseTensor\n",
        "\n",
        "    data = data.to(device)\n",
        "\n",
        "    # transform = Compose([GCNNorm(add_self_loops=False), ToSparseTensor()])\n",
        "    # _data = transform(data)\n",
        "    # model = GNN(_data).to(device)\n",
        "    # print(\"\\n\", model)\n",
        "\n",
        "    transform = Compose([ToSparseTensor()])\n",
        "    data = transform(data)\n",
        "\n",
        "    model = GNN(data).to(device)\n",
        "    print(\"\\n\", model)\n",
        "\n",
        "    optimizer = torch.optim.Adam(\n",
        "        model.parameters(), lr=learning_rate  # , weight_decay=5e-4\n",
        "    )  # Define optimizer.\n",
        "\n",
        "    def train():\n",
        "        model.train()\n",
        "        optimizer.zero_grad()  # Clear gradients.\n",
        "        out = model(data.x) + 1e-8  # Perform a single forward pass.\n",
        "        loss = map_equation(out, data.adj_t)\n",
        "        loss.backward()  # Derive gradients.\n",
        "        optimizer.step()  # Update parameters based on gradients.\n",
        "        return loss\n",
        "\n",
        "    from tqdm import tqdm\n",
        "\n",
        "    print()\n",
        "    counter = 0\n",
        "    count_epochs = 0\n",
        "    best = float(\"inf\")\n",
        "    for epoch in (pbar := tqdm(range(1, epochs + 1))):\n",
        "        loss = train()\n",
        "        count_epochs += 1\n",
        "        if loss < best:\n",
        "            best = loss\n",
        "            counter = 0\n",
        "        else:\n",
        "            counter += 1\n",
        "        if counter > patience:\n",
        "            break\n",
        "        # print(f\"Epoch: {epoch:03d}, Loss: {loss:.4f}\")\n",
        "        pbar.set_description(f\"Epoch: {epoch:03d}, Loss: {loss:.4f}\")\n",
        "\n",
        "    print(\"\\n\", \"Stopped early at epoch: \", count_epochs)\n",
        "\n",
        "    model.eval()\n",
        "    out = model(data.x)\n",
        "\n",
        "    from sklearn.metrics.cluster import normalized_mutual_info_score\n",
        "    from sklearn.metrics import f1_score\n",
        "\n",
        "    labels_pred = torch.argmax(out, dim=1).cpu().detach().numpy()\n",
        "    labels_true = torch.flatten(data.y).detach().cpu().numpy()\n",
        "\n",
        "    print()\n",
        "    print(labels_pred)\n",
        "    print(labels_true)\n",
        "\n",
        "    NMI = normalized_mutual_info_score(labels_pred=labels_pred, labels_true=labels_true)\n",
        "    # F1 = f1_score(y_pred=labels_pred, y_true=labels_true)\n",
        "\n",
        "    print(\"\\n\", NMI)\n",
        "\n",
        "    from torch_geometric.utils import to_networkx\n",
        "    import networkx as nx\n",
        "\n",
        "    G = to_networkx(data)\n",
        "\n",
        "    communities = {}\n",
        "    for node, community in enumerate(labels_pred):\n",
        "        if communities.get(community) == None:\n",
        "            communities[community] = set([node])\n",
        "        else:\n",
        "            communities[community].add(node)\n",
        "    communities = [v for k, v in communities.items()]\n",
        "\n",
        "    modularity = nx.community.modularity(G, communities)\n",
        "    print(\"\\n\", modularity)\n",
        "\n",
        "    result = (NMI, modularity, loss.cpu().detach().numpy())\n",
        "\n",
        "    del data\n",
        "    del model\n",
        "    import gc\n",
        "\n",
        "    gc.collect()\n",
        "    with torch.no_grad():\n",
        "        torch.cuda.empty_cache()\n",
        "\n",
        "    return result"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "NzLf5edL66Zb"
      },
      "outputs": [],
      "source": [
        "from statistics import mean, stdev\n",
        "\n",
        "\n",
        "def find_neuromap(with_features=True, with_LE=False):\n",
        "    searches = 20\n",
        "    lowest_codelength = float(\"inf\")\n",
        "    best_learning_rate = 0.001\n",
        "    best_result = 0\n",
        "    from google.colab import drive\n",
        "\n",
        "    drive.mount(\"/content/drive\")\n",
        "    for search in range(searches):\n",
        "        learning_rate = 0.1 * 0.5**search\n",
        "        runs = 10\n",
        "        NMIs = []\n",
        "        modularities = []\n",
        "        codelengths = []\n",
        "        low_codelength = float(\"inf\")\n",
        "        candidate_result = 0\n",
        "        for run in range(runs):\n",
        "            print(\"\\n\", \"learning_rate: \", learning_rate)\n",
        "            result = neuromap(dataset, data, device, learning_rate)\n",
        "            NMI, modularity, codelength = result\n",
        "            NMIs.append(float(100.0 * NMI))\n",
        "            modularities.append(float(100.0 * modularity))\n",
        "            codelengths.append(float(codelength))\n",
        "            if codelength < low_codelength:\n",
        "                low_codelength = codelength\n",
        "                candidate_result = result\n",
        "\n",
        "        mean_codelength = mean(codelengths)\n",
        "        if mean_codelength < lowest_codelength:\n",
        "            lowest_codelength = mean_codelength\n",
        "            best_result = candidate_result\n",
        "            best_learning_rate = search\n",
        "\n",
        "        results = pd.read_csv(\"/content/drive/MyDrive/\" + dataset.name + \".csv\")\n",
        "        NMI, modularity, codelength = candidate_result\n",
        "        results.loc[len(results.index)] = [\n",
        "            dataset.name,\n",
        "            str(learning_rate),\n",
        "            with_features,\n",
        "            with_LE,\n",
        "            f\"{100*NMI:.1f}\",\n",
        "            f\"{mean(NMIs):.1f} \\u00B1 {stdev(NMIs):.1f}\",\n",
        "            f\"{100*modularity:.1f}\",\n",
        "            f\"{mean(modularities):.1f} \\u00B1 {stdev(modularities):.1f}\",\n",
        "            f\"{codelength:.1f}\",\n",
        "            f\"{mean(codelengths):.1f} \\u00B1 {stdev(codelengths):.1f}\",\n",
        "            False,\n",
        "        ]\n",
        "        results.to_csv(\"/content/drive/MyDrive/\" + dataset.name + \".csv\", index=False)\n",
        "\n",
        "        print(\"\\n\", results)\n",
        "\n",
        "    results = pd.read_csv(\"/content/drive/MyDrive/\" + dataset.name + \".csv\")\n",
        "    results.loc[len(results.index) + best_learning_rate - searches, \"Best?\"] = True\n",
        "    results.to_csv(\"/content/drive/MyDrive/\" + dataset.name + \".csv\", index=False)\n",
        "\n",
        "    print(\"\\n\", results)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "y8Y57nYkuj1h"
      },
      "outputs": [],
      "source": [
        "import pandas as pd\n",
        "\n",
        "\n",
        "def reset_results():\n",
        "    pd.set_option(\"display.width\", 200)\n",
        "\n",
        "    results = pd.DataFrame(\n",
        "        columns=[\n",
        "            \"Dataset\",\n",
        "            \"Learning Rate\",\n",
        "            \"With Features?\",\n",
        "            \"With LaplacianEigenvectorPE?\",\n",
        "            \"Optimised NMI\",\n",
        "            \"Average NMI\",\n",
        "            \"Optimised Modularity\",\n",
        "            \"Average Modularity\",\n",
        "            \"Lowest Codelength\",\n",
        "            \"Average Codelength\",\n",
        "            \"Best?\",\n",
        "        ]\n",
        "    )\n",
        "\n",
        "    from google.colab import drive\n",
        "\n",
        "    drive.mount(\"/content/drive\")\n",
        "    results.to_csv(\"/content/drive/MyDrive/\" + dataset.name + \".csv\", index=False)\n",
        "\n",
        "    print(results)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "9f-i6WrIrARQ"
      },
      "source": [
        "# Benchmark Real Networks"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "MhDIt0y_qwr2"
      },
      "source": [
        "## Cora"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "QsBwTDL8oXD_"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"Cora\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "edKMTmh2ggV1"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "j5zz-9vgOYib"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "KlbxBrCc9Kj4"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "Wm4KOZCGxMr9"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"Cora\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# transform = Compose(\n",
        "#     [\n",
        "#         # SVDFeatureReduction(dataset.num_classes),\n",
        "#         # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "#         ToSparseTensor(),\n",
        "#     ]\n",
        "# )\n",
        "# data = transform(data)\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "PiEzDC7knnHz"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "jkam9sq1xNKT"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"Cora\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# Remove node features\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "dKfyPdvGnxr4"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "8_XDUT3pHXQq"
      },
      "source": [
        "## CiteSeer"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "d84T6ZFjj_KG"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"CiteSeer\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "HVXYASpSgjHZ"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "4qFaQ2paQUK_"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "uuA_P9RFTAQX"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "cm7RitKjz7O7"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"CiteSeer\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# transform = Compose(\n",
        "#     [\n",
        "#         # SVDFeatureReduction(dataset.num_classes),\n",
        "#         # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "#         ToSparseTensor(),\n",
        "#     ]\n",
        "# )\n",
        "# data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "zO2795fBTCKO"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "lIk5MPJEz7X-"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"CiteSeer\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "pcnWpMEsTHL6"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "RMKxUvxVHT07"
      },
      "source": [
        "## PudMed"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "6BBp942jkcra"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"PubMed\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "ymUUnHXcgkU8"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "TU-xtvUcQV9T"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "gJlcBZ_OTPfM"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "-3lc-2Dr0TWy"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"PubMed\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "LToSLn2LTTgj"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "XvG8Mds40Tih"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Planetoid\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Planetoid(root=\"data/Planetoid\", name=\"PubMed\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "print(f\"Number of training nodes: {data.train_mask.sum()}\")\n",
        "print(f\"Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}\")\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ozoYAslxTYD_"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "VT1_lsuEHPYB"
      },
      "source": [
        "## Amazon Computers"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "OrnQs72hi5vF"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Amazon\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Amazon(root=\"data/Amazon\", name=\"Computers\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "GfZ4ag4kgpWZ"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "kn3Kh3mbQW1z"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ktCGw1G_KitL"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "beh2HrnI0fKf"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Amazon\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Amazon(root=\"data/Amazon\", name=\"Computers\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# transform = Compose(\n",
        "#     [\n",
        "#         # SVDFeatureReduction(dataset.num_classes),\n",
        "#         # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "#         ToSparseTensor(),\n",
        "#     ]\n",
        "# )\n",
        "# data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ED1lonPhKmBS"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "Hx1BT-bF0fQo"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Amazon\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Amazon(root=\"data/Amazon\", name=\"Computers\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "htc04uT4KrYQ"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "baOOASCvHKs5"
      },
      "source": [
        "## Amazon Photo"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "TrseOZvakxJt"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Amazon\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Amazon(root=\"data/Amazon\", name=\"Photo\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "BmFdYXnGgq_u"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "4vOJ3Zb3QXpa"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "ZyfNWCm3TgXt"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "Tu9CBc_c0w2h"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Amazon\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Amazon(root=\"data/Amazon\", name=\"Photo\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# transform = Compose(\n",
        "#     [\n",
        "#         # SVDFeatureReduction(dataset.num_classes),\n",
        "#         # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "#         ToSparseTensor(),\n",
        "#     ]\n",
        "# )\n",
        "# data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "aWZhpnCZTmIB"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "0ugJKdpD0w_6"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Amazon\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Amazon(root=\"data/Amazon\", name=\"Photo\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "jSgNduRrTp7t"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "4h0qj9SUHGDC"
      },
      "source": [
        "## Coauthor CS"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "8_py72hejlgl"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Coauthor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Coauthor(root=\"data/Coauthor\", name=\"CS\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "sSTzGllQgsHK"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "KQR-K7IoQYS1"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "-GfH0CdPTtB7"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "XYTW3Ztj0_Hu"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Coauthor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Coauthor(root=\"data/Coauthor\", name=\"CS\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# transform = Compose(\n",
        "#     [\n",
        "#         # SVDFeatureReduction(dataset.num_classes),\n",
        "#         # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "#         ToSparseTensor(),\n",
        "#     ]\n",
        "# )\n",
        "# data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "0DR_c9sdTv33"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "NDzC6mDr0_Sd"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Coauthor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Coauthor(root=\"data/Coauthor\", name=\"CS\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "rwIPExi4TzpR"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "mw1F1mOvG51W"
      },
      "source": [
        "## Coauthor Physics"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "-Fr45UyXkmZI"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Coauthor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Coauthor(root=\"data/Coauthor\", name=\"Physics\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "mwlgcSa0gs1e"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "PDqFPNX7QaRw"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "XJfJk6-MT4Y3"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "wpqZm8ho1MZB"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Coauthor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Coauthor(root=\"data/Coauthor\", name=\"Physics\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# transform = Compose(\n",
        "#     [\n",
        "#         # SVDFeatureReduction(dataset.num_classes),\n",
        "#         # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "#         ToSparseTensor(),\n",
        "#     ]\n",
        "# )\n",
        "# data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "FsFjiFmsUPWe"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "OclO9A2d1Me9"
      },
      "outputs": [],
      "source": [
        "from torch_geometric.datasets import Coauthor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "dataset = Coauthor(root=\"data/Coauthor\", name=\"Physics\", transform=ToUndirected())\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # SVDFeatureReduction(dataset.num_classes),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "bdXYFWriURcO"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {
        "id": "INxpj-B6GDNE"
      },
      "source": [
        "## `ogbn-arxiv`"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "nsqNVPFLlkkd"
      },
      "outputs": [],
      "source": [
        "!pip install ogb\n",
        "\n",
        "from ogb.nodeproppred import PygNodePropPredDataset, Evaluator\n",
        "from torch_geometric.transforms import ToSparseTensor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    NormalizeFeatures,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "# dataset = PygNodePropPredDataset(name='ogbn-arxiv', transform=ToSparseTensor())\n",
        "dataset = PygNodePropPredDataset(\n",
        "    root=\"data/ogbn-arxiv\", name=\"ogbn-arxiv\", transform=ToUndirected()\n",
        ")\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# Don't use node features\n",
        "# del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # NormalizeFeatures(),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "# print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "reset_results()"
      ],
      "metadata": {
        "id": "tQ5VnwM4gtfM"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "D2LLpuV4Vxjf"
      },
      "outputs": [],
      "source": [
        "_infomap()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "M3YaF2SIUVb6"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, True)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "fd_1x-wsV4jp"
      },
      "outputs": [],
      "source": [
        "!pip install ogb\n",
        "\n",
        "from ogb.nodeproppred import PygNodePropPredDataset, Evaluator\n",
        "from torch_geometric.transforms import ToSparseTensor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    NormalizeFeatures,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "# dataset = PygNodePropPredDataset(name='ogbn-arxiv', transform=ToSparseTensor())\n",
        "dataset = PygNodePropPredDataset(\n",
        "    root=\"data/ogbn-arxiv\", name=\"ogbn-arxiv\", transform=ToUndirected()\n",
        ")\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# Don't use node features\n",
        "# del data.x\n",
        "\n",
        "# transform = Compose(\n",
        "#     [\n",
        "#         # NormalizeFeatures(),\n",
        "#         # AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "#         ToSparseTensor(),\n",
        "#     ]\n",
        "# )\n",
        "# data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "# print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "JfOjD26nUZmm"
      },
      "outputs": [],
      "source": [
        "find_neuromap(True, False)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "mNCXc1_zV4_T"
      },
      "outputs": [],
      "source": [
        "!pip install ogb\n",
        "\n",
        "from ogb.nodeproppred import PygNodePropPredDataset, Evaluator\n",
        "from torch_geometric.transforms import ToSparseTensor\n",
        "from torch_geometric.transforms import (\n",
        "    Compose,\n",
        "    ToUndirected,\n",
        "    AddLaplacianEigenvectorPE,\n",
        "    NormalizeFeatures,\n",
        "    SVDFeatureReduction,\n",
        "    ToSparseTensor,\n",
        ")\n",
        "\n",
        "# dataset = PygNodePropPredDataset(name='ogbn-arxiv', transform=ToSparseTensor())\n",
        "dataset = PygNodePropPredDataset(\n",
        "    root=\"data/ogbn-arxiv\", name=\"ogbn-arxiv\", transform=ToUndirected()\n",
        ")\n",
        "\n",
        "print()\n",
        "print(f\"Dataset: {dataset}:\")\n",
        "print(\"======================\")\n",
        "print(f\"Number of graphs: {len(dataset)}\")\n",
        "print(f\"Number of features: {dataset.num_features}\")\n",
        "print(f\"Number of classes: {dataset.num_classes}\")\n",
        "\n",
        "data = dataset[0]  # Get the first graph object.\n",
        "\n",
        "# Don't use node features\n",
        "del data.x\n",
        "\n",
        "transform = Compose(\n",
        "    [\n",
        "        # NormalizeFeatures(),\n",
        "        AddLaplacianEigenvectorPE(16, attr_name=None),\n",
        "        # ToSparseTensor(),\n",
        "    ]\n",
        ")\n",
        "data = transform(data)\n",
        "\n",
        "\n",
        "print()\n",
        "print(data)\n",
        "print(\n",
        "    \"===========================================================================================================\"\n",
        ")\n",
        "\n",
        "# Gather some statistics about the graph.\n",
        "# print(f\"Number of nodes: {data.num_nodes}\")\n",
        "print(f\"Number of edges: {data.num_edges}\")\n",
        "print(f\"Average node degree: {data.num_edges / data.num_nodes:.1f}\")\n",
        "# print(f'Number of training nodes: {data.train_mask.sum()}')\n",
        "# print(f'Training node label rate: {int(data.train_mask.sum()) / data.num_nodes:.1f}')\n",
        "print(f\"Has isolated nodes: {data.has_isolated_nodes()}\")\n",
        "print(f\"Has self-loops: {data.has_self_loops()}\")\n",
        "print(f\"Is undirected: {data.is_undirected()}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "bbLumejgUbT9"
      },
      "outputs": [],
      "source": [
        "find_neuromap(False, True)"
      ]
    }
  ],
  "metadata": {
    "accelerator": "GPU",
    "colab": {
      "provenance": [],
      "gpuType": "V100"
    },
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}