{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b5923940",
   "metadata": {},
   "outputs": [],
   "source": [
    "include(\"decomposition.jl\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6a5c949a",
   "metadata": {},
   "outputs": [],
   "source": [
    "using LightGraphs\n",
    "using TickTock\n",
    "using SparseArrays\n",
    "using ProgressMeter"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e1a93bb5",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "nam = \"MUTAG\"\n",
    "node_types = 7 #66 for \"SW-620H\", 46 for \"PC-3H\", 7 for \"MUTAG\"\n",
    "\n",
    "name = \"data/\" * nam\n",
    "term = 188 # Graph numbers\n",
    "\n",
    "ad_file = name * \"_A.txt\"\n",
    "graph_ind_file = name * \"_graph_indicator.txt\"\n",
    "graph_label_file = name * \"_graph_labels.txt\"\n",
    "node_label_file = name * \"_node_labels.txt\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6ba6028b",
   "metadata": {},
   "outputs": [],
   "source": [
    "alpha = 1e7\n",
    "lowest_nodes = 10\n",
    "highest_nodes = 28\n",
    "sparsednodes = []\n",
    "sparsedfeatures = []\n",
    "before = Int[]\n",
    "after = Int[]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f00e8bbd",
   "metadata": {},
   "outputs": [],
   "source": [
    "graph_ind_mat = open(graph_ind_file) do file\n",
    "    [parse(Int, line) for line in eachline(file)]\n",
    "end\n",
    "\n",
    "graph_label_mat = open(graph_label_file) do file\n",
    "    [parse(Int, line) for line in eachline(file)]\n",
    "end\n",
    "\n",
    "node_label_mat = open(node_label_file) do file\n",
    "    [parse(Int, line) for line in eachline(file)]\n",
    "end\n",
    "\n",
    "ad_mat = []\n",
    "open(ad_file) do file\n",
    "    for line in eachline(file)\n",
    "        temp = parse.(Int, split(line, ','))\n",
    "        push!(ad_mat, temp)\n",
    "    end\n",
    "end"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "6d420f2b",
   "metadata": {},
   "outputs": [],
   "source": [
    "function onehot(vec, number)\n",
    "    mat = Matrix{Int}(undef, length(vec), number)\n",
    "    for i in eachindex(vec)\n",
    "        hotvec = zeros(Int, number)\n",
    "        hotvec[vec[i]+1] = 1\n",
    "        mat[i, :] = hotvec\n",
    "    end\n",
    "    return mat\n",
    "end"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "39a3e838",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "@showprogress for graph_number in 1:term #length(graph_label_mat)\n",
    "\n",
    "    nodenumbers = findall(x -> x == graph_number, graph_ind_mat)\n",
    "    edgenumbers = Int[]\n",
    "    node2numbers = Int[]\n",
    "    node1numbers = Int[]\n",
    "    for (ind, row) in enumerate(ad_mat)\n",
    "        node1, node2 = row\n",
    "        if node1 in nodenumbers && node2 in nodenumbers\n",
    "            push!(edgenumbers, ind)\n",
    "            push!(node1numbers, node2)\n",
    "            push!(node2numbers, node1)\n",
    "        end\n",
    "    end\n",
    "    node_feature = [node_label_mat[node] for node in nodenumbers]\n",
    "    push!(before, length(node_feature))\n",
    "    node_feature_oh = onehot(node_feature, node_types)'\n",
    "    buffer = minimum(nodenumbers) - 1\n",
    "    node1numbers .- buffer\n",
    "\n",
    "    rr = copy(node1numbers .- buffer)\n",
    "    cc = copy(node2numbers .- buffer)\n",
    "    vv = ones(Float64, length(rr))\n",
    "    W = copy(vv)\n",
    "    mg = length(rr)\n",
    "    R = append!(copy(rr), copy(cc))\n",
    "    C = append!(copy(cc), copy(rr))\n",
    "    V = append!(copy(vv), copy(vv))\n",
    "    A = sparse(R, C, V)\n",
    "    NF = copy(node_feature_oh)\n",
    "\n",
    "    for target_node in lowest_nodes:maximum(nodenumbers)+1\n",
    "        A_new= decomposition(A, L, NF, alpha)\n",
    "        i, j, v = findnz(A_new)\n",
    "        push!(after, length(i)/2)\n",
    "\n",
    "        newnode2numbers = j .+ buffer\n",
    "        newnodes = [j.-1, i.-1]\n",
    "        # new_node_feature = [node_label_mat[node] for node in unique(newnode2numbers)]\n",
    "    \n",
    "        push!(sparsednodes, newnodes)\n",
    "        # push!(sparsedfeatures, new_node_feature)\n",
    "        open(\"output/\"*string(target_node)*\"_mutag_coarsened.txt\", \"a\") do f\n",
    "            writedlm(f, newnodes, \",\")\n",
    "        end\n",
    "    end\n",
    "    for target_node in maximum(nodenumbers)+1:highest_nodes\n",
    "        open(\"output/\"*string(target_node)*\"_mutag_coarsened.txt\", \"a\") do f\n",
    "            writedlm(f, [], \",\")\n",
    "        end\n",
    "    end\n",
    "end"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "cf2044a7",
   "metadata": {},
   "outputs": [],
   "source": [
    "# sparsedfeatures"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "76e64342",
   "metadata": {},
   "outputs": [],
   "source": [
    "# mean(after./before)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b7c9ec66",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
