#include <bits/stdc++.h>


#include <algorithm>
#include <bit>
#include <cmath>
#include <cstdint>
#include <execution>
#include <iterator>
#include <random>
#include <tuple>
#include <utility>
#include <vector>

#include <cassert>
#include <iostream>
#include <set>

#include "serialization.cpp"

using namespace std;
using ll = long long;

int main(int argc, char* argv[]) {
  if (argc < 2) {
    cerr << "Usage: " << argv[0] << " <filename>" << endl;
    return 1;
  }

  string filename = argv[1];

  if (!filename.ends_with(".in")) {
    cerr << "Input file must be a .in file" << endl;
    return 1;
  }

  ifstream ifs(filename, ios::binary);

  cout << "reading graph " << filename << "..." << endl;

  int n, m;
  ifs >> n >> m;

  vector<pair<ll, ll>> edges(m);
  ll highest_id = -1;
  for (auto& [u, v] : edges) {
    ifs >> u >> v;
    highest_id = max({highest_id, u, v});
  }

  if (highest_id >= n) {
    cerr << "Max ID exceeds number of nodes, coordinate compressing..." << endl;

    vector<ll> ids(2*m);
    auto rng = views::iota(0, m);
    for_each(execution::par_unseq, rng.begin(), rng.end(), [&edges, &ids](auto i) {
        ids[2*i+0] = edges[i].first;
        ids[2*i+1] = edges[i].second;
    });

    cerr << "Flattened edges, now sorting..." << endl;

    sort(execution::par_unseq, ids.begin(), ids.end());
    auto last = unique(ids.begin(), ids.end());

    assert(last - ids.begin() <= n);

    cerr << "Found " << last - ids.begin() << " unique node IDs in edge list" << endl;

    for_each(execution::par_unseq, edges.begin(), edges.end(), [&ids, &last](auto& e) {
        auto& [u, v] = e;
        u = lower_bound(ids.begin(), last, u) - ids.begin();
        v = lower_bound(ids.begin(), last, v) - ids.begin();
    });

    cerr << "Finished compressing!" << endl;
  }

  vector<vector<int>> G(n);

  for (auto& [u, v] : edges) {
    assert(0 <= u && u < n && 0 <= v && v < n);
    G[u].push_back(v);
    G[v].push_back(u);
  }

  cout << "finished reading graph, deduplicating edges..." << endl;

  for_each(std::execution::par_unseq, G.begin(), G.end(), [](auto& x) {
    sort(x.begin(), x.end());
    x.erase(unique(x.begin(), x.end()), x.end());
  });

  cout << "finished deduplication, counting degrees..." << endl;
  ll tot_edges = transform_reduce(std::execution::par_unseq, G.begin(), G.end(),
                                  0ll, std::plus<ll>(),
                                  [](const auto& x) { return x.size(); });
  tot_edges /= 2;
  m = tot_edges;

  string out_filename = filename.substr(0, filename.size() - 3) + ".bin";
  cout << "serializing to " << out_filename << "..." << endl;
  serialize(G, out_filename);
  cout << "done!" << endl;

  return 0;
}