#include "bench_harness.h"
#include "bench_utils.h"
#include <limits.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/**
 * Sums tree distances over a fixed, deterministic set of vertex pairs.
 *
 * The n - 1 undirected edges (eu[i], ev[i]) are expected to form a tree on the
 * vertices 0..n-1. The tree is rooted at vertex 0 with a breadth-first
 * traversal, a binary-lifting ancestor table is built, and for every u in
 * [0, n) the distance between u and (7 * u + 13) % n is obtained through
 * their lowest common ancestor. The sum of those n distances is written to
 * *ans_out.
 *
 * @param n        number of vertices
 * @param eu       first endpoint of each edge, n - 1 entries (not read when n <= 1)
 * @param ev       second endpoint of each edge, n - 1 entries (not read when n <= 1)
 * @param ans_out  receives the distance sum. Receives 0.0 when n is not
 *                 positive, when n is too large for int edge indices, when an
 *                 allocation fails, when an endpoint lies outside [0, n), or
 *                 when the edges do not connect all n vertices.
 */
void kernel_run(int n, const int *eu, const int *ev, double *ans_out) {
  *ans_out = 0.0;

  /* Edge slots are indexed with int, so 2 * (n - 1) has to stay representable. */
  if (n <= 0 || n > INT_MAX / 2)
    return;

  const size_t nv = (size_t)n;
  const size_t edge_slots = 2 * (nv - 1);

  /*
   * Depths never exceed n - 1, so the smallest level count with
   * 2^levels >= n lets the lifting loops express every possible jump.
   * A fixed level count would silently give wrong answers on deeper trees.
   */
  int levels = 1;
  while (((size_t)1 << levels) < nv)
    levels++;

  /* The ancestor table is the largest allocation; if its byte size fits in
   * size_t, so do all the others. */
  if (nv > SIZE_MAX / sizeof(int) / (size_t)levels)
    return;

  /* Request at least one element so the single-vertex case does not depend on
   * what malloc(0) returns. */
  const size_t slot_alloc = edge_slots ? edge_slots : 1;

  int *head = malloc(nv * sizeof *head);
  int *to = malloc(slot_alloc * sizeof *to);
  int *nxt = malloc(slot_alloc * sizeof *nxt);
  int *depth = malloc(nv * sizeof *depth);
  int *q = malloc(nv * sizeof *q);
  /* up[k * n + v] is the 2^k-th ancestor of v, saturating at the root. */
  int *up = malloc((size_t)levels * nv * sizeof *up);
  if (!head || !to || !nxt || !depth || !q || !up)
    goto cleanup;

  for (int v = 0; v < n; v++) {
    head[v] = -1;
    depth[v] = -1; /* -1 marks "not reached yet" for the traversal below */
  }

  /* Linked adjacency lists: every undirected edge occupies two slots. */
  int slot = 0;
  for (int i = 0; i < n - 1; i++) {
    const int a = eu[i];
    const int b = ev[i];
    if (a < 0 || a >= n || b < 0 || b >= n)
      goto cleanup;
    to[slot] = b;
    nxt[slot] = head[a];
    head[a] = slot++;
    to[slot] = a;
    nxt[slot] = head[b];
    head[b] = slot++;
  }

  /*
   * Breadth-first traversal from vertex 0. The root is recorded as its own
   * parent so that lifting past it stays at the root. Each vertex is enqueued
   * at most once, which keeps the queue within its n entries even if the
   * input contains a cycle.
   */
  depth[0] = 0;
  up[0] = 0;
  int q_head = 0;
  int q_tail = 0;
  q[q_tail++] = 0;
  while (q_head < q_tail) {
    const int v = q[q_head++];
    for (int e = head[v]; e != -1; e = nxt[e]) {
      const int w = to[e];
      if (depth[w] != -1)
        continue;
      depth[w] = depth[v] + 1;
      up[w] = v;
      q[q_tail++] = w;
    }
  }
  /* n - 1 edges that do not reach every vertex cannot form a tree. */
  if (q_tail != n)
    goto cleanup;

  /* Level k is level k - 1 applied twice. */
  for (int k = 1; k < levels; k++) {
    const int *prev = up + (size_t)(k - 1) * nv;
    int *cur = up + (size_t)k * nv;
    for (int v = 0; v < n; v++)
      cur[v] = prev[prev[v]];
  }

  long long total = 0;
  for (int u = 0; u < n; u++) {
    /* Partner vertex; computed in 64 bits so 7 * u cannot overflow int. */
    const int v = (int)(((long long)u * 7 + 13) % n);

    int deep = u;
    int shallow = v;
    if (depth[deep] < depth[shallow]) {
      const int tmp = deep;
      deep = shallow;
      shallow = tmp;
    }

    /* Bring the deeper vertex up to the depth of the shallower one. */
    const int diff = depth[deep] - depth[shallow];
    for (int b = 0; b < levels; b++) {
      if ((diff >> b) & 1)
        deep = up[(size_t)b * nv + (size_t)deep];
    }

    int lca = deep;
    if (deep != shallow) {
      /* Take the largest jumps that keep the two vertices distinct; they end
       * up as two different children of the common ancestor. */
      for (int b = levels - 1; b >= 0; b--) {
        const int *row = up + (size_t)b * nv;
        const int pd = row[deep];
        const int ps = row[shallow];
        if (pd != ps) {
          deep = pd;
          shallow = ps;
        }
      }
      lca = up[deep];
    }

    total += (long long)(depth[u] + depth[v] - 2 * depth[lca]);
  }
  *ans_out = (double)total;

cleanup:
  free(head);
  free(to);
  free(nxt);
  free(depth);
  free(q);
  free(up);
}
/*
 * Benchmark entry point, produced by the BENCH_MAIN_SCALAR3 macro. The macro
 * is not defined in this file (presumably it comes from bench_harness.h --
 * confirm), so the role of each argument below is inferred from its contents
 * and should be checked against the macro definition:
 *   - T003_Code_022, LCA: identifiers handed to the harness (presumably the
 *     benchmark id and a short label).
 *   - 4096, 16384, 65536: presumably the three values of n to run -- TODO confirm.
 *   - declarations: two (n - 1)-entry int arrays for the edge endpoints and a
 *     double that receives the kernel result.
 *   - init block: fills the edge arrays from a seeded generator.
 *   - kernel call, result expression, and cleanup statements.
 * `n` and `seed` are not declared in this file; they are expected to be
 * provided by the macro expansion.
 * NOTE(review): the malloc results are not checked here before the init block
 * writes through them -- verify whether the macro guards against NULL.
 */
BENCH_MAIN_SCALAR3(
    T003_Code_022, LCA, 4096, 16384, 65536,
    int *eu = (int *)malloc((size_t)(n - 1) * sizeof(int));
    int *ev = (int *)malloc((size_t)(n - 1) * sizeof(int));
    double ans_scalar = 0.0;
    ,
    {
      /* Build a random tree: vertex i (i >= 1) is joined to a vertex p drawn
       * from [0, i), so every edge links i to a lower-numbered vertex. */
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 1; i < n; i++) {
        int p = (int)(bench_rng_next(&rng) % (unsigned long long)i);
        eu[i - 1] = i;
        ev[i - 1] = p;
      }
    },
    /* Run the kernel, expose ans_scalar as the result, then free the edge arrays. */
    kernel_run(n, eu, ev, &ans_scalar), ans_scalar, free(eu);
    free(ev);)
