
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/*
 * Sums, over every vertex of a tree rooted at vertex 0, the largest number of
 * vertices inside that vertex's subtree that share one color class.
 *
 * n        number of vertices; the tree has n - 1 edges.
 * eu, ev   edge i joins eu[i] and ev[i]; both must lie in [0, n). The edges
 *          must form a tree (connected, acyclic) -- this is not verified.
 *          Neither array is read when n == 1.
 * color    color[v] & 63 is the color class of vertex v (64 classes).
 * ans_out  receives the sum converted to double. It is set to 0.0 when
 *          n <= 0 or when a working buffer cannot be allocated.
 *
 * Edge indices are stored as int, so 2 * (n - 1) must be representable as int.
 */
void kernel_run(int n, const int *eu, const int *ev, const unsigned char *color,
                double *ans_out) {
  enum { NUM_COLORS = 64 };

  *ans_out = 0.0;
  if (n <= 0) {
    return;
  }

  const size_t nodes = (size_t)n;
  const int m = n - 1;

  /* The per-vertex histogram table is the largest buffer; refuse sizes whose
   * byte count would wrap size_t instead of under-allocating. */
  if (nodes > SIZE_MAX / ((size_t)NUM_COLORS * sizeof(int))) {
    return;
  }

  /* A single vertex has no edges. Still request one slot so that a NULL
   * result always means allocation failure, never a legal malloc(0). */
  const size_t edge_slots = (m > 0) ? 2 * (size_t)m : 1;

  int *head = malloc(nodes * sizeof *head);
  int *to = malloc(edge_slots * sizeof *to);
  int *nxt = malloc(edge_slots * sizeof *nxt);
  int *parent = malloc(nodes * sizeof *parent);
  int *q = malloc(nodes * sizeof *q);
  int *order = malloc(nodes * sizeof *order);
  int *bestcnt = malloc(nodes * sizeof *bestcnt);
  int *cnt = malloc(nodes * NUM_COLORS * sizeof *cnt);
  if (!head || !to || !nxt || !parent || !q || !order || !bestcnt || !cnt) {
    goto cleanup;
  }

  /* Build a linked adjacency list: head[v] is the first half-edge leaving v,
   * nxt[e] the next one, to[e] its target. Each edge is stored twice. */
  for (int i = 0; i < n; i++) {
    head[i] = -1;
  }
  int ei = 0;
  for (int i = 0; i < m; i++) {
    int a = eu[i];
    int b = ev[i];
    to[ei] = b;
    nxt[ei] = head[a];
    head[a] = ei;
    ei++;
    to[ei] = a;
    nxt[ei] = head[b];
    head[b] = ei;
    ei++;
  }

  /* Breadth-first traversal from vertex 0 records parents and visit order.
   * The root is its own parent so the "skip the parent" test below works
   * uniformly for every vertex. */
  parent[0] = 0;
  int qh = 0;
  int qt = 0;
  int ord_sz = 0;
  q[qt++] = 0;
  while (qh < qt) {
    int v = q[qh++];
    order[ord_sz++] = v;
    for (int e = head[v]; e != -1; e = nxt[e]) {
      int u = to[e];
      if (u == parent[v]) {
        continue;
      }
      parent[u] = v;
      q[qt++] = u;
    }
  }

  /* Walking the BFS order backwards finishes every child before its parent,
   * so each child's histogram is complete when it is merged upward. */
  for (int idx = ord_sz - 1; idx >= 0; idx--) {
    int v = order[idx];
    /* Offsets are computed in size_t: v * 64 can exceed INT_MAX for large n. */
    int *hist_v = cnt + (size_t)v * NUM_COLORS;
    for (int c = 0; c < NUM_COLORS; c++) {
      hist_v[c] = 0;
    }
    int colv = (int)(color[v] & 63u);
    hist_v[colv] += 1;
    int best_local = hist_v[colv];
    for (int e = head[v]; e != -1; e = nxt[e]) {
      int u = to[e];
      if (parent[u] != v) {
        continue; /* u is v's parent, not a child */
      }
      const int *hist_u = cnt + (size_t)u * NUM_COLORS;
      for (int c = 0; c < NUM_COLORS; c++) {
        int merged = hist_v[c] + hist_u[c];
        hist_v[c] = merged;
        if (merged > best_local) {
          best_local = merged;
        }
      }
    }
    bestcnt[v] = best_local;
  }

  long long total = 0;
  for (int i = 0; i < n; i++) {
    total += (long long)bestcnt[i];
  }
  *ans_out = (double)total;

cleanup:
  /* free(NULL) is a no-op, so one path serves both success and failure. */
  free(head);
  free(to);
  free(nxt);
  free(parent);
  free(q);
  free(order);
  free(bestcnt);
  free(cnt);
}
/*
 * Benchmark driver for kernel_run, produced by the BENCH_MAIN_SCALAR3 macro.
 * The macro is defined outside this file, so the role of each argument below
 * is inferred from its contents -- confirm against bench_harness.h.
 * `n` and `seed` are not declared here; presumably the macro supplies them.
 */
BENCH_MAIN_SCALAR3(
    /* Identifiers and three numeric values, presumably the benchmark name/tag
     * and the problem sizes to run -- TODO confirm. */
    T003_Code_026, DSUOT, 4096, 16384, 65536,
    /* Buffers: n - 1 edges (eu[i], ev[i]) and one color byte per vertex.
     * NOTE(review): the malloc results are not checked before use. */
    int *eu = (int *)malloc((size_t)(n - 1) * sizeof(int));
    int *ev = (int *)malloc((size_t)(n - 1) * sizeof(int));
    unsigned char *color = (unsigned char *)malloc((size_t)n *
                                                   sizeof(unsigned char));
    double ans_scalar = 0.0;
    ,
    {
      /* Random tree: vertex i (i >= 1) is joined to a vertex drawn from
       * [0, i) via bench_rng_next % i, so every edge points to a
       * lower-numbered vertex. */
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 1; i < n; i++) {
        int p = (int)(bench_rng_next(&rng) % (unsigned long long)i);
        eu[i - 1] = i;
        ev[i - 1] = p;
      }
      /* Each vertex gets a color in [0, 64). */
      for (int i = 0; i < n; i++) {
        color[i] = (unsigned char)(bench_rng_next(&rng) % 64ULL);
      }
    },
    /* Kernel call, the scalar it produced, then release of the buffers. */
    kernel_run(n, eu, ev, color, &ans_scalar), ans_scalar, free(eu);
    free(ev); free(color);)
