#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const unsigned char *A, const unsigned char *B,
                double *y) {
  int nA = n / 2;
  int nB = n - nA;
  int max_states = 2 * nA + 5;
  int *link_arr = (int *)malloc((size_t)max_states * sizeof(int));
  int *stlen = (int *)malloc((size_t)max_states * sizeof(int));
  int *nxt = (int *)malloc((size_t)max_states * 26 * sizeof(int));
  if (!link_arr || !stlen || !nxt) {
    if (link_arr)
      free(link_arr);
    if (stlen)
      free(stlen);
    if (nxt)
      free(nxt);
    y[0] = 0.0;
    y[1] = 0.0;
    return;
  }
  double last_distinct = 0.0;
  double last_lcs = 0.0;

  int sz = 1;
  int last = 0;
  stlen[0] = 0;
  link_arr[0] = -1;
  memset(nxt + 0 * 26, -1, 26 * sizeof(int));
  for (int i = 0; i < nA; i++) {
    int c = (int)(A[i] - 'a');
    if (c < 0)
      c = 0;
    if (c > 25)
      c = 25;
    int cur = sz++;
    stlen[cur] = stlen[last] + 1;
    memset(nxt + cur * 26, -1, 26 * sizeof(int));
    int p = last;
    while (p != -1 && nxt[p * 26 + c] == -1) {
      nxt[p * 26 + c] = cur;
      p = link_arr[p];
    }
    if (p == -1) {
      link_arr[cur] = 0;
    } else {
      int q = nxt[p * 26 + c];
      if (stlen[p] + 1 == stlen[q]) {
        link_arr[cur] = q;
      } else {
        int clone = sz++;
        stlen[clone] = stlen[p] + 1;
        memcpy(nxt + clone * 26, nxt + q * 26, 26 * sizeof(int));
        link_arr[clone] = link_arr[q];
        while (p != -1 && nxt[p * 26 + c] == q) {
          nxt[p * 26 + c] = clone;
          p = link_arr[p];
        }
        link_arr[q] = clone;
        link_arr[cur] = clone;
      }
    }
    last = cur;
  }
  long long distinct = 0;
  for (int v = 1; v < sz; v++) {
    int lp = link_arr[v];
    int base = (lp < 0) ? 0 : stlen[lp];
    distinct += (long long)(stlen[v] - base);
  }
  {
    int v = 0;
    int lcur = 0;
    int best = 0;
    for (int i = 0; i < nB; i++) {
      int c = (int)(B[i] - 'a');
      if (c < 0)
        c = 0;
      if (c > 25)
        c = 25;
      while (v != -1 && nxt[v * 26 + c] == -1) {
        v = link_arr[v];
        if (v == -1) {
          v = 0;
          lcur = 0;
          break;
        }
        lcur = stlen[v];
      }
      if (nxt[v * 26 + c] != -1) {
        v = nxt[v * 26 + c];
        lcur++;
        if (lcur > best)
          best = lcur;
      }
    }
    last_distinct = (double)distinct;
    last_lcs = (double)best;
  }

  y[0] = last_distinct;
  y[1] = last_lcs;
  free(link_arr);
  free(stlen);
  free(nxt);
}
BENCH_MAIN_ARRAY3_D(
    T003_Code_013, SAMSTAT, 4096, 16384, 65536, int nA = n / 2; int nB = n - nA;
    unsigned char *A = (unsigned char *)malloc((size_t)nA *
                                               sizeof(unsigned char));
    unsigned char *B = (unsigned char *)malloc((size_t)nB *
                                               sizeof(unsigned char));
    double *y = (double *)malloc(2 * sizeof(double));
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < nA; i++) {
        A[i] = (unsigned char)('a' + (bench_rng_next(&rng) % 26ULL));
      }
      for (int i = 0; i < nB; i++) {
        B[i] = (unsigned char)('a' + (bench_rng_next(&rng) % 26ULL));
      }
    },
    kernel_run(n, A, B, y), y, 2, free(A);
    free(B); free(y);)
