#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const unsigned char *text, const unsigned char *pats,
                double *ans_out) {
  const int PATS = 64;
  const int PLEN = 8;
  const int ALPHA = 26;
  const int NODE_CAP = PATS * PLEN + 1;
  int *nxt = (int *)malloc((size_t)NODE_CAP * (size_t)ALPHA * sizeof(int));
  int *fail = (int *)malloc((size_t)NODE_CAP * sizeof(int));
  int *outc = (int *)malloc((size_t)NODE_CAP * sizeof(int));
  int *q = (int *)malloc((size_t)NODE_CAP * sizeof(int));
  if (!nxt || !fail || !outc || !q) {
    if (nxt)
      free(nxt);
    if (fail)
      free(fail);
    if (outc)
      free(outc);
    if (q)
      free(q);
    *ans_out = 0.0;
    return;
  }
  double ans_double = 0.0;

  memset(nxt, -1, (size_t)NODE_CAP * (size_t)ALPHA * sizeof(int));
  memset(fail, 0, (size_t)NODE_CAP * sizeof(int));
  memset(outc, 0, (size_t)NODE_CAP * sizeof(int));
  int node_cnt = 1;
  for (int p = 0; p < PATS; p++) {
    int node = 0;
    for (int k = 0; k < PLEN; k++) {
      unsigned char ch = pats[p * PLEN + k];
      int c = (int)(ch - 'a');
      if (c < 0)
        c = 0;
      if (c > 25)
        c = 25;
      if (nxt[node * ALPHA + c] == -1) {
        nxt[node * ALPHA + c] = node_cnt;
        memset(nxt + node_cnt * ALPHA, -1, ALPHA * sizeof(int));
        fail[node_cnt] = 0;
        outc[node_cnt] = 0;
        node_cnt++;
      }
      node = nxt[node * ALPHA + c];
    }
    outc[node]++;
  }
  int qh = 0, qt = 0;
  for (int c = 0; c < ALPHA; c++) {
    int v = nxt[0 * ALPHA + c];
    if (v != -1) {
      fail[v] = 0;
      q[qt++] = v;
    } else {
      nxt[0 * ALPHA + c] = 0;
    }
  }
  while (qh < qt) {
    int u = q[qh++];
    for (int c = 0; c < ALPHA; c++) {
      int v = nxt[u * ALPHA + c];
      if (v != -1) {
        fail[v] = nxt[fail[u] * ALPHA + c];
        outc[v] += outc[fail[v]];
        q[qt++] = v;
      } else {
        nxt[u * ALPHA + c] = nxt[fail[u] * ALPHA + c];
      }
    }
  }
  long long total_hits = 0;
  {
    int st = 0;
    for (int i = 0; i < n; i++) {
      int c = (int)(text[i] - 'a');
      if (c < 0)
        c = 0;
      if (c > 25)
        c = 25;
      st = nxt[st * ALPHA + c];
      total_hits += (long long)outc[st];
    }
  }
  ans_double = (double)total_hits;

  *ans_out = ans_double;
  free(nxt);
  free(fail);
  free(outc);
  free(q);
}
BENCH_MAIN_SCALAR3(
    T003_Code_008, AHOC, 4096, 16384, 65536, const int PATS = 64;
    const int PLEN = 8;
    unsigned char *text = (unsigned char *)malloc((size_t)n *
                                                  sizeof(unsigned char));
    unsigned char *pats = (unsigned char *)malloc((size_t)(PATS * PLEN) *
                                                  sizeof(unsigned char));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        text[i] = (unsigned char)('a' + (bench_rng_next(&rng) % 4ULL));
      }
      for (int i = 0; i < PATS * PLEN; i++) {
        pats[i] = (unsigned char)('a' + (bench_rng_next(&rng) % 4ULL));
      }
    },
    kernel_run(n, text, pats, &ans_scalar), ans_scalar, free(text);
    free(pats);)
