#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#define ASET 3
#define MAXNFA 32
#define MAXDFA 64
typedef struct {
  int ch;
  int out1;
  int out2;
} NState;
typedef struct {
  NState st[MAXNFA];
  int start;
  int n;
  int accept;
} MiniNFA;
typedef struct {
  int trans[ASET];
  int accept;
} DState;
typedef struct {
  DState st[MAXDFA];
  int used;
  int start;
} MiniDFA;
static int amap(char c) {
  if (c == 'a')
    return 0;
  if (c == 'b')
    return 1;
  if (c == 'c')
    return 2;
  return -1;
}
static void nfa_build_simple(MiniNFA *nfa) {
  nfa->n = 0;
  int s = nfa->n++;
  int a = nfa->n++;
  int b = nfa->n++;
  int t = nfa->n++;
  nfa->st[s].ch = -1;
  nfa->st[s].out1 = a;
  nfa->st[s].out2 = b;
  nfa->st[a].ch = amap('a');
  nfa->st[a].out1 = t;
  nfa->st[a].out2 = -1;
  nfa->st[b].ch = amap('b');
  nfa->st[b].out1 = t;
  nfa->st[b].out2 = -1;
  nfa->st[t].ch = -1;
  nfa->st[t].out1 = -1;
  nfa->st[t].out2 = -1;
  nfa->start = s;
  nfa->accept = t;
}
static void add_closure(const MiniNFA *nfa, int s, int *set, int *n) {
  int stack[64];
  int sp = 0;
  stack[sp++] = s;
  while (sp) {
    int u = stack[--sp];
    int seen = 0;
    for (int i = 0; i < *n; i++)
      if (set[i] == u) {
        seen = 1;
        break;
      }
    if (seen)
      continue;
    set[(*n)++] = u;
    if (nfa->st[u].ch < 0) {
      if (nfa->st[u].out1 >= 0)
        stack[sp++] = nfa->st[u].out1;
      if (nfa->st[u].out2 >= 0)
        stack[sp++] = nfa->st[u].out2;
    }
  }
}
static void move_set(const MiniNFA *nfa, const int *src, int ns, int c,
                     int *dst, int *nd) {
  *nd = 0;
  for (int i = 0; i < ns; i++) {
    int u = src[i];
    if (nfa->st[u].ch == c) {
      int v = nfa->st[u].out1;
      if (v >= 0)
        add_closure(nfa, v, dst, nd);
    }
  }
}
static int same_set(const int *a, int na, const int *b, int nb) {
  if (na != nb)
    return 0;
  for (int i = 0; i < na; i++)
    if (a[i] != b[i])
      return 0;
  return 1;
}
static int find_set(int sets[][64], int sizes[], int nset, const int *cur,
                    int ncur) {
  for (int i = 0; i < nset; i++) {
    if (same_set(sets[i], sizes[i], cur, ncur))
      return i;
  }
  return -1;
}
static void dfa_build(const MiniNFA *nfa, MiniDFA *dfa) {
  int sets[MAXDFA][64];
  int sizes[MAXDFA];
  int q[64];
  int qh = 0, qt = 0;
  int init[64];
  int ni = 0;
  add_closure(nfa, nfa->start, init, &ni);
  for (int i = 0; i < ni - 1; i++) {
    for (int j = i + 1; j < ni; j++) {
      if (init[j] < init[i]) {
        int tmp = init[i];
        init[i] = init[j];
        init[j] = tmp;
      }
    }
  }
  int idx0 = 0;
  sizes[0] = ni;
  for (int k = 0; k < ni; k++)
    sets[0][k] = init[k];
  dfa->used = 1;
  q[qt++] = 0;
  while (qh < qt) {
    int id = q[qh++];
    int is_acc = 0;
    for (int k = 0; k < sizes[id]; k++) {
      if (sets[id][k] == nfa->accept) {
        is_acc = 1;
        break;
      }
    }
    dfa->st[id].accept = is_acc;
    for (int c = 0; c < ASET; c++) {
      int tmp[64];
      int nt = 0;
      move_set(nfa, sets[id], sizes[id], c, tmp, &nt);
      for (int i = 0; i < nt - 1; i++) {
        for (int j = i + 1; j < nt; j++) {
          if (tmp[j] < tmp[i]) {
            int w = tmp[i];
            tmp[i] = tmp[j];
            tmp[j] = w;
          }
        }
      }
      int fid = -1;
      if (nt > 0) {
        fid = find_set(sets, sizes, dfa->used, tmp, nt);
        if (fid < 0) {
          fid = dfa->used++;
          sizes[fid] = nt;
          for (int k = 0; k < nt; k++)
            sets[fid][k] = tmp[k];
          q[qt++] = fid;
        }
      }
      dfa->st[id].trans[c] = fid;
    }
  }
  dfa->start = 0;
}
static int dfa_run(const MiniDFA *dfa, const char *s, int len) {
  int st = dfa->start;
  for (int i = 0; i < len; i++) {
    int c = amap(s[i]);
    if (c < 0)
      return 0;
    st = dfa->st[st].trans[c];
    if (st < 0)
      return 0;
  }
  return dfa->st[st].accept;
}
static double pipeline_run(const char *texts, int textlen) {
  MiniNFA nfa;
  nfa_build_simple(&nfa);
  MiniDFA dfa;
  dfa_build(&nfa, &dfa);
  double outv = 0.0;

  uint64_t acc = 1469598103934665603ULL;
  int pos = 0;
  while (pos < textlen) {
    int end = pos;
    while (end < textlen && texts[end] != '\n')
      end++;
    int l = end - pos;
    int m = dfa_run(&dfa, texts + pos, l);
    acc ^= ((uint64_t)m + 0x9e3779b97f4a7c15ULL * (uint64_t)l);
    if (end < textlen && texts[end] == '\n')
      end++;
    pos = end;
  }
  outv += (double)acc;

  return outv;
}
BENCH_MAIN_SCALAR3(T004_Module_027, REGDFA, 4096, 16384, 65536,
                   char *texts = (char *)malloc((size_t)n * 16 + 16);
                   int textlen = 0; double ans_scalar = 0.0;
                   , ({
                     bench_rng64_t rng = bench_rng_init(seed);
                     textlen = 0;
                     for (int i = 0; i < n; i++) {
                       unsigned long long r = bench_rng_next(&rng);
                       char line[32];
                       int L = 0;
                       for (int k = 0; k < 6; k++) {
                         char tbl[4] = {'a', 'b', 'c', 'a'};
                         line[L++] = tbl[(r >> (2 * k)) & 3ULL];
                       }
                       line[L++] = '\n';
                       if (textlen + L < (int)(n * 16 + 16)) {
                         memcpy(texts + textlen, line, L);
                         textlen += L;
                       } else {
                         break;
                       }
                     }
                   }),
                   ans_scalar = pipeline_run(texts, textlen), ans_scalar,
                   free(texts);)
