#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
typedef struct {
  uint16_t buf[8];
  int len;
} Seq;
static int is_combining(uint16_t cp) {
  if (cp == 0x0301)
    return 1;
  return 0;
}
static void decompose_char(uint16_t cp, Seq *out) {
  out->len = 0;
  if (cp == 0x00E9) {
    out->buf[out->len++] = 0x0065;
    out->buf[out->len++] = 0x0301;
    return;
  }
  if (cp == 0x00E1) {
    out->buf[out->len++] = 0x0061;
    out->buf[out->len++] = 0x0301;
    return;
  }
  out->buf[out->len++] = cp;
}
static uint16_t compose_pair(uint16_t base, uint16_t mark) {
  if (base == 0x0065 && mark == 0x0301)
    return 0x00E9;
  if (base == 0x0061 && mark == 0x0301)
    return 0x00E1;
  return 0;
}
static int sort_marks(uint16_t *tmp, int n) { return n; }
static int normalize_line(const uint16_t *in, int inlen, uint16_t *out) {
  uint16_t tmp[64];
  int tlen = 0;
  for (int i = 0; i < inlen; i++) {
    Seq s;
    decompose_char(in[i], &s);
    for (int k = 0; k < s.len; k++) {
      tmp[tlen++] = s.buf[k];
      if (tlen >= 64)
        break;
    }
    if (tlen >= 64)
      break;
  }
  if (tlen <= 0) {
    return 0;
  }
  uint16_t basebuf[64];
  int blen = 0;
  for (int i = 0; i < tlen; i++) {
    uint16_t c = tmp[i];
    if (!is_combining(c)) {
      if (blen < 64)
        basebuf[blen++] = c;
    } else {
      if (blen < 64)
        basebuf[blen++] = c;
    }
  }
  uint16_t res[64];
  int rlen = 0;
  for (int i = 0; i < blen; i++) {
    if (!is_combining(basebuf[i])) {
      uint16_t base = basebuf[i];
      uint16_t marks[8];
      int mlen = 0;
      int j = i + 1;
      while (j < blen && is_combining(basebuf[j]) && mlen < 8) {
        marks[mlen++] = basebuf[j];
        j++;
      }
      sort_marks(marks, mlen);
      int consumed = 0;
      for (int mk = 0; mk < mlen; mk++) {
        uint16_t c = compose_pair(base, marks[mk]);
        if (c) {
          base = c;
          consumed = 1;
        } else {
          if (rlen < 64)
            res[rlen++] = base;
          base = marks[mk];
          consumed = 1;
        }
      }
      if (rlen < 64)
        res[rlen++] = base;
      i = j - 1;
    } else {
      if (rlen < 64)
        res[rlen++] = basebuf[i];
    }
  }
  for (int i = 0; i < rlen; i++)
    out[i] = res[i];
  return rlen;
}
static double pipeline_run(const uint16_t *lines, int total_u16) {
  double outv = 0.0;

  uint64_t acc = 1469598103934665603ULL;
  int pos = 0;
  while (pos < total_u16) {
    int L = lines[pos++];
    if (L < 0)
      L = 0;
    if (L > 30)
      L = 30;
    if (pos + L > total_u16)
      break;
    uint16_t buf[64];
    int nout = normalize_line(lines + pos, L, buf);
    for (int k = 0; k < nout; k++) {
      acc ^= (uint64_t)buf[k];
      acc *= 1099511628211ULL;
    }
    pos += L;
  }
  outv += (double)acc;

  return outv;
}
BENCH_MAIN_SCALAR3(
    T004_Module_029, NFCMINI, 4096, 16384, 65536,
    uint16_t *lines = (uint16_t *)malloc((size_t)n * 8 * sizeof(uint16_t));
    int total_u16 = 0; double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      total_u16 = 0;
      for (int i = 0; i < n; i++) {
        uint16_t seq[32];
        int L = 1 + (int)(bench_rng_next(&rng) % 8ULL);
        for (int k = 0; k < L; k++) {
          unsigned long long r = bench_rng_next(&rng);
          uint16_t pick;
          switch (r & 3ULL) {
          case 0:
            pick = 0x0061;
            break;
          case 1:
            pick = 0x0065;
            break;
          case 2:
            pick = 0x0301;
            break;
          default:
            pick = (r & 1ULL) ? 0x00E9 : 0x00E1;
            break;
          }
          seq[k] = pick;
        }
        if (total_u16 + 1 + L < (int)(n * 8)) {
          lines[total_u16++] = (uint16_t)L;
          for (int k = 0; k < L; k++)
            lines[total_u16++] = seq[k];
        } else
          break;
      }
    },
    ans_scalar = pipeline_run(lines, total_u16);
    , ans_scalar, free(lines);)
