#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#define AC_TOTFREQ 4096u
#define AC_SYM_FREQ 256u
typedef struct {
  uint32_t low;
  uint32_t high;
  uint8_t *out;
  size_t outpos;
} ac_enc;
static inline void ac_emit_byte(ac_enc *st, uint8_t b) {
  st->out[st->outpos++] = b;
}
static inline void ac_renorm(ac_enc *st) {
  while (((st->low ^ st->high) & 0xFF000000u) == 0) {
    ac_emit_byte(st, (uint8_t)(st->high >> 24));
    st->low <<= 8;
    st->high = (st->high << 8) | 0xFFu;
  }
}
static inline void ac_init(ac_enc *st, uint8_t *outbuf) {
  st->low = 0;
  st->high = 0xFFFFFFFFu;
  st->out = outbuf;
  st->outpos = 0;
}
static inline void ac_encode_sym(ac_enc *st, uint32_t sym) {
  uint32_t cum = sym << 8;
  uint32_t frq = AC_SYM_FREQ;
  uint64_t range = (uint64_t)st->high - (uint64_t)st->low + 1ull;
  uint32_t newLow =
      st->low + (uint32_t)((range * (uint64_t)cum) / (uint64_t)AC_TOTFREQ);
  uint32_t newHigh =
      st->low +
      (uint32_t)((range * (uint64_t)(cum + frq)) / (uint64_t)AC_TOTFREQ - 1ull);
  st->low = newLow;
  st->high = newHigh;
  ac_renorm(st);
}
static inline void ac_finish(ac_enc *st) {
  for (int i = 0; i < 4; i++) {
    ac_emit_byte(st, (uint8_t)(st->high >> 24));
    st->high <<= 8;
  }
}
static size_t ac_encode_stream(const uint8_t *in, int n, uint8_t *out) {
  ac_enc st;
  ac_init(&st, out);
  for (int i = 0; i < n; i++) {
    uint32_t sym = (uint32_t)(in[i] & 0x0Fu);
    ac_encode_sym(&st, sym);
  }
  ac_finish(&st);
  return st.outpos;
}
static double pipeline_run(int n, const uint8_t *inbuf, uint8_t *outbuf) {
  size_t outsz = ac_encode_stream(inbuf, n, outbuf);
  uint64_t acc = 0;
  for (size_t i = 0; i < outsz; i++)
    acc = (acc + (uint64_t)outbuf[i]) & 0xFFFFFFFFFFFFull;
  double v = 0.0;

  v = (double)acc;
  return v;
}
BENCH_MAIN_SCALAR3(
    T004_Module_037, ARITHENC, 4096, 16384, 65536,
    uint8_t *inbuf = (uint8_t *)malloc((size_t)n);
    uint8_t *outbuf = (uint8_t *)malloc((size_t)(n * 8 + 32));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++)
        inbuf[i] = (uint8_t)(bench_rng_next(&rng) & 0x0Fu);
    },
    ans_scalar = pipeline_run(n, inbuf, outbuf), ans_scalar, free(inbuf);
    free(outbuf);)
