
#include "bench_harness.h"
#include "bench_utils.h"
#include <math.h>
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#define MDCT_N 8
#define MDCT_BLK (2 * MDCT_N)
static const double mdct_win16[MDCT_BLK] = {
    0.19509032201612825,  0.55557023301960218,  0.83146961230254524,
    0.98078528040323043,  0.98078528040323043,  0.83146961230254546,
    0.55557023301960218,  0.19509032201612861,  -0.19509032201612836,
    -0.55557023301960196, -0.83146961230254524, -0.98078528040323032,
    -0.98078528040323043, -0.83146961230254546, -0.55557023301960218,
    -0.19509032201612872};
static inline void apply_window16(const double *in, double *tmp) {
  for (int i = 0; i < MDCT_BLK; i++) {
    tmp[i] = in[i] * mdct_win16[i];
  }
}
static inline void mdct8(const double *xw, double *coef) {
  for (int k = 0; k < MDCT_N; k++) {
    double acc = 0.0;
    for (int n2 = 0; n2 < MDCT_BLK; n2++) {
      double ang = M_PI / (double)MDCT_N *
                   ((double)n2 + 0.5 + (double)MDCT_N / 2.0) *
                   ((double)k + 0.5);
      acc += xw[n2] * cos(ang);
    }
    coef[k] = acc;
  }
}
static double process_frames(int n, const double *input) {
  int frames = n / MDCT_BLK;
  double *blk = (double *)malloc((size_t)MDCT_BLK * sizeof(double));
  double *tmp = (double *)malloc((size_t)MDCT_BLK * sizeof(double));
  double *coef = (double *)malloc((size_t)MDCT_N * sizeof(double));
  double energy = 0.0;
  double e_local = 0.0;
  for (int f = 0; f < frames; f++) {
    const double *src = input + f * MDCT_BLK;
    for (int i = 0; i < MDCT_BLK; i++) {
      blk[i] = src[i];
    }
    apply_window16(blk, tmp);
    mdct8(tmp, coef);
    for (int k = 0; k < MDCT_N; k++) {
      double v = coef[k];
      e_local += v * v;
    }
  }
  energy = e_local;
  free(blk);
  free(tmp);
  free(coef);
  return energy;
}
BENCH_MAIN_SCALAR3(
    T004_Module_013, MDCTW, 4096, 16384, 65536,
    double *input = (double *)malloc((size_t)n * sizeof(double));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        input[i] = bench_rng_double_signed(&rng);
      }
    },
    ans_scalar = process_frames(n, input), ans_scalar, free(input);)
