#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const double *x, double *y) {
  int w = n / 64 + 1;
  if (w < 1)
    w = 1;
  if (w > n)
    w = n;
  int *dq = (int *)malloc((size_t)n * sizeof(int));
  if (!dq)
    return;

  int head = 0;
  int tail = 0;
  int out_idx = 0;
  for (int i = 0; i < n; i++) {
    while (head < tail && x[dq[tail - 1]] <= x[i]) {
      tail--;
    }
    dq[tail++] = i;
    if (dq[head] <= i - w)
      head++;
    if (i >= w - 1) {
      y[out_idx++] = x[dq[head]];
    }
  }
  for (int k = out_idx; k < n; k++) {
    y[k] = 0.0;
  }

  free(dq);
}
BENCH_MAIN_ARRAY3_D(T003_Code_007, SWMAX, 4096, 16384, 65536,
                    double *x = malloc((size_t)n * sizeof(double));
                    double *y = malloc((size_t)n * sizeof(double)),
                    bench_fill_array(x, n, seed);
                    , kernel_run(n, x, y), y, n, free(x); free(y);)
