#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const int *a, double *ans_out) {
  double ans_double = 0.0;
  const int K = 5;
  const int MAXV = 64;

  long long res_k = 0;
  long long res_km1 = 0;
  {
    int cnt[MAXV];
    for (int ii = 0; ii < MAXV; ii++)
      cnt[ii] = 0;
    int distinct = 0;
    int left = 0;
    for (int right = 0; right < n; right++) {
      int v = a[right] & 63;
      if (cnt[v] == 0)
        distinct++;
      cnt[v]++;
      while (distinct > K) {
        int v2 = a[left] & 63;
        cnt[v2]--;
        if (cnt[v2] == 0)
          distinct--;
        left++;
      }
      res_k += (long long)(right - left + 1);
    }
  }
  {
    int cnt[MAXV];
    for (int ii = 0; ii < MAXV; ii++)
      cnt[ii] = 0;
    int distinct = 0;
    int left = 0;
    int K2 = K - 1;
    for (int right = 0; right < n; right++) {
      int v = a[right] & 63;
      if (cnt[v] == 0)
        distinct++;
      cnt[v]++;
      while (distinct > K2) {
        int v2 = a[left] & 63;
        cnt[v2]--;
        if (cnt[v2] == 0)
          distinct--;
        left++;
      }
      res_km1 += (long long)(right - left + 1);
    }
  }
  long long exact = res_k - res_km1;
  ans_double = (double)exact;

  *ans_out = ans_double;
}
BENCH_MAIN_SCALAR3(
    T003_Code_006, KDIST, 4096, 16384, 65536,
    int *a = (int *)malloc((size_t)n * sizeof(int));
    double ans_scalar = 0.0;,
                            {
                              bench_rng64_t rng = bench_rng_init(seed);
                              for (int i = 0; i < n; i++) {
                                a[i] = (int)(bench_rng_next(&rng) & 63ULL);
                              }
                            },
                            kernel_run(n, a, &ans_scalar), ans_scalar, free(a);)
