
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, double *ans_out) {
  if (n < 2)
    n = 2;
  uint32_t *orig = (uint32_t *)malloc((size_t)n * sizeof(uint32_t));
  uint32_t *vals = (uint32_t *)malloc((size_t)n * sizeof(uint32_t));
  uint32_t *tmpv = (uint32_t *)malloc((size_t)n * sizeof(uint32_t));
  uint32_t *uniq = (uint32_t *)malloc((size_t)n * sizeof(uint32_t));
  int *rankv = (int *)malloc((size_t)n * sizeof(int));
  int *cnt = (int *)malloc((size_t)65536 * sizeof(int));
  int *roots = (int *)malloc((size_t)(n + 1) * sizeof(int));
  int capNodes = n * 24 + 5;
  int *lc = (int *)malloc((size_t)capNodes * sizeof(int));
  int *rc = (int *)malloc((size_t)capNodes * sizeof(int));
  int *sm = (int *)malloc((size_t)capNodes * sizeof(int));
  if (!orig || !vals || !tmpv || !uniq || !rankv || !cnt || !roots || !lc ||
      !rc || !sm) {
    if (orig)
      free(orig);
    if (vals)
      free(vals);
    if (tmpv)
      free(tmpv);
    if (uniq)
      free(uniq);
    if (rankv)
      free(rankv);
    if (cnt)
      free(cnt);
    if (roots)
      free(roots);
    if (lc)
      free(lc);
    if (rc)
      free(rc);
    if (sm)
      free(sm);
    *ans_out = 0.0;
    return;
  }
  for (int i = 0; i < n; i++) {
    uint32_t v = (uint32_t)((1103515245u * (unsigned)i + 12345u + (unsigned)n) &
                            0x00FFFFFFu);
    orig[i] = v;
    vals[i] = v;
  }
  for (int i = 0; i < 65536; i++)
    cnt[i] = 0;
  for (int i = 0; i < n; i++) {
    unsigned idx = vals[i] & 0xFFFFu;
    cnt[idx]++;
  }
  {
    int sumc = 0;
    for (int i = 0; i < 65536; i++) {
      int c = cnt[i];
      cnt[i] = sumc;
      sumc += c;
    }
  }
  for (int i = 0; i < n; i++) {
    unsigned idx = vals[i] & 0xFFFFu;
    tmpv[cnt[idx]++] = vals[i];
  }
  for (int i = 0; i < 65536; i++)
    cnt[i] = 0;
  for (int i = 0; i < n; i++) {
    unsigned idx = (tmpv[i] >> 16) & 0xFFFFu;
    cnt[idx]++;
  }
  {
    int sumc = 0;
    for (int i = 0; i < 65536; i++) {
      int c = cnt[i];
      cnt[i] = sumc;
      sumc += c;
    }
  }
  for (int i = 0; i < n; i++) {
    unsigned idx = (tmpv[i] >> 16) & 0xFFFFu;
    vals[cnt[idx]++] = tmpv[i];
  }
  int m = 0;
  for (int i = 0; i < n; i++) {
    if (i == 0 || vals[i] != vals[i - 1]) {
      uniq[m++] = vals[i];
    }
  }
  if (m <= 0)
    m = 1;
  for (int i = 0; i < n; i++) {
    uint32_t x = orig[i];
    int lo = 0, hi = m - 1;
    while (lo <= hi) {
      int mid = (lo + hi) >> 1;
      if (uniq[mid] < x) {
        lo = mid + 1;
      } else {
        hi = mid - 1;
      }
    }
    rankv[i] = lo + 1;
  }
  lc[0] = 0;
  rc[0] = 0;
  sm[0] = 0;
  int nodeCnt = 1;
  roots[0] = 0;
  for (int i = 0; i < n; i++) {
    int rnk = rankv[i];
    int prevRoot = roots[i];
    int newRoot = nodeCnt++;
    {
      int pr = prevRoot;
      if (pr == 0) {
        lc[newRoot] = 0;
        rc[newRoot] = 0;
        sm[newRoot] = 0;
      } else {
        lc[newRoot] = lc[pr];
        rc[newRoot] = rc[pr];
        sm[newRoot] = sm[pr];
      }
    }
    int curNew = newRoot;
    int curPrev = prevRoot;
    sm[curNew] = sm[curPrev] + 1;
    int lo = 1;
    int hi2 = m;
    while (lo < hi2) {
      int mid = (lo + hi2) >> 1;
      if (rnk <= mid) {
        int prevLeft = (curPrev == 0) ? 0 : lc[curPrev];
        int prevRight = (curPrev == 0) ? 0 : rc[curPrev];
        int newLeft = nodeCnt++;
        if (prevLeft == 0) {
          lc[newLeft] = 0;
          rc[newLeft] = 0;
          sm[newLeft] = 0;
        } else {
          lc[newLeft] = lc[prevLeft];
          rc[newLeft] = rc[prevLeft];
          sm[newLeft] = sm[prevLeft];
        }
        lc[curNew] = newLeft;
        rc[curNew] = prevRight;
        curNew = newLeft;
        curPrev = prevLeft;
        sm[curNew] = sm[curPrev] + 1;
        hi2 = mid;
      } else {
        int prevLeft = (curPrev == 0) ? 0 : lc[curPrev];
        int prevRight = (curPrev == 0) ? 0 : rc[curPrev];
        int newRight = nodeCnt++;
        if (prevRight == 0) {
          lc[newRight] = 0;
          rc[newRight] = 0;
          sm[newRight] = 0;
        } else {
          lc[newRight] = lc[prevRight];
          rc[newRight] = rc[prevRight];
          sm[newRight] = sm[prevRight];
        }
        lc[curNew] = prevLeft;
        rc[curNew] = newRight;
        curNew = newRight;
        curPrev = prevRight;
        sm[curNew] = sm[curPrev] + 1;
        lo = mid + 1;
      }
    }
    roots[i + 1] = newRoot;
  }
  unsigned long long checksum = 0ULL;
  for (int t = 0; t < n; t++) {
    int L = (t * 37 + 11) % n;
    int R = (t * 97 + 7) % n;
    if (L > R) {
      int tmp = L;
      L = R;
      R = tmp;
    }
    int len = R - L + 1;
    if (len <= 0)
      len = 1;
    int kth = (int)(((unsigned)(t * 131 + 17U) % (unsigned)len)) + 1;
    int leftRoot = roots[L];
    int rightRoot = roots[R + 1];
    int lo = 1;
    int hi2 = m;
    while (lo < hi2) {
      int mid = (lo + hi2) >> 1;
      int leftL = lc[leftRoot];
      int rightL = lc[rightRoot];
      int cntLeft = sm[rightL] - sm[leftL];
      if (kth <= cntLeft) {
        leftRoot = leftL;
        rightRoot = rightL;
        hi2 = mid;
      } else {
        kth -= cntLeft;
        leftRoot = rc[leftRoot];
        rightRoot = rc[rightRoot];
        lo = mid + 1;
      }
    }
    uint32_t realv = uniq[lo - 1];
    checksum += (unsigned long long)realv;
  }
  double ans_double = 0.0;

  ans_double = (double)checksum;

  *ans_out = ans_double;
  free(orig);
  free(vals);
  free(tmpv);
  free(uniq);
  free(rankv);
  free(cnt);
  free(roots);
  free(lc);
  free(rc);
  free(sm);
}
BENCH_MAIN_SCALAR3(T003_Code_049, PST, 4096, 16384, 65536,
                   double ans_scalar = 0.0;
                   , ;, kernel_run(n, &ans_scalar), ans_scalar, ;)
