#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const int *a, double *ans_out) {
  int *tails_val = (int *)malloc((size_t)n * sizeof(int));
  int *tails_idx = (int *)malloc((size_t)n * sizeof(int));
  int *prev_idx = (int *)malloc((size_t)n * sizeof(int));
  if (!tails_val || !tails_idx || !prev_idx) {
    if (tails_val)
      free(tails_val);
    if (tails_idx)
      free(tails_idx);
    if (prev_idx)
      free(prev_idx);
    *ans_out = 0.0;
    return;
  }
  int lis_len = 0;
  for (int i = 0; i < n; i++) {
    int v = a[i];
    int lo = 0, hi = lis_len;
    while (lo < hi) {
      int mid = (lo + hi) >> 1;
      if (tails_val[mid] >= v)
        hi = mid;
      else
        lo = mid + 1;
    }
    int pos = lo;
    tails_val[pos] = v;
    tails_idx[pos] = i;
    prev_idx[i] = (pos > 0) ? tails_idx[pos - 1] : -1;
    if (pos == lis_len)
      lis_len++;
  }
  long long sum_lis = 0;
  if (lis_len > 0) {
    int cur = tails_idx[lis_len - 1];
    while (cur != -1) {
      sum_lis += (long long)a[cur];
      cur = prev_idx[cur];
    }
  }
  double base_ans = (double)lis_len + 1e-6 * (double)sum_lis;
  double ans_double = 0.0;

  ans_double = base_ans;

  *ans_out = ans_double;
  free(tails_val);
  free(tails_idx);
  free(prev_idx);
}
BENCH_MAIN_SCALAR3(
    T003_Code_029, LIS, 4096, 16384, 65536,
    int *a = (int *)malloc((size_t)n * sizeof(int));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        a[i] = (int)((long long)(bench_rng_next(&rng) % 1000000ULL) - 500000LL);
      }
    },
    kernel_run(n, a, &ans_scalar), ans_scalar, free(a);)
