#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const int *inc, double *ans_out) {
  if (n < 1) {
    *ans_out = 0.0;
    return;
  }
  long long *x = (long long *)malloc((size_t)n * sizeof(long long));
  long long *dp = (long long *)malloc((size_t)n * sizeof(long long));
  long long *hm = (long long *)malloc((size_t)n * sizeof(long long));
  long long *hb = (long long *)malloc((size_t)n * sizeof(long long));
  if (!x || !dp || !hm || !hb) {
    if (x)
      free(x);
    if (dp)
      free(dp);
    if (hm)
      free(hm);
    if (hb)
      free(hb);
    *ans_out = 0.0;
    return;
  }
  x[0] = 0;
  for (int i = 1; i < n; i++) {
    x[i] = x[i - 1] + (long long)inc[i];
  }
  const long long C = 1000LL;
  int hhead = 0, htail = 0;
  dp[0] = 0;
  hm[htail] = -2LL * x[0];
  hb[htail] = dp[0] + x[0] * x[0];
  htail++;
  for (int i = 1; i < n; i++) {
    while (htail - hhead >= 2) {
      long long m1 = hm[hhead];
      long long b1 = hb[hhead];
      long long m2 = hm[hhead + 1];
      long long b2 = hb[hhead + 1];
      long long v1 = m1 * x[i] + b1;
      long long v2 = m2 * x[i] + b2;
      if (v2 <= v1)
        hhead++;
      else
        break;
    }
    long long best = hm[hhead] * x[i] + hb[hhead];
    dp[i] = x[i] * x[i] + C + best;
    long long new_m = -2LL * x[i];
    long long new_b = dp[i] + x[i] * x[i];
    while (htail - hhead >= 2) {
      long long m1 = hm[htail - 2];
      long long b1 = hb[htail - 2];
      long long m2 = hm[htail - 1];
      long long b2 = hb[htail - 1];
      long long m3 = new_m;
      long long b3 = new_b;
      long double left = ((long double)(b2 - b1)) / ((long double)(m1 - m2));
      long double right = ((long double)(b3 - b2)) / ((long double)(m2 - m3));
      if (right <= left) {
        htail--;
      } else {
        break;
      }
    }
    hm[htail] = new_m;
    hb[htail] = new_b;
    htail++;
  }
  long long final_ans = dp[n - 1];
  double base_ans = (double)final_ans;
  double ans_double = 0.0;

  ans_double = base_ans;

  *ans_out = ans_double;
  free(x);
  free(dp);
  free(hm);
  free(hb);
}
BENCH_MAIN_SCALAR3(
    T003_Code_032, CHT, 4096, 16384, 65536,
    int *inc = (int *)malloc((size_t)n * sizeof(int));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        inc[i] = (int)(bench_rng_next(&rng) % 10ULL) + 1;
      }
    },
    kernel_run(n, inc, &ans_scalar), ans_scalar, free(inc);)
