#define _POSIX_C_SOURCE 199309L
#include "bench_utils.h"

#include <math.h>
#include <stdlib.h>
#include <string.h>
#include <sys/time.h>
#include <time.h>

/* ---------------- Timer ---------------- */
static struct timespec __t0;
void bench_timer_start(void) {
#if defined(CLOCK_MONOTONIC)
  clock_gettime(CLOCK_MONOTONIC, &__t0);
#else
  struct timeval tv;
  gettimeofday(&tv, NULL);
  __t0.tv_sec = tv.tv_sec;
  __t0.tv_nsec = tv.tv_usec * 1000;
#endif
}
double bench_timer_stop_seconds(void) {
#if defined(CLOCK_MONOTONIC)
  struct timespec t1;
  clock_gettime(CLOCK_MONOTONIC, &t1);
  return (t1.tv_sec - __t0.tv_sec) + (t1.tv_nsec - __t0.tv_nsec) / 1e9;
#else
  struct timeval tv;
  gettimeofday(&tv, NULL);
  long sec = tv.tv_sec - __t0.tv_sec;
  long nsec = tv.tv_usec * 1000 - __t0.tv_nsec;
  return sec + nsec / 1e9;
#endif
}

/* ---------------- FNV-1a base ---------------- */
static inline uint64_t fnv1a64_bytes(const void *data, size_t n) {
  const unsigned char *p = (const unsigned char *)data;
  uint64_t h = 1469598103934665603ULL;
  for (size_t i = 0; i < n; i++) {
    h ^= (uint64_t)p[i];
    h *= 1099511628211ULL;
  }
  return h;
}

/* ---------------- Tolerant hashing ---------------- */
static inline uint64_t mask_mantissa(double x, int ignore_bits,
                                     double atol_zero) {
  union {
    double d;
    uint64_t u;
  } v;
  v.d = x;
  if (x == 0.0 || fabs(x) < atol_zero)
    return 0ULL; /* canonical tiny/zero */
  uint64_t u = v.u;
  uint64_t exp = (u >> 52) & 0x7FFu;
  if (exp == 0x7FFu) { /* inf/NaN canonicalize */
    return (u & (1ULL << 63)) ? 0xFFF0000000000000ULL : 0x7FF0000000000000ULL;
  }
  if (ignore_bits <= 0)
    return u;
  uint64_t mask = ~((1ULL << ignore_bits) - 1ULL); /* chop low mantissa bits */
  return u & mask;
}

bench_tol_t bench_default_tol(void) {
  bench_tol_t t;
  t.ulp_ignore_bits = 3;
  t.atol_zero = 1e-300;
  const char *s1 = getenv("BENCH_TOL_IGN_BITS");
  const char *s2 = getenv("BENCH_ATOL");
  if (s1 && *s1) {
    int v = atoi(s1);
    if (v >= 0 && v <= 20)
      t.ulp_ignore_bits = v;
  }
  if (s2 && *s2) {
    t.atol_zero = atof(s2);
  }
  return t;
}

uint64_t bench_tol_hash_arrayd(const double *a, size_t n, bench_tol_t tol) {
  uint64_t h = 1469598103934665603ULL;
  for (size_t i = 0; i < n; i++) {
    uint64_t m = mask_mantissa(a[i], tol.ulp_ignore_bits, tol.atol_zero);
    h ^= m;
    h *= 1099511628211ULL;
  }
  return h;
}
uint64_t bench_tol_hash_double(double x, bench_tol_t tol) {
  uint64_t m = mask_mantissa(x, tol.ulp_ignore_bits, tol.atol_zero);
  return fnv1a64_bytes(&m, sizeof(m));
}

/* ---------------- Non-tolerant hashing ---------------- */
uint64_t bench_hash_bytes(const void *data, size_t nbytes) {
  return fnv1a64_bytes(data, nbytes);
}
uint64_t bench_hash_array_u64(const uint64_t *a, size_t n) {
  return fnv1a64_bytes(a, n * sizeof(uint64_t));
}

/* ---------------- Outer loop policy ---------------- */
static long long read_ll_env(const char *name, long long defv) {
  const char *s = getenv(name);
  if (!s || !*s)
    return defv;
  char *endp = NULL;
  long long v = strtoll(s, &endp, 10);
  if (endp == s)
    return defv;
  return v > 0 ? v : defv;
}
long long bench_outer_loops(int level) {
  long long l0 = read_ll_env("BENCH_OUTER0", 1LL);
  long long l1 = read_ll_env("BENCH_OUTER1", 100LL);
  long long l2 = read_ll_env("BENCH_OUTER2", 10000LL);
  long long l3 = read_ll_env("BENCH_OUTER3", 1000000LL);
  long long l4 = read_ll_env("BENCH_OUTER4", 100000000LL);
  long long l5 = read_ll_env("BENCH_OUTER5", 10000000000LL);
  long long l6 = read_ll_env("BENCH_OUTER6", 1000000000000LL);
  long long l7 = read_ll_env("BENCH_OUTER7", 100000000000000LL);
  long long l8 = read_ll_env("BENCH_OUTER8", 10000000000000000LL);
  if (level == 0)
    return l0;
  if (level == 1)
    return l1;
  if (level == 2)
    return l2;
  if (level == 3)
    return l3;
  if (level == 4)
    return l4;
  if (level == 5)
    return l5;
  if (level == 6)
    return l6;
  if (level == 7)
    return l7;
  return l8;
}

/* ---------------- RNG & fillers ---------------- */
bench_rng64_t bench_rng_init(uint64_t seed) {
  bench_rng64_t r;
  r.s = seed ? seed : 0x9e3779b97f4a7c15ULL;
  return r;
}
uint64_t bench_rng_next(bench_rng64_t *r) {
  uint64_t x = r->s;
  x ^= x >> 12;
  x ^= x << 25;
  x ^= x >> 27;
  r->s = x;
  return x * 2685821657736338717ULL;
}
double bench_rng_double01(bench_rng64_t *r) {
  union {
    uint64_t u;
    double d;
  } v;
  v.u = 0x3FF0000000000000ULL | (bench_rng_next(r) >> 12);
  return v.d - 1.0;
}
double bench_rng_double_signed(bench_rng64_t *r) {
  return 2.0 * bench_rng_double01(r) - 1.0;
}

void bench_fill_array(double *a, size_t n, uint64_t seed) {
  bench_rng64_t rng = bench_rng_init(seed);
  for (size_t i = 0; i < n; i++)
    a[i] = bench_rng_double_signed(&rng);
}
void bench_fill_array_pos(double *a, size_t n, uint64_t seed) {
  bench_rng64_t rng = bench_rng_init(seed);
  for (size_t i = 0; i < n; i++)
    a[i] = 0.5 + 0.5 * bench_rng_double01(&rng);
}

uint64_t bench_seed(int case_id) {
  return 0xC0FFEE1234567890ULL ^ (uint64_t)case_id * 0x9e3779b97f4a7c15ULL;
}
