#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#define HSEED 0x9e3779b9u
static inline uint32_t mix32(uint32_t x) {
  x ^= HSEED;
  x ^= x >> 16;
  x *= 0x7feb352dU;
  x ^= x >> 15;
  x *= 0x846ca68bU;
  x ^= x >> 16;
  return x;
}
static size_t next_pow2_size(size_t x) {
  size_t p = 1;
  while (p < x)
    p <<= 1;
  return p;
}
static double hj_run(int n, const int *build_k, const double *build_v,
                     const int *probe_k, const double *probe_v) {
  int n_build = n / 2;
  if (n_build < 1)
    n_build = 1;
  int n_probe = n - n_build;
  size_t need = (size_t)((n_build * 10) / 7 + 1);
  size_t cap = next_pow2_size(need);
  int *hkeys = (int *)malloc(cap * sizeof(int));
  double *hvals = (double *)malloc(cap * sizeof(double));
  unsigned char *hused = (unsigned char *)malloc(cap * sizeof(unsigned char));
  if (!hkeys || !hvals || !hused) {
    if (hkeys)
      free(hkeys);
    if (hvals)
      free(hvals);
    if (hused)
      free(hused);
    return 0.0;
  }
  memset(hused, 0, cap * sizeof(unsigned char));
  for (int i = 0; i < n_build; i++) {
    int key = build_k[i];
    double val = build_v[i];
    size_t idx = (size_t)(mix32((uint32_t)key) & (uint32_t)(cap - 1));
    while (hused[idx] && hkeys[idx] != key)
      idx = (idx + 1) & (cap - 1);
    if (hused[idx]) {
      hvals[idx] += val;
    } else {
      hused[idx] = 1;
      hkeys[idx] = key;
      hvals[idx] = val;
    }
  }
  double acc = 0.0;
  for (int i = 0; i < n_probe; i++) {
    int key = probe_k[i];
    double v2 = probe_v[i];
    size_t idx = (size_t)(mix32((uint32_t)key) & (uint32_t)(cap - 1));
    while (hused[idx]) {
      if (hkeys[idx] == key) {
        acc += hvals[idx] * v2;
        break;
      }
      idx = (idx + 1) & (cap - 1);
    }
  }
  free(hkeys);
  free(hvals);
  free(hused);
  double ans = 0.0;

  ans = acc;
  return ans;
}
BENCH_MAIN_SCALAR3(
    T004_Module_051, HJOIN, 4096, 16384, 65536,
    int *build_k = (int *)malloc((size_t)n * sizeof(int));
    double *build_v = (double *)malloc((size_t)n * sizeof(double));
    int *probe_k = (int *)malloc((size_t)n * sizeof(int));
    double *probe_v = (double *)malloc((size_t)n * sizeof(double));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      int n_build = n / 2;
      if (n_build < 1)
        n_build = 1;
      int n_probe = n - n_build;
      for (int i = 0; i < n_build; i++) {
        build_k[i] = (int)(bench_rng_next(&rng) & 0xFFFFu);
        build_v[i] = bench_rng_double_signed(&rng);
      }
      for (int i = 0; i < n_probe; i++) {
        uint64_t r = bench_rng_next(&rng);
        if ((r & 1ULL) == 0 && n_build > 0) {
          int idx = (int)(bench_rng_next(&rng) % (unsigned long long)n_build);
          probe_k[i] = build_k[idx];
        } else {
          probe_k[i] = (int)(bench_rng_next(&rng) & 0xFFFFu);
        }
        probe_v[i] = bench_rng_double_signed(&rng);
      }
    },
    ans_scalar = hj_run(n, build_k, build_v, probe_k, probe_v), ans_scalar,
    free(build_k);
    free(build_v); free(probe_k); free(probe_v);)
