
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const uint64_t *arr, double *ans_out) {
  int limit = (n < 64) ? n : 64;
  unsigned long long result_sum = 0ULL;
  unsigned long long rho_rng = 0x9e3779b97f4a7c15ULL ^ (unsigned long long)n;
  for (int idx = 0; idx < limit; idx++) {
    unsigned long long num0 = arr[idx];
    if (num0 < 2ULL)
      continue;
    unsigned long long st[128];
    int sp = 0;
    st[sp++] = num0;
    while (sp > 0) {
      unsigned long long cur_n = st[--sp];
      if (cur_n == 1ULL)
        continue;
      int isPrime;
      if (cur_n < 4ULL) {
        isPrime = (cur_n == 2ULL || cur_n == 3ULL);
      } else if ((cur_n & 1ULL) == 0ULL) {
        isPrime = 0;
      } else {
        isPrime = 1;
        unsigned long long d = cur_n - 1ULL;
        int s = 0;
        while ((d & 1ULL) == 0ULL) {
          d >>= 1;
          s++;
        }
        unsigned int bases[7] = {2U, 3U, 5U, 7U, 11U, 13U, 17U};
        for (int bi = 0; bi < 7 && isPrime; bi++) {
          unsigned long long a_base = (unsigned long long)bases[bi];
          if (a_base % cur_n == 0ULL)
            continue;
          unsigned long long base = a_base % cur_n;
          unsigned long long e = d;
          unsigned long long modn = cur_n;
          unsigned long long x = 1ULL;
          while (e) {
            if (e & 1ULL) {
              unsigned __int128 tmp = (unsigned __int128)x * base;
              x = (unsigned long long)(tmp % modn);
            }
            unsigned __int128 tmp2 = (unsigned __int128)base * base;
            base = (unsigned long long)(tmp2 % modn);
            e >>= 1ULL;
          }
          if (x == 1ULL || x == (modn - 1ULL))
            continue;
          int witness_ok = 0;
          for (int r = 1; r < s; r++) {
            unsigned __int128 tmp3 = (unsigned __int128)x * x;
            x = (unsigned long long)(tmp3 % modn);
            if (x == modn - 1ULL) {
              witness_ok = 1;
              break;
            }
          }
          if (!witness_ok) {
            isPrime = 0;
          }
        }
      }
      if (isPrime) {
        result_sum += cur_n;
        continue;
      }
      if ((cur_n & 1ULL) == 0ULL) {
        st[sp++] = 2ULL;
        st[sp++] = (cur_n >> 1);
        continue;
      }
      unsigned long long n_c = cur_n;
      unsigned long long found_factor = n_c;
      while (found_factor == n_c) {
        {
          unsigned long long xrs = rho_rng;
          xrs ^= xrs >> 12;
          xrs ^= xrs << 25;
          xrs ^= xrs >> 27;
          xrs *= 2685821657736338717ULL;
          rho_rng = xrs;
        }
        unsigned long long c = (rho_rng % (n_c - 1ULL)) + 1ULL;
        {
          unsigned long long xrs = rho_rng;
          xrs ^= xrs >> 12;
          xrs ^= xrs << 25;
          xrs ^= xrs >> 27;
          xrs *= 2685821657736338717ULL;
          rho_rng = xrs;
        }
        unsigned long long x = (rho_rng % (n_c - 2ULL)) + 2ULL;
        unsigned long long y = x;
        unsigned long long d = 1ULL;
        while (d == 1ULL) {
          {
            unsigned __int128 t1 = (unsigned __int128)x * x;
            x = (unsigned long long)(t1 % n_c);
            x += c;
            if (x >= n_c)
              x -= n_c;
          }
          {
            unsigned __int128 t2 = (unsigned __int128)y * y;
            y = (unsigned long long)(t2 % n_c);
            y += c;
            if (y >= n_c)
              y -= n_c;
            t2 = (unsigned __int128)y * y;
            y = (unsigned long long)(t2 % n_c);
            y += c;
            if (y >= n_c)
              y -= n_c;
          }
          unsigned long long diff = (x > y) ? (x - y) : (y - x);
          {
            unsigned long long a1 = diff;
            unsigned long long b1 = n_c;
            while (a1) {
              unsigned long long t = b1 % a1;
              b1 = a1;
              a1 = t;
            }
            d = b1;
          }
          if (d == n_c)
            break;
        }
        if (d != 1ULL && d != n_c) {
          found_factor = d;
          break;
        }
      }
      if (found_factor == n_c) {
        result_sum += n_c;
      } else {
        unsigned long long other = n_c / found_factor;
        st[sp++] = found_factor;
        st[sp++] = other;
      }
    }
  }
  double ans_double = 0.0;

  ans_double = (double)result_sum;

  *ans_out = ans_double;
}
BENCH_MAIN_SCALAR3(
    T003_Code_036, MRPOLLARD, 4096, 16384, 65536,
    uint64_t *arr = (uint64_t *)malloc((size_t)n * sizeof(uint64_t));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        uint64_t a0 = bench_rng_next(&rng) | 1ULL;
        uint64_t b0 = bench_rng_next(&rng) | 1ULL;
        uint64_t aa = a0 % 1000000007ULL;
        uint64_t bb = b0 % 1000000007ULL;
        arr[i] = aa * bb;
        if (arr[i] < 2ULL)
          arr[i] = 2ULL;
      }
    },
    kernel_run(n, arr, &ans_scalar), ans_scalar, free(arr);)
