
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, const uint32_t *remarr, const uint32_t *modarr,
                double *ans_out) {
  int T = (n < 3) ? n : 3;
  if (T <= 0) {
    *ans_out = 0.0;
    return;
  }
  unsigned long long r = (unsigned long long)(remarr[0] % modarr[0]);
  unsigned long long M = (unsigned long long)modarr[0];
  if (M == 0ULL)
    M = 1ULL;
  for (int idx = 1; idx < T; idx++) {
    unsigned long long a2 = (unsigned long long)(remarr[idx] % modarr[idx]);
    unsigned long long m2 = (unsigned long long)modarr[idx];
    if (m2 == 0ULL)
      m2 = 1ULL;
    unsigned long long r_mod_m2 = r % m2;
    unsigned long long diff_mod =
        (a2 >= r_mod_m2) ? (a2 - r_mod_m2) : (a2 + m2 - r_mod_m2);
    unsigned long long A = M;
    unsigned long long B = m2;
    while (B != 0ULL) {
      unsigned long long tmp = A % B;
      A = B;
      B = tmp;
    }
    unsigned long long g = A;
    if ((diff_mod % g) != 0ULL) {
      continue;
    }
    unsigned long long Mprime = M / g;
    unsigned long long mprime = m2 / g;
    unsigned long long rhs = diff_mod / g;
    unsigned long long aa = Mprime;
    unsigned long long bb = mprime;
    long long x0 = 1, y0 = 0;
    long long x1 = 0, y1 = 1;
    while (bb != 0ULL) {
      unsigned long long q = aa / bb;
      unsigned long long tmp_ab = aa - q * bb;
      aa = bb;
      bb = tmp_ab;
      long long tx = x0 - (long long)q * x1;
      long long ty = y0 - (long long)q * y1;
      x0 = x1;
      y0 = y1;
      x1 = tx;
      y1 = ty;
    }
    long long invMprime_signed = x0;
    long long mod_mprime_signed = (long long)mprime;
    long long t_mod_signed =
        (long long)(((__int128)rhs * (__int128)invMprime_signed) %
                    (__int128)mod_mprime_signed);
    if (t_mod_signed < 0)
      t_mod_signed += (long long)mprime;
    unsigned long long t_mod = (unsigned long long)t_mod_signed;
    unsigned long long M_new = M * (m2 / g);
    __uint128_t bigX = (__uint128_t)r + (__uint128_t)M * (__uint128_t)t_mod;
    unsigned long long x_new = (unsigned long long)(bigX % (__uint128_t)M_new);
    r = x_new;
    M = M_new;
    if (M == 0ULL)
      M = 1ULL;
  }
  double ans_double = 0.0;

  ans_double = (double)r;

  *ans_out = ans_double;
}
BENCH_MAIN_SCALAR3(
    T003_Code_038, CRTG, 4096, 16384, 65536,
    uint32_t *rarr = (uint32_t *)malloc((size_t)n * sizeof(uint32_t));
    uint32_t *marr = (uint32_t *)malloc((size_t)n * sizeof(uint32_t));
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        uint32_t mv = (uint32_t)(1000U + (bench_rng_next(&rng) % 8000ULL));
        if (mv == 0U)
          mv = 1U;
        marr[i] = mv;
        uint32_t rv = (uint32_t)(bench_rng_next(&rng) % mv);
        rarr[i] = rv;
      }
    },
    kernel_run(n, rarr, marr, &ans_scalar), ans_scalar, free(rarr);
    free(marr);)
