
#include "bench_harness.h"
#include "bench_utils.h"
#include <math.h>
#include <stdint.h>
#include <stdlib.h>
static inline uint8_t clamp_u8(float v) {
  float r = roundf(v);
  if (r < 0.0f)
    r = 0.0f;
  if (r > 255.0f)
    r = 255.0f;
  return (uint8_t)r;
}
void kernel_run(int n, const float *x, const float *scale, const float *zero,
                uint8_t *q) {
  if (n < 1)
    n = 1;

  for (int i = 0; i < n; i++) {
    float sc = scale[i];
    if (sc == 0.0f) {
      sc = 1.0f;
    }
    float qf = x[i] / sc + zero[i];
    q[i] = clamp_u8(qf);
  }
}
BENCH_MAIN_ARRAY3_BYTES(
    T003_Code_059, OP89, 4096, 16384, 65536,
    uint8_t *q = (uint8_t *)malloc((size_t)n * sizeof(uint8_t));
    float *x = (float *)malloc((size_t)n * sizeof(float));
    float *scale = (float *)malloc((size_t)n * sizeof(float));
    float *zero = (float *)malloc((size_t)n * sizeof(float));
    double dummy_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        x[i] = (float)bench_rng_double_signed(&rng) * 8.0f;
        scale[i] = 0.1f + 0.9f * (float)bench_rng_double01(&rng);
        zero[i] = (float)(bench_rng_next(&rng) & 0xFFu);
      }
    },
    kernel_run(n, x, scale, zero, q), q, n, free(q);
    free(x); free(scale); free(zero);)
