
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdlib.h>
void kernel_run(int rows, int cols, const double *x, const double *bias,
                double *y) {

  for (int r = 0; r < rows; r++) {
    for (int c = 0; c < cols; c++) {
      int idx = r * cols + c;
      y[idx] = x[idx] + bias[c];
    }
  }
}
BENCH_MAIN_ARRAY3_D(
    T002_Ops_039, OP69, 16384, 32768, 65536,
    int rows = (case_id == 1 ? 128 : (case_id == 2 ? 256 : 512));
    int cols = 128; double *x = malloc((size_t)n * sizeof(double));
    double *bias = malloc((size_t)cols * sizeof(double));
    double *y = malloc((size_t)n * sizeof(double)),
    bench_fill_array(x, (size_t)n, bench_seed(69));
    bench_fill_array(bias, (size_t)cols, bench_seed(69) ^ 0xBEEu);
    , kernel_run(rows, cols, x, bias, y), y, (size_t)n, free(x); free(bias);
    free(y))
