
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdlib.h>
/*
 * Per-channel mean over a contiguous array of C planes of H*W doubles.
 *
 * For each channel c in [0, C), the H*W consecutive elements of x that
 * start at offset c * H * W are summed in increasing index order, and
 * the sum divided by H*W is stored in y[c].
 *
 * Parameters:
 *   C     number of channels; nothing is read or written when C <= 0.
 *   H, W  plane dimensions; only their product is used.
 *   x     input, read at indices [0, C*H*W).
 *   y     output, written at indices [0, C).
 *
 * The plane size is computed in long long and element offsets in size_t
 * so that large inputs cannot overflow int arithmetic. When H*W is not
 * positive no element of x is read and y[c] is 0.0 divided by that
 * product (NaN for a zero product under IEEE 754 arithmetic).
 */
void kernel_run(int C, int H, int W, const double *x, double *y) {
  /* Widen before multiplying: H * W in int is undefined on overflow. */
  const long long plane = (long long)H * (long long)W;
  const double denom = (double)plane;

  for (int c = 0; c < C; c++) {
    double acc = 0.0;

    if (plane > 0) {
      const size_t count = (size_t)plane;
      /* Offset in size_t: c * plane may exceed INT_MAX for big tensors. */
      const double *chan = x + (size_t)c * count;

      for (size_t i = 0; i < count; i++) {
        acc += chan[i];
      }
    }

    y[c] = acc / denom;
  }
}
/*
 * Benchmark entry point, produced by the BENCH_MAIN_ARRAY3_D macro
 * (defined outside this file; presumably in bench_harness.h -- confirm).
 *
 * Arguments as written, split at the top-level commas:
 *   - T002_Ops_042, OP72: identifiers handed to the harness.
 *   - 4096, 16384, 65536: three constants; they equal C*H*W for the
 *     three values of C selected below (4, 16 and 64 with H = W = 32).
 *     NOTE(review): presumably per-case element counts -- verify against
 *     the macro definition.
 *   - Declarations: H = W = 32; C is 4 when case_id == 1, 16 when
 *     case_id == 2, otherwise 64; x is allocated with C*H*W doubles and
 *     y with C doubles. case_id is not declared here, so it is assumed
 *     to be supplied by the macro expansion.
 *   - Initialisation: bench_fill_array fills the C*H*W elements of x
 *     using bench_seed(72).
 *   - Kernel call: kernel_run(C, H, W, x, y).
 *   - y, (size_t)C: presumably the result buffer and its length as seen
 *     by the harness -- TODO confirm.
 *   - Cleanup: free(x); free(y).
 *
 * NOTE(review): the declarations argument has no trailing ';' while the
 * fill argument does, so correctness depends on how the macro splices
 * its arguments. Neither malloc result is checked before use.
 */
BENCH_MAIN_ARRAY3_D(T002_Ops_042, OP72, 4096, 16384, 65536, int H = 32;
                    int W = 32;
                    int C = (case_id == 1 ? 4 : (case_id == 2 ? 16 : 64));
                    double *x = malloc((size_t)(C * H * W) * sizeof(double));
                    double *y = malloc((size_t)C * sizeof(double)),
                    bench_fill_array(x, (size_t)(C * H * W), bench_seed(72));
                    , kernel_run(C, H, W, x, y), y, (size_t)C, free(x); free(y))
