
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdlib.h>
void kernel_run(int H, int W, const double *x, double *y) {
  int HW = H * W;

  for (int iy = 0; iy < H; iy++) {
    for (int ix = 0; ix < W; ix++) {
      int base = (iy * W + ix) * 9;
      int k = 0;
      for (int ky = -1; ky <= 1; ky++) {
        int sy = iy + ky;
        for (int kx = -1; kx <= 1; kx++) {
          int sx = ix + kx;
          double v = 0.0;
          if (!(sy < 0 || sy >= H || sx < 0 || sx >= W)) {
            v = x[sy * W + sx];
          }
          y[base + k] = v;
          k++;
        }
      }
    }
  }
  (void)HW;
}
BENCH_MAIN_ARRAY3_D(T002_Ops_057, OP87, 4096, 16384, 65536,
                    int H = (case_id == 1 ? 16 : (case_id == 2 ? 32 : 64));
                    int W = H; int HW = H * W;
                    double *x = malloc((size_t)(HW) * sizeof(double));
                    double *y = malloc((size_t)(HW * 9) * sizeof(double)),
                    bench_fill_array(x, (size_t)(HW), bench_seed(87));
                    , kernel_run(H, W, x, y), y, (size_t)(HW * 9), free(x);
                    free(y))
