
#include "bench_harness.h"
#include "bench_utils.h"
#include <math.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int H, int W, const double *x, double *y) {
  int OH = H / 2, OW = W / 2;

  for (int i = 0; i < OH; i++) {
    for (int j = 0; j < OW; j++) {
      int r = i * 2, c = j * 2;
      double a = x[r * W + c], b = x[r * W + c + 1], d = x[(r + 1) * W + c],
             e = x[(r + 1) * W + c + 1];
      double m = a;
      if (b > m)
        m = b;
      if (d > m)
        m = d;
      if (e > m)
        m = e;
      y[i * OW + j] = m;
    }
  }
}
BENCH_MAIN_ARRAY3_D(
    T002_Ops_016, OP16, 4096, 16384, 65536,
    int H = (case_id == 1 ? 64 : (case_id == 2 ? 128 : 256));
    int W = H; double *x = malloc((size_t)H * W * sizeof(double));
    double *y = malloc((size_t)(H / 2) * (W / 2) * sizeof(double)),
    bench_fill_array(x, (size_t)H *W, bench_seed(16));
    , kernel_run(H, W, x, y), y, (size_t)(H / 2) * (W / 2), free(x); free(y))
