#include "bench_harness.h"
#include "bench_utils.h"
#include <math.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#define IDX(i, j, n) ((size_t)(i) * (size_t)(n) + (size_t)(j))
void kernel_run(int n, double *ex, double *ey, double *hz) {
  double ce = 0.5, ch = 0.7;

  for (int i = 0; i < n; i++) {
    for (int j = 1; j < n; j++) {
      ex[IDX(i, j, n)] =
          ex[IDX(i, j, n)] + ce * (hz[IDX(i, j, n)] - hz[IDX(i, j - 1, n)]);
    }
  }
  for (int i = 1; i < n; i++) {
    for (int j = 0; j < n; j++) {
      ey[IDX(i, j, n)] =
          ey[IDX(i, j, n)] - ce * (hz[IDX(i, j, n)] - hz[IDX(i - 1, j, n)]);
    }
  }
  for (int i = 0; i < n - 1; i++) {
    for (int j = 0; j < n - 1; j++) {
      hz[IDX(i, j, n)] =
          hz[IDX(i, j, n)] + ch * (ex[IDX(i, j + 1, n)] - ex[IDX(i, j, n)] +
                                   ey[IDX(i + 1, j, n)] - ey[IDX(i, j, n)]);
    }
  }
}
BENCH_MAIN_ARRAY3_D(T001_Loops_022, 06, 128, 256, 512,
                    double *ex = malloc((size_t)n * n * sizeof(double));
                    double *ey = malloc((size_t)n * n * sizeof(double));
                    double *hz = malloc((size_t)n * n * sizeof(double));
                    , bench_fill_array(ex, (size_t)n *n, bench_seed(10));
                    bench_fill_array(ey, (size_t)n *n, bench_seed(11));
                    bench_fill_array(hz, (size_t)n *n, bench_seed(12));
                    , kernel_run(n, ex, ey, hz);, hz, (size_t)n *n, free(ex);
                    free(ey); free(hz);)
