
#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
static inline size_t IDX(int r, int c, int m) {
  return (size_t)r * (size_t)m + (size_t)c;
}
void kernel_run(int n, int m, double *a, double *b, double *c, double *d,
                double *e, double *aa, double *bb, double *cc) {

  for (int j = 0; j < m; j++) {
    for (int i = j + 1; i < m; i++) {
      a[i] -= aa[IDX(j, i, m)] * a[j];
    }
  }
}
BENCH_MAIN_ARRAY3_D(T001_Loops_035, 115, 256, 1024, 4096, int m = n;
                    double *a = malloc((size_t)n * (size_t)m * sizeof(double));
                    double *b = malloc((size_t)n * (size_t)m * sizeof(double));
                    double *c = malloc((size_t)n * (size_t)m * sizeof(double));
                    double *d = malloc((size_t)n * (size_t)m * sizeof(double));
                    double *e = malloc((size_t)n * (size_t)m * sizeof(double));
                    double *aa = malloc((size_t)n * (size_t)m * sizeof(double));
                    double *bb = malloc((size_t)n * (size_t)m * sizeof(double));
                    double *cc = malloc((size_t)n * (size_t)m * sizeof(double));
                    , bench_fill_array(a, (n * m), bench_seed(1) ^ 0xa1);
                    bench_fill_array(b, (n * m), bench_seed(1) ^ 0xa2);
                    bench_fill_array(c, (n * m), bench_seed(1) ^ 0xa3);
                    bench_fill_array(d, (n * m), bench_seed(1) ^ 0xa4);
                    bench_fill_array(e, (n * m), bench_seed(1) ^ 0xa5);
                    bench_fill_array(aa, (n * m), bench_seed(1) ^ 0xa6);
                    bench_fill_array(bb, (n * m), bench_seed(1) ^ 0xa7);
                    bench_fill_array(cc, (n * m), bench_seed(1) ^ 0xa8);
                    , kernel_run(n, m, a, b, c, d, e, aa, bb, cc), a, (n * m),
                    free(a);
                    free(b); free(c); free(d); free(e); free(aa); free(bb);
                    free(cc);)
