
#include "bench_harness.h"
#include "bench_utils.h"
#include <math.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
void kernel_run(int n, double *w, double **b) {

  for (int i = 1; i < n; i++) {
    for (int k = 0; k < i; k++) {
      w[i] += b[k][i] * w[(i - k) - 1];
    }
  }
}
BENCH_MAIN_ARRAY3_D(
    T001_Loops_005, 06, 128, 256, 512,
    double *w = calloc((size_t)n, sizeof(double));
    double **b = malloc((size_t)n * sizeof(double *));
    double *bstore = malloc((size_t)n * n * sizeof(double)),
    {
      for (int i = 0; i < n; i++) {
        b[i] = bstore + i * (size_t)n;
      }
      bench_fill_array(w, n, bench_seed(8) ^ 0x13579);
      bench_fill_array(bstore, (size_t)n * n, bench_seed(8) ^ 0x24680);
    },
    kernel_run(n, w, b), w, n, free(bstore);
    free(b); free(w))
