#include "bench_harness.h"
#include "bench_utils.h"
#include <math.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#define IDX(i, j, n) ((size_t)(i) * (size_t)(n) + (size_t)(j))
static inline int pairable(int a, int b) { return ((a + b) % 3) == 0; }

void kernel_run(int n, int *S, const int *seq) {
  for (int d = 1; d < n; d++) {
    for (int i = 0; i < n - d; i++) {
      int j = i + d;
      int best = 0;
      best = S[i * n + (j - 1)];
      if (pairable(seq[i], seq[j])) {
        int v = ((i + 1) <= (j - 1)) ? S[(i + 1) * n + (j - 1)] + 1 : 1;
        if (v > best)
          best = v;
      }
      for (int k = i; k < j; k++) {
        int v = S[i * n + k] + S[(k + 1) * n + j];
        if (v > best)
          best = v;
      }
      S[i * n + j] = best;
    }
  }
}

BENCH_MAIN_ARRAY3_BYTES(
    pb_nussinov, 16, 128, 192, 256,
    int *S = (int *)calloc((size_t)n * (size_t)n, sizeof(int));
    int *seq = (int *)malloc((size_t)n * sizeof(int));
    , bench_rng64_t r = bench_rng_init(bench_seed(222));
    for (int i = 0; i < n; i++) seq[i] = (int)(bench_rng_next(&r) & 3ULL);
    , kernel_run(n, S, seq), S, (size_t)n *(size_t)n * sizeof(int), free(S);
    free(seq);)
