#include "bench_harness.h"
#include "bench_utils.h"
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
static inline uint16_t rd16be(const uint8_t *p) {
  return (uint16_t)(((uint16_t)p[0] << 8) | (uint16_t)p[1]);
}
static inline uint32_t rd32be(const uint8_t *p) {
  return ((uint32_t)p[0] << 24) | ((uint32_t)p[1] << 16) |
         ((uint32_t)p[2] << 8) | (uint32_t)p[3];
}
static inline uint16_t ip_checksum16(const uint8_t *p, int len) {
  uint32_t s = 0;
  for (int i = 0; i < len; i += 2) {
    uint16_t w = (uint16_t)(((uint16_t)p[i] << 8) | (uint16_t)p[i + 1]);
    s += (uint32_t)w;
    if (s > 0xFFFFu)
      s = (s & 0xFFFFu) + 1u;
  }
  return (uint16_t)(~s & 0xFFFFu);
}
static void make_pkt(uint8_t *pkt, bench_rng64_t *rng) {
  for (int i = 0; i < 6; i++)
    pkt[i] = (uint8_t)(bench_rng_next(rng) & 0xFFu);
  for (int i = 0; i < 6; i++)
    pkt[6 + i] = (uint8_t)(bench_rng_next(rng) & 0xFFu);
  pkt[12] = 0x08;
  pkt[13] = 0x00;
  uint8_t *ip = pkt + 14;
  memset(ip, 0, 20);
  ip[0] = 0x45;
  uint16_t totlen = (uint16_t)40;
  ip[2] = (uint8_t)(totlen >> 8);
  ip[3] = (uint8_t)(totlen & 0xFF);
  uint16_t ipid = (uint16_t)(bench_rng_next(rng) & 0xFFFFu);
  ip[4] = (uint8_t)(ipid >> 8);
  ip[5] = (uint8_t)(ipid & 0xFF);
  ip[6] = 0x00;
  ip[7] = 0x00;
  ip[8] = (uint8_t)(bench_rng_next(rng) & 0xFFu);
  ip[9] = 0x06;
  uint32_t sip = (uint32_t)(bench_rng_next(rng) & 0xFFFFFFFFu);
  uint32_t dip = (uint32_t)(bench_rng_next(rng) & 0xFFFFFFFFu);
  ip[12] = (uint8_t)(sip >> 24);
  ip[13] = (uint8_t)(sip >> 16);
  ip[14] = (uint8_t)(sip >> 8);
  ip[15] = (uint8_t)(sip);
  ip[16] = (uint8_t)(dip >> 24);
  ip[17] = (uint8_t)(dip >> 16);
  ip[18] = (uint8_t)(dip >> 8);
  ip[19] = (uint8_t)(dip);
  ip[10] = 0;
  ip[11] = 0;
  uint16_t cs = ip_checksum16(ip, 20);
  ip[10] = (uint8_t)(cs >> 8);
  ip[11] = (uint8_t)(cs & 0xFF);
  uint8_t *tcp = pkt + 34;
  memset(tcp, 0, 20);
  uint16_t sp = (uint16_t)(bench_rng_next(rng) & 0xFFFFu);
  uint16_t dp = (uint16_t)(bench_rng_next(rng) & 0xFFFFu);
  tcp[0] = (uint8_t)(sp >> 8);
  tcp[1] = (uint8_t)(sp & 0xFF);
  tcp[2] = (uint8_t)(dp >> 8);
  tcp[3] = (uint8_t)(dp & 0xFF);
  uint32_t sq = (uint32_t)(bench_rng_next(rng) & 0xFFFFFFFFu);
  uint32_t aq = (uint32_t)(bench_rng_next(rng) & 0xFFFFFFFFu);
  tcp[4] = (uint8_t)(sq >> 24);
  tcp[5] = (uint8_t)(sq >> 16);
  tcp[6] = (uint8_t)(sq >> 8);
  tcp[7] = (uint8_t)(sq);
  tcp[8] = (uint8_t)(aq >> 24);
  tcp[9] = (uint8_t)(aq >> 16);
  tcp[10] = (uint8_t)(aq >> 8);
  tcp[11] = (uint8_t)(aq);
  tcp[12] = 0x50;
  tcp[13] = 0x18;
  uint16_t win = (uint16_t)(bench_rng_next(rng) & 0xFFFFu);
  tcp[14] = (uint8_t)(win >> 8);
  tcp[15] = (uint8_t)(win & 0xFF);
  tcp[16] = 0;
  tcp[17] = 0;
  tcp[18] = 0;
  tcp[19] = 0;
}
static double pkt_run(int n, const uint8_t *buf) {
  const int PKTLEN = 64;
  double acc0 = 0.0;
  for (int i = 0; i < n; i++) {
    const uint8_t *pkt = buf + (size_t)i * PKTLEN;
    const uint8_t *ip = pkt + 14;
    const uint8_t *tcp = pkt + 34;
    uint16_t oldcs = rd16be(ip + 10);
    uint8_t tmpip[20];
    memcpy(tmpip, ip, 20);
    tmpip[10] = 0;
    tmpip[11] = 0;
    uint16_t newcs = ip_checksum16(tmpip, 20);
    if (newcs == oldcs) {
      uint32_t s = rd32be(ip + 12);
      uint32_t d = rd32be(ip + 16);
      uint32_t sp = rd16be(tcp);
      uint32_t dp = rd16be(tcp + 2);
      acc0 += (double)((s ^ d) ^ ((sp << 16) ^ dp));
    } else {
      acc0 -= 1.0;
    }
  }
  double ans = 0.0;

  ans = acc0;
  return ans;
}
BENCH_MAIN_SCALAR3(
    T004_Module_057, NETPKT, 4096, 16384, 65536,
    uint8_t *buf = (uint8_t *)malloc((size_t)n * 64);
    double ans_scalar = 0.0;
    ,
    {
      bench_rng64_t rng = bench_rng_init(seed);
      for (int i = 0; i < n; i++) {
        make_pkt(buf + (size_t)i * 64, &rng);
      }
    },
    ans_scalar = pkt_run(n, buf), ans_scalar, free(buf);)
