"""
KernelBench Dataset Definition.

This module defines the operator dataset for KernelBench benchmarks.
Each operator has a category (for few-shot example selection) and a level.

Levels:
- level1: Basic operators (matmul, activation, pooling, normalization, etc.)
- level2: Fused operators (Conv+BN+ReLU, Matmul+GELU, etc.)
- level3: Architecture components (ResNet, VGG, Transformer blocks, etc.)
- level4: Complete HuggingFace models (GPT2, BART, etc.)
"""

import json
import os

# Category to example operator mapping (for few-shot learning)
# These map to existing AscendC few-shot examples in /prompts/ascendc_new_model_*.py
# Available examples: add, leaky_relu, matmul_add, mse_loss, reduce_sum, sigmoid
category2exampleop = {
    "matmul": "matmul_add",        # matmul + bias fusion
    "activation": "leaky_relu",    # activation function
    "normalization": "reduce_sum", # reduction-based (layer_norm removed)
    "pooling": "reduce_sum",       # pooling is reduction-like
    "reduce": "reduce_sum",        # direct match
    "convolution": "matmul_add",   # heavy compute pattern
    "loss": "mse_loss",            # loss function
    "fuse": "matmul_add",          # fused ops
    "arch": "matmul_add",          # complex architecture
    "transformer": "matmul_add",   # transformer blocks
}

# KernelBench dataset with category and level info
# Loaded from dataset.json which contains normalized and PascalCase names
_dataset_path = os.path.join(os.path.dirname(__file__), "dataset.json")

if not os.path.exists(_dataset_path):
    raise FileNotFoundError(
        f"KernelBench dataset not found at {_dataset_path}. "
        "The op_eval package requires dataset.json to load operator metadata."
    )

try:
    with open(_dataset_path, "r") as _f:
        dataset = json.load(_f)
except Exception as exc:
    raise RuntimeError(
        f"Failed to load KernelBench dataset from {_dataset_path}: {exc}"
    ) from exc
