import json
from typing import List
from .base import Dataset, Request


class SpecBench(Dataset):

    def __init__(self, path, num_samples=480, **kwargs):
        self.data: List[Request] = [] #list of list of questions.
        self.num_samples = num_samples
        self._preprocess(path)

    def _preprocess(self, path):
        with open(path, "r") as f:
            for l in f.readlines():
                line = json.loads(l)
                self.data.append(Request(question_id=line["question_id"], category=line["category"], system_prompt=None, turns=line['turns']))
        self.data = self.data[:self.num_samples]