# data/dataset_builder.py
"""
Taskset generation and dataset utilities.
Provides:
 - Task namedtuple
 - generate_random_taskset(...)
 - read_tasks(...) (from file lines "id, period, exectime, deadline")
"""
from typing import List, NamedTuple
import random
from math import floor
import numpy as np

random.seed(0)
np.random.seed(0)

class Task(NamedTuple):
    id: int
    period: int
    exectime: int
    deadline: int

def generate_random_taskset(
    n_tasks: int = 5,
    total_utilization: float = 1.0,
    min_period: int = 5,
    max_period: int = 20,
) -> List[Task]:
    """
    Random UUniFast-like generator that returns a list of Task NamedTuples.
    Ensures total utilization <= total_utilization.
    Periods chosen as multiples of 1 (or 5 if desired).
    """
    while True:
        utils_rng = []
        sum_u = total_utilization
        for i in range(1, n_tasks):
            next_sum = sum_u * (random.random() ** (1.0 / (n_tasks - i)))
            utils_rng.append(sum_u - next_sum)
            sum_u = next_sum
        utils_rng.append(sum_u)
        tasks = []
        for idx, u in enumerate(utils_rng):
            period = random.randint(min_period, max_period)
            exectime = max(1, int(floor(u * period)))
            deadline = period
            tasks.append(Task(id=idx, period=period, exectime=exectime, deadline=deadline))
        util = sum(t.exectime / t.period for t in tasks)
        if util <= total_utilization + 1e-6:
            return tasks

def read_tasks(filename: str):
    """
    Read tasks from file (each line: id, period, exectime, deadline) or (period, exectime, deadline) per line.
    Returns list[Task].
    """
    tasks = []
    with open(filename, "r", encoding="utf-8") as fh:
        for i, line in enumerate(fh):
            line = line.strip()
            if not line or line.startswith("#"):
                continue
            parts = [int(x.strip()) for x in line.split(",")]
            if len(parts) == 4:
                t = Task(id=parts[0], period=parts[1], exectime=parts[2], deadline=parts[3])
            else:
                t = Task(id=i, period=parts[0], exectime=parts[1], deadline=parts[2])
            tasks.append(t)
    return tasks
