# tests/test_environment.py
"""
Unit tests for TaskSchedulingEnvironment dynamics (release, deadline, reward).
Run: pytest tests/test_environment.py -q
"""
import pytest
import torch
from data.dataset_builder import Task, generate_random_taskset
from chronoscore.environment import TaskSchedulingEnvironment, IDLE_TASK_ID

def test_env_basic_cycle():
    # create two simple tasks with small periods
    t0 = Task(id=0, period=3, exectime=1, deadline=3)
    t1 = Task(id=1, period=4, exectime=1, deadline=4)
    env = TaskSchedulingEnvironment([t0, t1], n_quanta=2)
    state = env.reset()
    # run one full period L
    total_reward = 0
    for i in range(env.L):
        # pick first available job or idle
        action = env.sample_random_action()
        state, r, done = env.step(action)
        total_reward += r
        if done:
            break
    # reward is finite and env ran
    assert isinstance(total_reward, (int, float))
    assert env.time > 0

def test_quantization_bounds():
    t = Task(id=0, period=10, exectime=2, deadline=10)
    env = TaskSchedulingEnvironment([t], n_quanta=5)
    env.reset()
    # ensure quantized values in state don't exceed max_deadline
    s = env.state
    assert all(isinstance(x, int) for x in s)
