"""
Test script for QMIX agent
──────────────────────────
This script runs the AppleGridMDP environment with a QMIX policy to 
verify that the loaded agent behaves correctly (ε=0 greedy). 
It should be used together with the policy wrapper (`get_policy` / 
`rnn_agent.py`) where the trained QMIX agent is loaded and actions are defined.
"""

import sys
import os
sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))
from src.agents.qmix.get_policy import reset_policy, act
from src.environment.test.apple_grid_qmix import AppleGridMDP


env = AppleGridMDP()
obs = env.reset()
reset_policy()
len_test_timesteps = 10
done = False

for _ in range(len_test_timesteps):
    avail = [env.get_avail_actions_agent(i) for i in range(env.n_agents)] \
            if hasattr(env, "get_avail_actions_agent") else None
    actions = act(obs, avail_actions=avail)   # greedy (ε=0)
    
    env.step(actions)
    obs = env.get_obs()
    env.render()
