###
# Imports
###
import sys
import os
import time

sys.path.append(os.getcwd())

from src.log import LogFile
from src.utils.args import get_args
from src.envs.MazeEnv import load_default_scenario

###
# Setting the environment
###
# Collect the run options, then load the default scenario for the requested
# agent type and scenario id with display disabled.
args = get_args()
env, scenario_id = load_default_scenario(
    args.atype,
    scenario_id=args.id,
    display=False,
)

###
# ADLEAP-MAS MAIN ROUTINE
###
# Column titles handed to the log file.
header = [
    'Iteration',
    'Reward',
    'Time to reason',
    'N Rollouts',
    'N Simulations',
]

# Reset the environment to obtain the first state and fetch the ad-hoc agent.
state = env.reset()
agent = env.get_adhoc_agent()

# Log file for this run, identified by scenario, agent type and experiment
# number.
log = LogFile('MazeEnv', scenario_id, args.atype, args.exp_num, header)

# Upper bound on env.episode: the loop stops once it is reached, even if the
# environment has not reported `done`.
MAX_EPISODES = 200
done = False
try:
    while not done and env.episode < MAX_EPISODES:
        # 1. Importing agent method
        agent = env.get_adhoc_agent()
        method = env.import_method(agent.type)

        # 2. Reasoning about next action and target
        # perf_counter() is monotonic, so the measured interval cannot be
        # skewed by system clock adjustments the way time.time() can.
        start = time.perf_counter()
        agent.next_action, _ = method(state, agent)
        end = time.perf_counter()

        # 3. Taking a step in the environment
        state, reward, done, info = env.step(agent.next_action)

        # One log record per step: episode counter, step reward, reasoning
        # time in seconds, and the agent's rollout/simulation counters.
        data = {
            'it': env.episode,
            'reward': reward,
            'time': end - start,
            'nrollout': agent.smart_parameters['count']['nrollouts'],
            'nsimulation': agent.smart_parameters['count']['nsimulations'],
        }
        log.write(data)
finally:
    # Always release the environment, including when reasoning, stepping or
    # logging raises; the exception still propagates afterwards.
    env.close()
###
# THE END - That's all folks :)
###