"""Train/evaluate/Plot in Plants watering environments"""
import gymnasium as gym
import os
import hydra
from omegaconf import DictConfig

from src.actor import MonEpsilonGreedyOneAction
from src.critic import MonQCNN, MonRoomCNN
from src.experiment import MonExperiment
from src.wrappers.env_wrappers import WallObs, WindowViewObs, MultiChannel
from src.wrappers.monitor_wrappers import BinaryMonitor, RoomMonitor

EVAL = False
LOG_DIR = "models/9_9/Plants/reward_model/env_0.0/eps_1.0/q_lr_1.0/reward_lr_1.0/"


@hydra.main(version_base=None, config_path="configs", config_name="default")
def run_monitor(cfg: DictConfig) -> None:
    """Run env"""

    q_lr, reward_lr, eps = cfg.agent.critic.lr, cfg.agent.critic.reward_model.lr, cfg.agent.actor.init_eps
    dry, window_size = cfg.environment.plants_dryness_prob, cfg.environment.window_size
    eps_decay = cfg.agent.actor.eps_decay
    train_dir = "general_models/Plants/" + "/" + str(cfg.agent.critic.strategy) + "/10_10_channel/dry_{}/".format(dry)
    agent_start_pos = None if cfg.monitor.id == "RoomMonitor" else cfg.environment.agent_start_pos
    if cfg.monitor.id == "RoomMonitor":
        train_dir += "3_room/"
    train_dir += "/window_{}/eps_decay_{}/q_lr_{}/reward_lr_{}/".format(window_size, eps_decay, q_lr, reward_lr)
    os.makedirs(train_dir, exist_ok=True)

    env = gym.make(
        cfg.environment.id,
        grid_size=cfg.environment.grid_size,
        n_plants=cfg.environment.n_plants,
        plants_dryness_prob=cfg.environment.plants_dryness_prob,
        dry_difference=cfg.environment.dry_difference,
        agent_start_pos=agent_start_pos,
        max_episode_steps=cfg.environment.max_episode_steps,
        add_new_plants=cfg.environment.add_new_plants,
        add_more_plants=cfg.environment.add_more_plants,
    )
    env = WallObs(env, grid_size=cfg.environment.grid_size, n_walls=cfg.environment.n_walls)
    env = WindowViewObs(env, window_size=cfg.environment.window_size)
    env = MultiChannel(env, normalize_obs=True)

    if cfg.monitor.id == "RoomMonitor":
        env = RoomMonitor(env, full_monitor=False, **cfg.monitor)
        critic = MonRoomCNN(
            cfg.environment.id,
            env.observation_space,
            env.action_space,
            dir_name=train_dir,
            **cfg.agent.critic,
        )
    else:
        env = BinaryMonitor(env, full_monitor=False, **cfg.monitor)
        critic = MonQCNN(
            cfg.environment.id,
            env.observation_space,
            env.action_space,
            dir_name=train_dir,
            **cfg.agent.critic,
        )

    actor = MonEpsilonGreedyOneAction(critic, train=not EVAL, **cfg.agent.actor)
    experiment = MonExperiment(
        env,
        actor,
        critic,
        log_dir=LOG_DIR if EVAL else train_dir,
        replay_buffer=True,
        **cfg.experiment,
    )
    experiment.train()


if __name__ == "__main__":
    run_monitor()
