# Debug config for quick testing.
from pathlib import Path

from tame.agents.simple_ppo3 import Agent, Args
from tame.envs.mpe_simple_spread import Env

# NOTE(review): presumably the maximum number of timesteps (per episode?) —
# the consumer is not visible in this file; confirm before relying on it.
MAX_TS: int = 200

# Arguments for the simple_ppo3 agent used by this debug configuration.
# The grouping below is for readability only; the meaning of each field is
# defined by `Args` in tame.agents.simple_ppo3 (not visible from this file).
agent_args = Args(
    # --- run control ---
    total_timesteps=50_000,
    cuda=0,  # NOTE(review): int rather than bool — presumably a device index; confirm
    seed=42,
    verbose=True,
    # --- per-level frequencies (top / mid / bottom) ---
    freq_top=2,
    freq_mid=2,
    freq_bottom=1,
    # --- feature toggles ---
    learn_comm=True,
    learn_proxy=True,
    save_all_trace=True,
    # --- optimisation hyperparameters ---
    learning_rate=3e-3,
    gamma=0.99,
    batch_size=512,
    num_minibatches=4,
    clip_coef=0.2,
    ent_coef=0.0,
    # --- communication ---
    comm_size=8,
)

# Experiment-level settings for the debug run.
TOTAL_AGENTS: int = 4
EVAL_RUNS: int = 3

# Relative path: it resolves against the working directory of the process
# that uses this config.
SAVE_PATH: Path = Path("./debug_exps")

# Run identifier that embeds the agent count and the seed from `agent_args`.
RUN_NAME: str = f"simple_ppo3_debug__a{TOTAL_AGENTS}_s{agent_args.seed}"

# NOTE(review): presumably switches between training and evaluation-only
# runs — the consumer is not visible here; confirm.
TRAIN: bool = True
