import argparse

import numpy as np


def get_config():
    parser = argparse.ArgumentParser(
        description='onpolicy', formatter_class=argparse.RawDescriptionHelpFormatter)

    # env parameters
    parser.add_argument("--env_name", type=str, required=True, help="specify the name of environment")
    parser.add_argument('--task_name', type=str, required=True, help="Which task to run on")

    parser.add_argument("--algorithm_name", type=str, default='smac',
                        choices=["smac", "actor-critic", "actor-critic-sgd", "actor-critic-npg", "ac-kfac"])

    parser.add_argument("--seed", type=int, default=int(np.random.choice(65536, replace=False, size=1)),
                        help="Random seed for numpy/torch")
    parser.add_argument("--cuda", action='store_false', default=True,
                        help="by default True, will use GPU to train; or else will use CPU;")
    parser.add_argument("--cuda_deterministic",
                        action='store_false', default=True,
                        help="by default, make sure random seed effective. if set, bypass such function.")
    parser.add_argument("--n_training_threads", type=int,
                        default=1, help="Number of torch threads for training")
    parser.add_argument("--num_env_steps", type=int, default=10e6,
                        help='Number of environment steps to train (default: 10e6)')
    parser.add_argument("--add", type=str, default="")

    parser.add_argument("--online_update", default=False, action='store_true')
    parser.add_argument("--ief", default=False, action='store_true')
    parser.add_argument("--damping_factor", type=float, default=0.1)
    parser.add_argument("--matrix_free", default=False, action='store_true')

    # replay buffer parameters
    parser.add_argument("--episode_length", type=int,
                        default=500, help="Max length for any episode")

    # network parameters
    parser.add_argument("--hidden_size", nargs='*', type=int, default=[64],
                        help="Dimension of hidden layers for actor/critic networks")
    parser.add_argument("--activation", type=str,
                        default='tanh', choices=["relu", "tanh", "sigmoid"])

    # optimizer parameters
    parser.add_argument("--optimizer", type=str, default="adam", choices=["sgd", "adam"])
    parser.add_argument("--lr", type=float, default=5e-4,
                        help='learning rate (default: 5e-4)')
    parser.add_argument("--critic_lr", type=float, default=5e-4,
                        help='critic learning rate (default: 5e-4)')
    parser.add_argument("--opti_eps", type=float, default=1e-5,
                        help='RMSprop optimizer epsilon (default: 1e-5)')
    parser.add_argument("--weight_decay", type=float, default=0.001)

    parser.add_argument("--batch_size", type=int, default=None)
    parser.add_argument("--gamma", type=float, default=0.99,
                        help='discount factor for rewards (default: 0.99)')
    parser.add_argument("--use_value_active_masks",
                        action='store_false', default=True,
                        help="by default True, whether to mask useless data in value loss.")
    parser.add_argument("--use_policy_active_masks",
                        action='store_false', default=True,
                        help="by default True, whether to mask useless data in policy loss.")

    parser.add_argument("--max_grad_norm", type=float, default=0.0,
                        help='max norm of gradients (default: 0.0)')

    parser.add_argument("--entropy_coeff", type=float, default=0.0)

    # GAE parameters
    parser.add_argument("--tau", type=float, default=0.9)

    # KFAC parameters
    parser.add_argument("--kfac_damping", type=float, default=0.001)
    parser.add_argument("--kfac_factor_decay", type=float, default=0.99)
    parser.add_argument("--kfac_kl_clip", type=float, default=0.001)
    parser.add_argument("--kfac_update_freq", type=float, default=1)

    parser.add_argument("--env_steps_before_update", type=int, default=0,
                        help='env steps before update (0 == one full trajectory')

    parser.add_argument("--use_linear_lr_decay", action='store_true',
                        default=False, help='use a linear schedule on the learning rate')
    parser.add_argument("--use_critic_linear_lr_decay", action='store_true',
                        default=False, help='use a linear schedule on the learning rate')
    # save parameters
    parser.add_argument("--save_interval", type=int, default=10,
                        help="time duration between contiunous twice models saving.")

    # log parameters
    parser.add_argument("--log_interval", type=int, default=3,
                        help="time duration between contiunous twice log printing.")
    parser.add_argument("--no_wandb", action='store_false', dest='use_wandb', default=True)

    return parser
