import argparse
from functools import wraps
from typing import Callable, List


def output_added_arguments(add_algo_arguments: Callable) -> Callable:
    """Decorate an argument-registering function so it reports what it added.

    The wrapped function is called for its side effect on the parser; its own
    return value is discarded. The decorated function instead returns the
    long option names that were not registered on the parser before the call.

    Args:
        add_algo_arguments: Function taking an ``argparse.ArgumentParser`` and
            registering options on it.

    Returns:
        A function with the same single ``parser`` parameter that returns the
        newly added long option names (``--name`` form only, short flags are
        skipped), in registration order, without their leading dashes.
        ``--help`` is never reported.
    """

    @wraps(add_algo_arguments)
    def decorated(parser: argparse.ArgumentParser) -> List[str]:
        # Snapshot the option strings known before the call. A set keeps the
        # membership test below O(1) per option.
        known_before = set(parser._option_string_actions)

        add_algo_arguments(parser)

        # The mapping is a dict, so iterating it yields option strings in the
        # order they were registered.
        return [
            # Only strip the leading dashes: a trailing dash is part of the
            # option name and must not be removed.
            option.lstrip("-")
            for option in parser._option_string_actions
            if option not in known_before
            and option.startswith("--")
            and option != "--help"
        ]

    return decorated


@output_added_arguments
def add_base_arguments(parser: argparse.ArgumentParser):
    """Register the base experiment options on ``parser``.

    Adds the required experiment name and seed, the wandb toggle, and the
    network / replay-buffer / optimisation settings listed below. Because of
    the ``output_added_arguments`` decorator, calling this function returns
    the long names of the options it added.

    Args:
        parser: Parser to which the options are added in place.
    """
    # Required identification of the run.
    parser.add_argument(
        "-en",
        "--experiment_name",
        help="Experiment name.",
        type=str,
        required=True,
    )
    parser.add_argument(
        "-s",
        "--seed",
        help="Seed of the experiment.",
        type=int,
        required=True,
    )
    parser.add_argument(
        "-dw",
        "--disable_wandb",
        help="Disable wandb.",
        default=False,
        action="store_true",
    )
    # Zero or more integers; falls back to [200, 200] when the flag is absent.
    parser.add_argument(
        "-f",
        "--features",
        nargs="*",
        help="List of features for the Q-networks.",
        type=int,
        default=[200, 200],
    )
    parser.add_argument(
        "-rbc",
        "--replay_buffer_capacity",
        help="Replay Buffer capacity.",
        type=int,
        default=10_000,
    )
    parser.add_argument(
        "-bs",
        "--batch_size",
        help="Batch size for training.",
        type=int,
        default=32,
    )
    parser.add_argument(
        "-n",
        "--update_horizon",
        help="Value of n in n-step TD update.",
        type=int,
        default=1,
    )
    parser.add_argument(
        "-gamma",
        "--gamma",
        help="Discounting factor.",
        type=float,
        default=0.99,
    )
    parser.add_argument(
        "-lr",
        "--learning_rate",
        help="Learning rate.",
        type=float,
        default=3e-4,
    )
    parser.add_argument(
        "-ae",
        "--adam_eps",
        help="Epsilon in Adam.",
        type=float,
        default=1.5e-4,
    )
    parser.add_argument(
        "-horizon",
        "--horizon",
        help="Horizon for truncation.",
        type=int,
        default=1000,
    )
    parser.add_argument(
        "-at",
        "--architecture_type",
        help="Type of architecture.",
        type=str,
        default="fc",
        choices=["cnn", "impala", "fc"],
    )
    parser.add_argument(
        "-tf",
        "--target_function",
        help="Type of target function to use.",
        type=str,
        default="default",
        choices=[
            "default",
            "online",
            "min",
            "max",
            "mean",
            "random",
        ],
    )
    parser.add_argument(
        "-ln",
        "--layer_norm",
        help="Add Layer Norm to architecture.",
        default=False,
        action="store_true",
    )


@output_added_arguments
def add_dqn_arguments(parser: argparse.ArgumentParser):
    """Register the DQN training options on ``parser``.

    Covers the number of epochs, training steps per epoch, data collected per
    update, target update frequency, initial samples, and the epsilon
    schedule. Through the ``output_added_arguments`` decorator, a call
    returns the long names of the options that were added.

    Args:
        parser: Parser to which the options are added in place.
    """
    # Each entry is (option strings, keyword settings); they are registered in
    # the order listed.
    option_specs = (
        (
            ("-ne", "--n_epochs"),
            {"help": "Number of epochs to perform.", "type": int, "default": 50},
        ),
        (
            ("-ntspe", "--n_training_steps_per_epoch"),
            {
                "help": "Number of training steps per epoch.",
                "type": int,
                "default": 10_000,
            },
        ),
        (
            ("-dtu", "--data_to_update"),
            {
                "help": "Number of data points to collect per online Q-network update.",
                "type": float,
                "default": 1,
            },
        ),
        (
            ("-tuf", "--target_update_frequency"),
            {
                "help": "Number of training steps before updating the target Q-network.",
                "type": int,
                "default": 200,
            },
        ),
        (
            ("-nis", "--n_initial_samples"),
            {
                "help": "Number of initial samples before the training starts.",
                "type": int,
                "default": 1_000,
            },
        ),
        (
            ("-ee", "--epsilon_end"),
            {
                "help": "Ending value for the linear decaying epsilon used for exploration.",
                "type": float,
                "default": 0.01,
            },
        ),
        (
            ("-ed", "--epsilon_duration"),
            {
                "help": "Duration of epsilon's linear decay used for exploration.",
                "type": float,
                "default": 1_000,
            },
        ),
    )

    for option_strings, settings in option_specs:
        parser.add_argument(*option_strings, **settings)


@output_added_arguments
def add_doubledqn_arguments(parser: argparse.ArgumentParser):
    """Register the Double DQN options, which are exactly the DQN options.

    Args:
        parser: Parser to which the options are added in place.
    """
    dqn_option_names = add_dqn_arguments(parser)
    return dqn_option_names


@output_added_arguments
def add_iqn_arguments(parser: argparse.ArgumentParser):
    """Register the IQN options, which are exactly the DQN options.

    Args:
        parser: Parser to which the options are added in place.
    """
    dqn_option_names = add_dqn_arguments(parser)
    return dqn_option_names


@output_added_arguments
def add_frdqn_arguments(parser: argparse.ArgumentParser):
    """Register the FRDQN options: ``--kappa`` followed by the DQN options.

    Args:
        parser: Parser to which the options are added in place.
    """
    kappa_settings = {
        "help": "Weight for functional regularizer in FRDQN.",
        "type": float,
        "default": 1.0,
    }
    parser.add_argument("-k", "--kappa", **kappa_settings)

    # The algorithm-specific option is registered first, then the DQN ones.
    return add_dqn_arguments(parser)


@output_added_arguments
def add_scdqn_arguments(parser: argparse.ArgumentParser):
    """Register the ScDQN options: ``--beta`` followed by the DQN options.

    Args:
        parser: Parser to which the options are added in place.
    """
    beta_settings = {
        "help": "Weight for correcting term in ScDQN.",
        "type": float,
        "default": 3.0,
    }
    parser.add_argument("-b", "--beta", **beta_settings)

    # The algorithm-specific option is registered first, then the DQN ones.
    return add_dqn_arguments(parser)


@output_added_arguments
def add_maxmindqn_arguments(parser: argparse.ArgumentParser):
    """Register the MaxMinDQN options: ``--n_qs`` followed by the DQN options.

    Args:
        parser: Parser to which the options are added in place.
    """
    n_qs_settings = {
        "help": "Number of Q-networks in MaxMinDQN.",
        "type": int,
        "default": 2,
    }
    parser.add_argument("-n_qs", "--n_qs", **n_qs_settings)

    # The algorithm-specific option is registered first, then the DQN ones.
    return add_dqn_arguments(parser)
