import argparse

def parse_args():
    parser = argparse.ArgumentParser(description="PyTorch Training")

    # primary
    parser.add_argument(
        "--configs", type=str, default="./configs/config-cifar10.yml", help="configs file",
    )
    parser.add_argument(
        "--result-dir",
        default="./trained_models",
        type=str,
        help="directory to save results",
    )
    parser.add_argument(
        "--exp-name",
        type=str,
        help="Name of the experiment (creates dir with this name in --result-dir)",
    )

    parser.add_argument(
        "--exp-mode",
        type=str,
        choices=("pretrain",
                 "score_prune", "score_finetune",
                 "rate_prune", "rate_finetune",
                 "harp_prune", "harp_finetune", "harp_finetune_lwm"),
        help="Train networks following one of these methods.",
    )

    # Model
    parser.add_argument("--arch", type=str, help="Model achitecture")
    parser.add_argument(
        "--num-classes",
        type=int,
        default=10,
        help="Number of output classes in the model",
    )
    parser.add_argument(
        "--layer-type", type=str, choices=("dense", "subnet"), help="dense | subnet"
    )
    parser.add_argument(
        "--init_type",
        choices=("kaiming_normal", "kaiming_uniform", "signed_const"),
        help="Which init to use for weight parameters: kaiming_normal | kaiming_uniform | signed_const",
    )
    parser.add_argument(
        "--k_s2ap",
        type=float,
        default=1.0,
        help="Fraction of weight variables to perturb",
    )
    parser.add_argument(
        "--misalign_pert",
        action="store_true",
        default=False,
        help="When true, it misaligns with the sparsity k and perturbs the k_s2ap weights during sparse pruning",
    )

    # Pruning

    parser.add_argument(
        "--k",
        type=float,
        default=1.0,
        help="Fraction of weight variables kept in subnet",
    )

    parser.add_argument(
        "--prune_reg",
        type=str,
        default='weight',
        help="Prune regularity",
    )

    parser.add_argument(
        "--stg_mode",
        type=str,
        default="harp",
        help="Prune strategy mode [harp, random, uniform]",
    )

    parser.add_argument(
        "--stg_id",
        type=str,
        default="010_0",
        help="Prune rate in conv_subnet",
    )

    parser.add_argument(
        "--conv_k",
        type=list,
        default=[1.0],
        help="Prune rate in conv_subnet",
    )

    parser.add_argument(
        "--shortcut_k",
        type=list,
        default=[1.0],
        help="Prune rate in conv_subnet",
    )

    parser.add_argument(
        "--fc_k",
        type=list,
        default=[1.0],
        help="Prune rate in subnet",
    )

    parser.add_argument(
        "--scaled-score-init",
        action="store_true",
        default=False,
        help="Init importance scores proportaional to weights (default kaiming init)",
    )

    parser.add_argument(
        "--save_mask",
        action="store_true",
        default=False,
        help="Save only mask and interrupt process when doing LWM",
    )

    parser.add_argument(
        "--perturb_weights",
        action="store_true",
        default=False,
        help="While pruning, perturbs the freezed weights instead of the scores if true",
    )

    parser.add_argument(
        "--save_mask_path",
        type=str,
        default=None,
        help="Path where to save the mask.",
    )
    parser.add_argument(
        "--rate-stg-init",
        action="store_true",
        default=False,
        help="Init weight with SoTA strategy",
    )

    parser.add_argument(
        "--freeze-bn",
        action="store_true",
        default=False,
        help="freeze batch-norm parameters in pruning",
    )

    parser.add_argument(
        "--source-net",
        type=str,
        default="",
        help="Checkpoint which will be pruned/fine-tuned",
    )

    parser.add_argument(
        "--scores_init_type",
        choices=("kaiming_normal", "kaiming_uniform", "xavier_uniform", "xavier_normal"),
        help="Which init to use for relevance scores",
    )

    # Data
    parser.add_argument(
        "--dataset",
        type=str,
        choices=("CIFAR10", "CIFAR100", "SVHN", "MNIST", "imagenet"),
        help="Dataset for training and eval",
    )
    parser.add_argument(
        "--batch-size",
        type=int,
        default=128,
        metavar="N",
        help="input batch size for training (default: 128)",
    )
    parser.add_argument(
        "--test-batch-size",
        type=int,
        default=128,
        metavar="N",
        help="input batch size for testing (default: 128)",
    )
    parser.add_argument(
        "--normalize",
        action="store_true",
        default=False,
        help="whether to normalize the data",
    )
    parser.add_argument(
        "--sparse_s2ap",
        action="store_true",
        default=False,
        help="whether to apply sparse or dense s2ap",
    )
    parser.add_argument(
        "--data-dir", type=str, default="./datasets", help="path to datasets"
    )

    parser.add_argument(
        "--mean", type=tuple, default=(0, 0, 0), help="Mean for data normalization"
    )
    parser.add_argument(
        "--std", type=tuple, default=(1, 1, 1), help="Std for data normalization"
    )

    parser.add_argument(
        "--data-fraction",
        type=float,
        default=1.0,
        help="Fraction of images used from training set",
    )

    # Training
    parser.add_argument(
        "--trainer",
        type=str,
        default="base",
        choices=("base", "adv", "s2ap", "freeadv", "fat", "fat_s2ap"),
        help="Natural (base) or adversarial or verifiable training",
    )
    parser.add_argument(
        "--adv_loss",
        type=str,
        default="pgd",
        choices=("pgd", "trades", "mart", "nat"),
        help="Adversarial training loss",
    )
    parser.add_argument(
        "--soft_hw",
        action='store_true',
        help="Activate soft HW Flops control",
    )
    parser.add_argument(
        "--gamma",
        type=float,
        default=1.0,
        help="regularization for HW Flops control",
    )
    parser.add_argument(
        "--alpha",
        type=float,
        default=0.1,
        help="control compression rate lower bound: rate_min = k * alpha",
    )
    parser.add_argument(
        "--gamma_dynamic",
        action="store_true",
        default=True,
        help="Dynamic HW-Loss regularization",
    )
    parser.add_argument(
        "--eigenvalues",
        action="store_true",
        default=False,
        help="Computes the eigenvalues at each iteration if true",
    )

    parser.add_argument(
        "--hamming",
        action="store_true",
        default=False,
        help="Saves the mask and computes the hamming distance if true",
    )

    parser.add_argument(
        "--epochs", type=int, default=100, metavar="N", help="number of epochs to train"
    )
    parser.add_argument(
        "--optimizer", type=str, default="sgd", choices=("sgd", "adam", "rmsprop")
    )
    parser.add_argument("--wd", default=1e-4, type=float, help="Weight decay")
    parser.add_argument("--lr", type=float, default=0.1, help="learning rate")
    parser.add_argument(
        "--lr-schedule",
        type=str,
        default="cosine",
        choices=("step", "cosine"),
        help="Learning rate schedule",
    )
    parser.add_argument("--momentum", type=float, default=0.9, help="SGD momentum")
    parser.add_argument(
        "--warmup-epochs", type=int, default=0, help="Number of warmup epochs"
    )
    parser.add_argument(
        "--warmup-loss",
        type=str,
        default="nat",
        choices=("fgsm", "nat", "pgd", "trades"),
        help="adversarial loss that used for warmup"
    )
    parser.add_argument(
        "--warmup-lr", type=float, default=0.1, help="warmup learning rate"
    )
    parser.add_argument(
        "--save-dense",
        action="store_true",
        default=False,
        help="Save dense model alongwith subnets.",
    )

    # Free-adv training (only for imagenet)
    parser.add_argument(
        "--n-repeats",
        type=int,
        default=4,
        help="--number of repeats in free-adv training",
    )

    # Adversarial attacks
    parser.add_argument("--attack_eval", default="pgd", type=str, help="whitebox attack for evaluation", choices=("pgd", "fgsm", "cw"))
    parser.add_argument("--epsilon", default=8.0 / 255, type=float, help="perturbation")
    parser.add_argument(
        "--num-steps", default=10, type=int, help="perturb number of steps"
    )
    parser.add_argument(
        "--step-size", default=2.0 / 255, type=float, help="perturb step size"
    )
    parser.add_argument("--clip-min", default=0, type=float, help="perturb step size")
    parser.add_argument("--clip-max", default=1.0, type=float, help="perturb step size")
    parser.add_argument(
        "--distance",
        type=str,
        default="l_inf",
        choices=("l_inf", "l_2"),
        help="attack distance metric",
    )
    parser.add_argument(
        "--const-init",
        action="store_true",
        default=False,
        help="use random initialization of epsilon for attacks",
    )
    parser.add_argument(
        "--beta",
        default=6.0,
        type=float,
        help="regularization, i.e., 1/lambda in TRADES",
    )

    # Evaluate
    parser.add_argument(
        "--evaluate", action="store_true", default=False, help="Evaluate model"
    )

    parser.add_argument(
        "--val_method",
        type=str,
        default="base",
        choices=("base", "adv", "freeadv"),
        help="base: evaluation on unmodified inputs | adv: evaluate on adversarial inputs",
    )

    # Restart
    parser.add_argument(
        "--start-epoch",
        type=int,
        default=0,
        help="manual start epoch (useful in restarts)",
    )
    parser.add_argument(
        "--resume",
        type=str,
        default="",
        help="path to latest checkpoint (default:None)",
    )

    # Additional
    parser.add_argument(
        "--gpu", type=str, default="0", help="Comma separated list of GPU ids"
    )
    parser.add_argument(
        "--no-cuda", action="store_true", default=False, help="disables CUDA training"
    )
    parser.add_argument("--seed", type=int, default=1234, help="random seed")
    parser.add_argument(
        "--print-freq",
        type=int,
        default=100,
        help="Number of batches to wait before printing training logs",
    )

    parser.add_argument(
        "--schedule_length",
        type=int,
        default=0,
        help="Number of epochs to schedule the training epsilon.",
    )
    
    # s2ap 
    parser.add_argument('--s2ap-gamma', default=0.01, type=float,
                    help='whether or not to add parametric noise') 
    
    parser.add_argument('--s2ap-warmup', default=10, type=int,
                    help='We could apply s2ap after some epochs for accelerating.') 
    
    # swa 
    parser.add_argument(
        "--swa", action="store_true", default=False, help="if True indicates a robustbench model"
    )
    parser.add_argument(
        "--tau",         
        type=float,
        default=0.995,
        help="Fraction of weight variables kept in subnet",
    )
    
    # semisup data
    parser.add_argument(
        "--is-semisup",
        action="store_true",
        default=False,
        help="Use semisupervised training",
    )

    parser.add_argument(
        "--semisup-data",
        type=str,
        choices=("tinyimages", "splitgan"),
        help="Name for semi-supervision dataset",
    )

    parser.add_argument(
        "--semisup-fraction",
        type=float,
        default=1.0,
        help="Fraction of images used in training from semisup dataset",
    )
    
    return parser.parse_args()
