# Copyright (c) 2018, Curious AI Ltd. All rights reserved.
#
# This work is licensed under the Creative Commons Attribution-NonCommercial
# 4.0 International License. To view a copy of this license, visit
# http://creativecommons.org/licenses/by-nc/4.0/ or send a letter to
# Creative Commons, PO Box 1866, Mountain View, CA 94042, USA.
"""Functions for ramping hyperparameters up or down

Each function takes the current training step or epoch, and the
ramp length in the same format, and returns a multiplier between
0 and 1.
"""

import numpy as np


def sigmoid_rampup(current, rampup_length):
    """Exponential rampup from https://arxiv.org/abs/1610.02242"""
    if rampup_length == 0:
        return 1.0
    else:
        current = np.clip(current, 0.0, rampup_length)
        phase = 1.0 - current / rampup_length
        return float(np.exp(-5.0 * phase * phase))


def sigmoid_rampdown(current, rampdown_length):
    """Exponential rampdown"""
    if rampdown_length == 0:
        return 1.0
    else:
        current = np.clip(current, 0.0, rampdown_length)
        phase = 1.0 - (rampdown_length - current) / rampdown_length
        return float(np.exp(-12.5 * phase * phase))


def exp_rampup(current, rampup_length):
    """Exponential rampup from https://arxiv.org/abs/1610.02242"""
    if rampup_length == 0:
        return 1.0
    else:
        current = np.clip(current, 0.0, rampup_length)
        phase = current / rampup_length - 1.0
        return float(np.exp(5.0 * phase))


def log_rampup(current, rampup_length):
    """Exponential rampup from https://arxiv.org/abs/1610.02242"""
    if rampup_length == 0:
        return 1.0
    else:
        current = np.clip(current, 0.0, rampup_length)
        phase = current / rampup_length
        return float(1.0 - np.exp(-5.0 * phase))


def linear_rampup(current, rampup_length):
    """Linear rampup"""
    assert current >= 0 and rampup_length >= 0
    if current >= rampup_length:
        lr = 1.0
    else:
        lr = current / rampup_length

    #print (lr)
    return lr


def linear_rampdown(current, rampdown_length):
    """Linear rampup"""
    assert current >= 0 and rampdown_length >= 0
    if current >= rampdown_length:
        return 1.0
    else:
        return 1.0 - current / rampdown_length


def cosine_rampup(current, rampup_length):
    """Cosine rampup"""
    current = np.clip(current, 0.0, rampup_length)
    return float(-.5 * (np.cos(np.pi * current / rampup_length) - 1))


def cosine_rampdown(current, rampdown_length):
    """Cosine rampdown from https://arxiv.org/abs/1608.03983"""
    assert 0 <= current <= rampdown_length
    return float(.5 * (np.cos(np.pi * current / rampdown_length) + 1))


if __name__ == '__main__':
    import matplotlib.pyplot as plt
    import numpy as np

    #x = np.zeros(100)
    #for i in range(100):
    #    x[i]=sigmoid_rampup(i, 50)
    lr_list = []
    """
    def adjust_learning_rate(epoch, step_in_epoch, total_steps_in_epoch):
        lr =0.4
        lr_rampup = 5.0
        initial_lr = 0.1

        lr_rampdown_epochs = 45

        epoch = epoch + step_in_epoch / total_steps_in_epoch

        # LR warm-up to handle large minibatch sizes from https://arxiv.org/abs/1706.02677

        lr = linear_rampup(epoch, lr_rampup) * (lr - initial_lr) + initial_lr

        # Cosine LR rampdown from https://arxiv.org/abs/1608.03983 (but one cycle only)
        if lr_rampdown_epochs:
            assert lr_rampdown_epochs >= epoch
            lr *= cosine_rampdown(epoch, lr_rampdown_epochs)

        return lr

    """
    def adjust_learning_rate(epoch, lr_sch, step_in_epoch,
                             total_steps_in_epoch):

        lr = 0.4
        lr_rampup = 5.0
        initial_lr = 0.1

        epoch = epoch + step_in_epoch / total_steps_in_epoch
        print(epoch)
        # LR warm-up to handle large minibatch sizes from https://arxiv.org/abs/1706.02677
        lr = linear_rampup(epoch, lr_rampup) * (lr - initial_lr) + initial_lr

        lr = lr * (0.1**(epoch // lr_sch))

        return lr

    for epoch in range(20):
        for step_in_epoch in range(5):
            lr_temp = adjust_learning_rate(epoch, 6, step_in_epoch, 5)
            lr_list.append(lr_temp)

    #plt.ylim(1.0)
    plt.plot(np.asarray(lr_list))
    plt.show()
