import torch
import sys
import os

from find_high_accuracy_path_v2.find_parameters import ParameterMove, ParameterTrain, ParameterRebuildNorm, ParameterGeneral
from find_high_accuracy_path_v2.runtime_parameters import RuntimeParameters

sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from py_src.ml_setup import MlSetup

model_name = 'regnet_x_200mf'

def get_parameter_general(runtime_parameter: RuntimeParameters, ml_setup: MlSetup):
    output = ParameterGeneral()
    if ml_setup.model_name == model_name:
        output.max_tick = 58 * 300
        output.dataloader_worker = 8
        output.test_dataset_use_whole = True
    else:
        raise NotImplemented
    return output

def get_parameter_move(runtime_parameter: RuntimeParameters, ml_setup: MlSetup):
    output = ParameterMove()
    test_weights_keyword = ['running_mean', 'running_var', 'num_batches_tracked']
    phase_time = 300
    adoptive_step_size = 0.003
    ratio_step_size = 0.003
    layer_1_0 = 'layer1.0.'
    layer_2_0 = 'layer2.0.'
    layer_3_0 = 'layer3.0.'
    layer_3_1 = 'layer3.1.'
    layer_3_2 = 'layer3.2.'
    layer_3_3 = 'layer3.3.'
    layer_4_0 = 'layer4.0.'
    layer_4_1 = 'layer4.1.'
    layer_4_2 = 'layer4.2.'
    layer_4_3 = 'layer4.3.'
    layer_4_4 = 'layer4.4.'
    layer_4_5 = 'layer4.5.'
    layer_4_6 = 'layer4.6.'
    layer1 = ['conv1', 'bn1']
    layer2 = ['conv2', 'bn2']
    layer3 = ['conv3', 'bn3']
    layer4 = ['shortcut']
    def get_ignore_layer_list(operate_on_layer, layer_type):
        if layer_type == 1:
            return [f"{operate_on_layer}{i}" for i in layer2] + [f"{operate_on_layer}{i}" for i in layer3] + [f"{operate_on_layer}{i}" for i in layer4]
        if layer_type == 2:
            return [f"{operate_on_layer}{i}" for i in layer3] + [f"{operate_on_layer}{i}" for i in layer4]
        if layer_type == 3:
            return [f"{operate_on_layer}{i}" for i in layer4]
        if layer_type == 4:
            return []
        raise NotImplemented

    if ml_setup.model_name == model_name:
        if runtime_parameter.current_tick == 0:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = ['layer1', 'layer2', 'layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_1_0
        elif runtime_parameter.current_tick == phase_time * 1:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_1_0, 1) + ['layer2', 'layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 2:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_1_0, 2) + ['layer2', 'layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 3:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_1_0, 3) + ['layer2', 'layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 4:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_1_0, 4) + ['layer2', 'layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        
        # layer_2_0
        elif runtime_parameter.current_tick == phase_time * 5:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_2_0, 1) + ['layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 6:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_2_0, 2) + ['layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 7:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_2_0, 3) + ['layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 8:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_2_0, 4) + ['layer3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        
        # layer_3_0
        elif runtime_parameter.current_tick == phase_time * 9:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_0, 1) + ['layer3.1','layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 10:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_0, 2) + ['layer3.1','layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 11:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_0, 3) + ['layer3.1','layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 12:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_0, 4) + ['layer3.1','layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        
        # layer_3_1
        elif runtime_parameter.current_tick == phase_time * 13:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_1, 1) + ['layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 14:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_1, 2) + ['layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 15:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_1, 3) + ['layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 16:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_1, 4) + ['layer3.2','layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_3_2
        elif runtime_parameter.current_tick == phase_time * 17:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_2, 1) + ['layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 18:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_2, 2) + ['layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 19:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_2, 3) + ['layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 20:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_2, 4) + ['layer3.3', 'layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        
        # layer_3_3
        elif runtime_parameter.current_tick == phase_time * 21:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_3, 1) + ['layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 22:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_3, 2) + ['layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 23:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_3, 3) + ['layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 24:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_3_3, 4) + ['layer4', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_4_0
        elif runtime_parameter.current_tick == phase_time * 25:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_0, 1) + ['layer4.1', 'layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 26:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_0, 2) + ['layer4.1', 'layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 27:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_0, 3) + ['layer4.1', 'layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 28:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_0, 4) + ['layer4.1', 'layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_4_1
        elif runtime_parameter.current_tick == phase_time * 29:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_1, 1) + ['layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 30:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_1, 2) + ['layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 31:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_1, 3) + ['layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 32:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_1, 4) + ['layer4.2', 'layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_4_2
        elif runtime_parameter.current_tick == phase_time * 33:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_2, 1) + ['layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 34:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_2, 2) + ['layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 35:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_2, 3) + ['layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 36:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_2, 4) + ['layer4.3', 'layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_4_3
        elif runtime_parameter.current_tick == phase_time * 37:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_3, 1) + ['layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 38:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_3, 2) + ['layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 39:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_3, 3) + ['layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 40:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_3, 4) + ['layer4.4', 'layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        
        # layer_4_4
        elif runtime_parameter.current_tick == phase_time * 41:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_4, 1) + ['layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 42:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_4, 2) + ['layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 43:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_4, 3) + ['layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 44:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_4, 4) + ['layer4.5', 'layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_4_5
        elif runtime_parameter.current_tick == phase_time * 45:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_5, 1) + ['layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 46:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_5, 2) + ['layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 47:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_5, 3) + ['layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 48:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_5, 4) + ['layer4.6', 'linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # layer_4_6
        elif runtime_parameter.current_tick == phase_time * 49:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_6, 1) + ['linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 50:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_6, 2) + ['linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 51:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_6, 3) + ['linear'] + test_weights_keyword
            output.merge_bias_with_weights = False
        elif runtime_parameter.current_tick == phase_time * 52:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = get_ignore_layer_list(layer_4_6, 4) + ['linear'] + test_weights_keyword
            output.merge_bias_with_weights = False

        # linear
        elif runtime_parameter.current_tick == phase_time * 53:
            output.step_size = 0
            output.adoptive_step_size = adoptive_step_size
            output.ratio_step_size = ratio_step_size
            output.layer_skip_move = []
            output.layer_skip_move_keyword = [] + test_weights_keyword
            output.merge_bias_with_weights = False
        else:
            return None
    else:
        raise NotImplemented
    return output


def get_parameter_train(runtime_parameter: RuntimeParameters, ml_setup: MlSetup):
    output = ParameterTrain()
    if ml_setup.model_name == model_name:
        if runtime_parameter.current_tick == 0:
            output.train_for_max_rounds = 1000
            output.train_for_min_rounds = 100
            output.train_until_loss = 0.1
            output.pretrain_optimizer = False
            output.load_existing_optimizer = False
        else:
            return None
    else:
        raise NotImplemented
    return output

def get_optimizer_train(runtime_parameter: RuntimeParameters, ml_setup: MlSetup, model_parameter):
    if ml_setup.model_name == model_name:
        if runtime_parameter.current_tick == 0:
            # optimizer = torch.optim.SGD(model_parameter, lr=0.001)
            base_lr = 0.001
            optimizer = torch.optim.SGD(
                [{'params': param, 'lr': base_lr} for param in model_parameter]
            )
        else:
            return None
    else:
        raise NotImplemented
    return optimizer

def get_parameter_rebuild_norm(runtime_parameter: RuntimeParameters, ml_setup: MlSetup):
    output = ParameterRebuildNorm()
    if ml_setup.model_name == model_name:
        if runtime_parameter.current_tick == 0:
            output.rebuild_norm_for_max_rounds = 0
            output.rebuild_norm_for_min_rounds = 0
            output.rebuild_norm_until_loss = 0
            output.rebuild_norm_layer = []
            output.rebuild_norm_layer_keyword = []
        else:
            return None
    else:
        raise NotImplemented
    return output

def get_optimizer_rebuild_norm(runtime_parameter: RuntimeParameters, ml_setup: MlSetup, model_parameter):
    if ml_setup.model_name == model_name:
        if runtime_parameter.current_tick == 0:
            # optimizer = torch.optim.SGD(model_parameter, lr=0.001, momentum=0.9, weight_decay=5e-4)
            base_lr = 0.001
            optimizer = torch.optim.SGD(
                [{'params': param, 'lr': base_lr} for param in model_parameter],
                momentum=0.9, weight_decay=5e-4
            )
        else:
            return None
    else:
        raise NotImplemented
    return optimizer

