from ml_collections import config_dict


def get_config(algorithm_name):
    """Build the default hyperparameter configuration.

    Args:
        algorithm_name: Value stored unchanged under ``config.name``.

    Returns:
        A ``ConfigDict`` containing the general training settings followed
        by the TRIRL-specific settings, in the order declared below.
    """
    general_settings = {
        "name": algorithm_name,
        "device": "gpu",  # cpu, gpu
        "nr_parallel_seeds": 1,
        "total_timesteps": 2e9,
        "learning_rate": 4e-4,
        "anneal_learning_rate": True,
        "nr_steps": 128,
        "nr_epochs": 10,
        "minibatch_size": 32768,
        "gamma": 0.99,
        "gae_lambda": 0.9,
        "clip_range": 0.1,
        "entropy_coef": 0.001,
        "critic_coef": 1.0,
        "max_grad_norm": 5.0,
        "std_dev": 1.0,
        "action_clipping_and_rescaling": False,
        "evaluation_and_save_frequency": 17301504,  # -1 to disable
        "evaluation_active": True,
    }

    # TRIRL params
    trirl_settings = {
        "nr_hidden_units_disc": 256,
        "learning_rate_disc": 4e-4,
        "nr_epochs_disc": 30,  # number of disc epochs
        "env_reward_frac": 0.0,
        "data_path": "../expert_data/30_episodes/expert_dataset_Ant-v5_30_PPO.npz",
        "gp_lambda": 0.01,
        "gp_alpha": 0.5,
        "handle_absorbing_states": True,
        # options: state-action, state-based, shaped, shaped-sa, uncorrelated
        "reward_type": "shaped",
    }
    # Currently disabled options (kept for reference):
    #   global_rew_experiment = False
    #   subsampling_cutoff = 1

    config = config_dict.ConfigDict()
    # Insert group by group so the field order matches the declarations.
    for settings in (general_settings, trirl_settings):
        for key, value in settings.items():
            config[key] = value

    return config
