{
    "exp_name": "line_environment_test",
    "master_dir": "exps",
    "plot": true,
    "freq_plot": 10,
    "n_iterations": 1000,
    "batch_size": 64,
    "device": "cpu",
    "seed": 4444,
    "freq_md": 10,
    "freq_rb": 2,
    "freq_ns": 2,
    "repeats": 1,
    "n_threads": -1,
    "n_processes": -1,
    "data_saving": {
        "on_policy_samples": 10000,
        "freq_data_save": 10,
        "loss": true,
        "logZ": true,
        "L1_policy_error": true,
        "L1_potential_kde_error": true
    },
    "env": {
        "env_name": "line",
        "mus": [-2, -2, 2, 20],
        "variances": [1.0, 0.4, 0.6, 0.1],
        "lower_bound": [-5],
        "upper_bound": [23],
        "init_value": [0],
        "mixture_dim": 3,
        "num_grid_points": [500],
        "max_policy_std": 1,
        "min_policy_std": 0.1
    },
    "gfn": {
        "optimizer": "adam",
        "gradient_clipping": true,
        "clip_value": 1,
        "trajectory_length": 3,
        "hidden_dim": 256,
        "n_hidden_layers": 3,
        "lr_model": 1e-3,
        "lr_logz": 1e-1,
        "lr_schedule": "linear",
        "loss": "TB",
        "lambda": 0.9,
        "tie_weights": true,
        "log_reward_clip_min": -10,
        "thompson_sampling": false,
        "thompson_sampling_num_heads": 10,
        "local_search": false,
        "local_search_K": 1,
        "nested_sampling": false,
        "noise_exploration": {
            "active": false,
            "initial_noise": 2,
            "final_noise": 0,
            "noise_profile": "exponential_flat"
        }
    },
    "metad": {
        "active": false,
        "train": true,
        "delta_t": 0.05,
        "n": 2,
        "beta": 1,
        "gamma": 2,
        "w": 0.15,
        "epsilon": 1e-3,
        "kde_widths": [0.1],
        "z_mu0s": [0],
        "z_var0s": [1],
        "p_mu0s": [0],
        "p_var0s": [0.5]
    },
    "replay_buffer": {
        "sampling_method": "biased",
        "reward_only": true,
        "active": true,
        "capacity": 10000,
        "alpha": 0.5,
        "beta": 0.3,
        "log_reward_threshold": -3
    }
}