{
    "exp_name": "pendulum_environment_test",
    "master_dir": "exps",
    "plot": true,
    "freq_plot": 10,
    "n_iterations": 1000,
    "batch_size": 64,
    "device": "cpu",
    "seed": 4444,
    "freq_md": 10,
    "freq_rb": 2,
    "repeats": 1,
    "n_threads": -1,
    "n_processes": -1,
    "data_saving": {
        "on_policy_samples": 10000,
        "freq_data_save": 10,
        "loss": true,
        "logZ": true,
        "L1_policy_error": true,
        "L1_potential_kde_error": true
    },
    "env": {
        "env_name": "pendulum",
        "max_speed": 8,
        "max_impulse": 2,
        "max_impulse_std": 0.5,
        "min_impulse_std": 0.1,
        "timestep": 0.05,
        "gravity": 10.0,
        "mass": 1.0,
        "length": 1.0,
        "interval_between_steps": 0.5,
        "lower_bound": -8,
        "upper_bound": 8,
        "init_value": [0, 0],
        "mixture_dim": 1,
        "num_grid_points": [200, 200]
    },
    "gfn": {
        "optimizer": "adam",
        "gradient_clipping": true,
        "clip_value": 1,
        "trajectory_length": 3,
        "hidden_dim": 512,
        "n_hidden_layers": 3,
        "lr_model": 1e-3,
        "lr_logz": 1e-1,
        "lr_schedule": "linear",
        "loss": "TB",
        "lambda": 0.9,
        "tie_weights": true,
        "log_reward_clip_min": -10,
        "thompson_sampling": false,
        "thompson_sampling_num_heads": 10,
        "local_search": false,
        "local_search_K": 1,
        "nested_sampling": false,
        "noise_exploration": {
            "active": false,
            "initial_noise": 2,
            "final_noise": 0,
            "noise_profile": "exponential_flat"
        }
    },
    "metad": {
        "active": false,
        "train": true,
        "delta_t": 0.05,
        "n": 2,
        "beta": 1,
        "gamma": 2,
        "w": 0.15,
        "kde_widths": [0.5, 0.5],
        "epsilon": 1e-3,
        "z_mu0s": [-1, 0],
        "p_mu0s": [0, 0],
        "z_var0s": [-1, 1],
        "p_var0s": [0.5, 0.5]
    },
    "replay_buffer": {
        "sampling_method": "biased",
        "reward_only": true,
        "active": true,
        "capacity": 10000,
        "alpha": 0.5,
        "beta": 0.3,
        "log_reward_threshold": -3
    }
}