{
"exp_name": "hypergrid_environment_test",
"master_dir": "exps",
"plot": true,
"freq_plot": 10,
"n_iterations": 5000,
"batch_size": 128,
"device": "cpu",
"seed": 4444,
"freq_md": 10,
"freq_rb": 2,
"freq_ns": 2,
"repeats": 1,
"n_threads": -1,
"n_processes": -1,
"data_saving": {
    "on_policy_samples": 10000,
    "freq_data_save": 10,
    "loss": true,
    "logZ": true,
    "L1_policy_error": true,
    "L1_potential_kde_error": true
},
"env": {
    "env_name": "hypergrid",
    "grid_dimension": 3,
    "edge_size": 10,
    "max_policy_std": 7.0,
    "min_policy_std": 0.1,
    "init_value": 0,
    "mixture_dim": 4,
    "num_grid_points": 50
},
"gfn": {
    "optimizer": "adam",
    "gradient_clipping": true,
    "clip_value": 1,
    "trajectory_length": 3,
    "hidden_dim": 512,
    "n_hidden_layers": 3,
    "lr_model": 1e-3,
    "lr_logz": 1e-1,
    "lr_schedule": "linear",
    "loss": "TB",
    "lambda": 0.9,
    "tie_weights": true,
    "log_reward_clip_min": -10,
    "thompson_sampling": false,
    "thompson_sampling_num_heads": 10,
    "local_search": false,
    "local_search_K": 1,
    "nested_sampling": false,
    "noise_exploration": {
        "active": false,
        "initial_noise": 0.5,
        "final_noise": 0,
        "noise_profile": "exponential_flat"
    }
},
"metad": {
    "active": false,
    "train": true,
    "delta_t": 1,
    "n": 1,
    "beta": 1,
    "gamma": 0.1,
    "w": 0.1,
    "kde_widths": [2, 2, 2],
    "epsilon": 1e-3,
    "z_mu0s": [0, 0, 0],
    "p_mu0s": [0, 0, 0],
    "z_var0s": [1, 1, 1],
    "p_var0s": [1, 1, 1]
},
"replay_buffer": {
    "sampling_method": "biased",
    "reward_only": true,
    "active": true,
    "capacity": 10000,
    "alpha": 0.5,
    "beta": 0.3,
    "log_reward_threshold": -4
}
}