{
  "num_workers": 0,
  "observation_filter": "MeanStdFilter",
  "train_batch_size": 8192,
  "target_entropy": -8,
  "gamma": 0.995,
  "batch_mode": "truncate_episodes",
  "horizon": 10000,
  "num_gpus": 0,
  "framework": "torch",
  "no_done_at_end": true,
  "target_network_update_freq": 1000,
  "tau": 0.001,
  "num_steps_sampled_before_learning_starts": 500,
  "initial_alpha": 1,
  "twin_q": true,
  "optimization": {
    "actor_learning_rate": 0.0003,
    "critic_learning_rate": 0.0003,
    "entropy_learning_rate": 0.0001
  },
  "replay_buffer_config": {
    "capacity": 10000000,
    "type": "MultiAgentReplayBuffer"
  }
}