{
    "seed": 0,
    "train_cfgs": {
        "device": "cpu",
        "torch_threads": 1,
        "vector_env_nums": 2,
        "parallel": 1,
        "total_steps": 4096,
        "epochs": 2
    },
    "algo_cfgs": {
        "steps_per_epoch": 2048,
        "update_iters": 10,
        "batch_size": 64,
        "target_kl": 0.02,
        "entropy_coef": 0.0,
        "reward_normalize": false,
        "cost_normalize": false,
        "obs_normalize": true,
        "kl_early_stop": true,
        "use_max_grad_norm": true,
        "max_grad_norm": 40.0,
        "use_critic_norm": true,
        "critic_norm_coef": 0.001,
        "gamma": 0.99,
        "cost_gamma": 0.99,
        "lam": 0.95,
        "lam_c": 0.95,
        "adv_estimation_method": "gae",
        "standardized_rew_adv": true,
        "standardized_cost_adv": true,
        "penalty_coef": 0.0,
        "use_cost": false
    },
    "logger_cfgs": {
        "use_wandb": false,
        "wandb_project": "omnisafe",
        "use_tensorboard": true,
        "save_model_freq": 100,
        "log_dir": "",
        "window_lens": 100
    },
    "model_cfgs": {
        "weight_initialization_mode": "kaiming_uniform",
        "actor_type": "gaussian_learning",
        "linear_lr_decay": true,
        "exploration_noise_anneal": false,
        "std_range": [
            0.5,
            0.1
        ],
        "actor": {
            "hidden_sizes": [
                64,
                64
            ],
            "activation": "tanh",
            "lr": 0.0003
        },
        "critic": {
            "hidden_sizes": [
                64,
                64
            ],
            "activation": "tanh",
            "lr": 0.0003
        }
    },
    "exp_increment_cfgs": {
        "seed": 0,
        "algo_cfgs": {
            "steps_per_epoch": 2048
        },
        "train_cfgs": {
            "total_steps": 4096,
            "torch_threads": 1,
            "vector_env_nums": 2
        },
        "logger_cfgs": {
            "use_wandb": false,
            "log_dir": ""
        }
    },
    "exp_name": "PolicyGradient-{SafetyAntVelocity-v1}",
    "env_id": "SafetyAntVelocity-v1",
    "algo": "PolicyGradient"
}
