{
    "seed": 0,
    "train_cfgs": {
        "device": "cpu",
        "torch_threads": 16,
        "vector_env_nums": 1,
        "parallel": 1,
        "total_steps": 1024000,
        "algo": "PPO",
        "env_id": "SafetyPointGoal1-v0",
        "epochs": 1000
    },
    "algo_cfgs": {
        "steps_per_epoch": 1024,
        "update_iters": 40,
        "batch_size": 64,
        "target_kl": 0.02,
        "entropy_coef": 0.0,
        "reward_normalize": true,
        "cost_normalize": true,
        "obs_normalize": true,
        "kl_early_stop": true,
        "use_max_grad_norm": true,
        "max_grad_norm": 40.0,
        "use_critic_norm": true,
        "critic_norm_coef": 0.001,
        "gamma": 0.99,
        "cost_gamma": 0.99,
        "lam": 0.95,
        "lam_c": 0.95,
        "clip": 0.2,
        "adv_estimation_method": "gae",
        "standardized_rew_adv": true,
        "standardized_cost_adv": true,
        "penalty_coef": 0.0,
        "use_cost": false
    },
    "logger_cfgs": {
        "use_wandb": false,
        "wandb_project": "omnisafe",
        "use_tensorboard": true,
        "save_model_freq": 100,
        "log_dir": "./runs",
        "window_lens": 100
    },
    "model_cfgs": {
        "weight_initialization_mode": "kaiming_uniform",
        "actor_type": "gaussian_learning",
        "linear_lr_decay": true,
        "exploration_noise_anneal": false,
        "std_range": [
            0.5,
            0.1
        ],
        "actor": {
            "hidden_sizes": [
                64,
                64
            ],
            "activation": "tanh",
            "lr": 0.0003
        },
        "critic": {
            "hidden_sizes": [
                64,
                64
            ],
            "activation": "tanh",
            "lr": 0.0003
        }
    },
    "exp_name": "PPO-(SafetyPointGoal1-v0)",
    "env_id": "SafetyPointGoal1-v0",
    "algo": "PPO"
}
