{
    "physics_params": {
        "x_threshold": 0.3,
        "theta_dot_threshold": 15,
        "kinematics_integrator": "euler",
        "ini_states": [
            0.0,
            0.0,
            -3.141592653589793,
            0.0,
            false
        ],
        "gravity": 9.8,
        "mass_cart": 0.94,
        "mass_pole": 0.23,
        "force_mag": 20.0,
        "voltage_mag": 20.0,
        "length": 0.64,
        "theta_random_std": 0.8,
        "friction_cart": 10,
        "friction_pole": 0.0011,
        "with_friction": true,
        "force_input": false,
        "simulation_frequency": 30,
        "actuation_delay": 1
    },
    "reward_params": {
        "distance_score_reward": 1.2,
        "action_penalty": 0.01,
        "crash_penalty": 0,
        "distance_score_factor": 5
    },
    "stats_params": {
        "max_episode_steps": 500,
        "total_steps": 20000,
        "target_distance_score": 0.77880078307,
        "targets": [
            0.0,
            0.0
        ],
        "model_name": "model_name",
        "eval_period": 20,
        "log_file_name": "20250919-140903",
        "force_override": false,
        "weights_path": null,
        "running_mode": "train",
        "random_initial_ips": true,
        "visualize_eval": false,
        "reset_delay": 1.0,
        "can_swing_up_steps": 100,
        "on_target_reset_steps": 500,
        "converge_episodes": 3,
        "converge_swing_up_time": 250
    },
    "agent_params": {
        "agent_name": "SAC",
        "mode": "train",
        "soft_alpha": 0.005,
        "learning_rate_actor": 0.0003,
        "learning_rate_critic": 0.0003,
        "batch_size": 128,
        "target_network_frequency": 1,
        "noise_clip": 0.5,
        "entropy_alpha": 0.1,
        "gamma_discount": 0.99,
        "model_path": "",
        "total_training_steps": 5000000,
        "replay_buffer_size": 500000,
        "learning_starts": 128,
        "policy_update_frequency": 1,
        "use_layer_norm": false,
        "actor_hidden_units": [
            256,
            256
        ],
        "critic_hidden_units": [
            256,
            256
        ],
        "actor_activation": "relu",
        "critic_activation": "relu",
        "autosafe_lam_mode": "opt",
        "add_actions_observations": true,
        "action_observations_dim": 5,
        "action_noise_factor": 0
    },
    "redis_params": {
        "servers": [
            {
                "port": "6379",
                "password": "ippc123456",
                "host_ip": "10.162.12.223",
                "name": "cloud"
            }
        ],
        "ch_edge_control": {
            "server_name": "cloud",
            "channel_name": "ch_plant_control"
        },
        "ch_plant_trajectory_segment": {
            "server_name": "cloud",
            "channel_name": "ch_plant_trajectory_segment"
        },
        "ch_plant_reset": {
            "server_name": "cloud",
            "channel_name": "ch_plant_reset"
        },
        "ch_edge_weights": {
            "server_name": "cloud",
            "channel_name": "ch_edge_weights"
        },
        "ch_edge_ready_update": {
            "server_name": "cloud",
            "channel_name": "ch_edge_ready_update"
        },
        "ch_edge_mode": {
            "server_name": "cloud",
            "channel_name": "ch_edge_mode"
        },
        "ch_edge_trajectory": {
            "server_name": "cloud",
            "channel_name": "ch_edge_trajectory"
        },
        "ch_training_steps": {
            "server_name": "cloud",
            "channel_name": "ch_training_steps"
        }
    },
    "cloud_params": {
        "sleep_after_reset": 2,
        "agent_type": 0,
        "pre_fill_steps": 0,
        "weights_update_period": 1,
        "artificial_bandwidth": -1,
        "artificial_ping": 0,
        "ethernet_bandwidth": 100,
        "ethernet_ping": 0.2
    },
    "trainer_params": {
        "gamma_discount": 0.99,
        "rm_size": 1000000,
        "combined_experience_replay": true,
        "use_prioritized_replay": false,
        "batch_size": 128,
        "learning_rate_actor": 0.0003,
        "learning_rate_critic": 0.0003,
        "is_remote_train": false,
        "actor_freeze_step_count": 128,
        "pre_fill_exp": 128,
        "target_action_noise": true,
        "training_epoch": 1,
        "actor_update_period": 1,
        "step_soft_update": false
    }
}