{
    "seed": 1,
    "env_type": "driving",
    "env_id": "highD",
    "env": "tools.environments.create('driving', 'highD', normalize_states=False, time_limit=1000)",
    "flow_epochs": 20,
    "minibatch_size": 64,
    "discount_factor": 0.99,
    "learning_rate": 5e-4,
    "learning_rate_feasibility": 2.5e-5,
    "replay_buffer_size": 10000,
    "hidden_size": 64,
    "subepochs": 25,
    "debug": true,
    "episodes_per_epoch": 20,
    "ppo_clip_param": 0.1,
    "forward_crl": "CPPO",
    "policy_class": "tools.algorithms.PPOPolicy",
    "ppo_entropy_coef": 0.01,
    "ppo_epochs": 50,
    "ppo_epochs_novelty": 25,
    "ppo_outer_epochs_novelty": 5,
    "normalize_flow_inputs": true,
    "window": 25,
    "beta": 0.1,
    "past_pi_weights": [],
    "past_pi_dissimilarities": [],
    "expert_episodes": 50,
    "pi_episodes": 50,
    "updates_per_epoch": 25,
    "alpha": 15,
    "outer_epochs": 3,
    "normalize_func": "bin",
    "cost_condition": "",
    "cost_comparison": "",
    "accrual_comparison": "lambda ea, a: __import__('tools').utils.mse(ea, a)",
    "input_format": "lambda s, a: [*s]",
    "vector_input_format": "lambda S, A: S",
    "state_reduction": "lambda s: [s[2], s[-1]]",
    "vector_state_reduction": "lambda S: S[:, :, [2, -1]]",
    "action_reduction": "lambda a: a",
    "vector_action_reduction": "lambda A: A",
    "i": 2,
    "mix_save_epoch": 25
}