{
    "seed": 1,
    "env_type": "driving",
    "env_id": "exiD",
    "env": "tools.environments.create('driving', 'exiD', normalize_states=False, normalize_actions=False, time_limit=1000)",
    "flow_epochs": 20,
    "minibatch_size": 64,
    "discount_factor": 0.99,
    "learning_rate": 5e-4,
    "learning_rate_feasibility": 2.5e-5,
    "steps_per_epoch": 1000,
    "replay_buffer_size": 10000,
    "hidden_size": 64,
    "subepochs": 25,
    "debug": true,
    "episodes_per_epoch": 20,
    "ppo_clip_param": 0.1,
    "forward_crl": "PPOLag2",
    "policy_class": "tools.algorithms.PPOPolicy",
    "ppo_entropy_coef": 0.01,
    "ppo_epochs": 50,
    "ppo_epochs_novelty": 50,
    "ppo_outer_epochs_novelty": 5,
    "normalize_flow_inputs": true,
    "window": 25,
    "beta": 5,
    "past_pi_weights": [],
    "past_pi_dissimilarities": [],
    "expert_episodes": 50,
    "pi_episodes": 50,
    "updates_per_epoch": 25,
    "alpha": 15,
    "outer_epochs": 5,
    "normalize_func": "max",
    "cost_condition": "",
    "cost_comparison": "",
    "accrual_comparison": "lambda ea, a: __import__('tools').utils.mse(ea, a)",
    "input_format": "lambda s, a: [s[0]/10., a[0]/5.]",
    "vector_input_format": "lambda S, A: torch.cat((S/10., A/5.), dim=-1)",
    "state_reduction": "lambda s: s",
    "vector_state_reduction": "lambda S: S",
    "action_reduction": "lambda a: a",
    "vector_action_reduction": "lambda A: A",
    "i": 2,
    "mix_save_epoch": 50
}