{
    "seed": 1,
    "env_type": "gym",
    "env_id": "HCWithPos-v0",
    "env": "tools.environments.create('gym', 'HCWithPos-v0', normalize_states=False, time_limit=1000)",
    "flow_epochs": 20,
    "minibatch_size": 64,
    "discount_factor": 0.99,
    "learning_rate": 5e-4,
    "gae_lambda": 0.97,
    "learning_rate_feasibility": 2.5e-5,
    "replay_buffer_size": 10000,
    "hidden_size": 64,
    "subepochs": 25,
    "steps_per_epoch": 4000,
    "debug": true,
    "episodes_per_epoch": 10,
    "ppo_clip_param": 0.2,
    "forward_crl": "PPOLag2",
    "policy_class": "tools.algorithms.PPOPolicy",
    "ppo_entropy_coef": 0,
    "ppo_epochs": 50,
    "ppo_epochs_novelty": 50,
    "ppo_outer_epochs_novelty": 5,
    "normalize_flow_inputs": true,
    "window": 25,
    "beta": 15,
    "past_pi_weights": [],
    "past_pi_dissimilarities": [],
    "expert_episodes": 100,
    "pi_episodes": 100,
    "updates_per_epoch": 25,
    "alpha": 15,
    "outer_epochs": 5,
    "normalize_func": "max",
    "cost_condition": "lambda s, a: s[0] <= -1",
    "cost_comparison": "lambda mc, c: __import__('tools').utils.mse(mc, c)",
    "accrual_comparison": "lambda ea, a: __import__('tools').utils.wasserstein_distance2d(ea.reshape(1, -1), a.reshape(1, -1))",
    "input_format": "lambda s, a: [*s]",
    "vector_input_format": "lambda S, A: S",
    "state_reduction": "lambda s: s[:1]",
    "vector_state_reduction": "lambda S: S[:, :, :1]",
    "action_reduction": "lambda a: a",
    "vector_action_reduction": "lambda A: A",
    "i": 1,
    "mix_save_epoch": 50
}
