{"env_seed": 1, "n_actions_on_max": 200, "max_action_on_max": 8, "max_discrete_state": 4, "max_discrete_action": 4, "---- Shared parameters ---": "-", "n_discrete_states": 11, "n_discrete_actions": 11, "batch_size_samples": 121, "max_bellman_iterations": 2, "---- FQI ---": "-", "fitting_steps_fqi": 800, "starting_lr_fqi": 0.01, "ending_lr_fqi": 1e-05, "---- PBOs ---": "-", "n_weights": 1, "batch_size_weights": 1, "training_steps": 3200, "fitting_steps_pbo": 1, "starting_lr_pbo": 0.01, "ending_lr_pbo": 1e-05, "initial_weight_std": 0.0005}