{"env_seed": 0, "n_states": 20, "sucess_probability": 0.9, "---- Shared parameters ---": "-", "gamma": 0.9, "n_repetitions": 10, "batch_size_samples": 20, "max_bellman_iterations": 5, "---- FQI ---": "-", "fitting_steps_fqi": 400, "starting_lr_fqi": 0.01, "ending_lr_fqi": 1e-05, "---- PBOs ---": "-", "n_weights": 100, "batch_size_weights": 100, "training_steps": 400, "fitting_steps_pbo": 4, "starting_lr_pbo": 0.005, "ending_lr_pbo": 1e-05, "initial_weight_std": 0.0005}