{"true_reward": 3.929448866673884, "expected_reward": 3.6789037525999166, "runtime": 11.004025248940001, "actions": 5.0, "seed": 249.5, "steps": 5000, "exploration_coeff": 100.0, "rollout_depth": 0}