{"true_reward": 3.8680177630860544, "expected_reward": 3.6897736449682874, "runtime": 18.836131658941984, "actions": 5.0, "seed": 249.5, "steps": 5000, "exploration_coeff": 5.0, "rollout_depth": 3}