{"true_reward": 3.9146137740042435, "expected_reward": 3.6846202246072433, "runtime": 3.640309292977995, "actions": 5.0, "seed": 249.5, "steps": 1000, "exploration_coeff": 10.0, "rollout_depth": 3}