{"true_reward": 3.827526112627572, "expected_reward": 3.6515383579187946, "runtime": 0.2090997968909997, "actions": 5.0, "seed": 5499.5, "steps": 100, "exploration_coeff": 0.5, "rollout_depth": 0}