{"true_reward": 3.8392455806924515, "expected_reward": 3.657138747175988, "runtime": 0.19350797305000003, "actions": 5.0, "seed": 9499.5, "steps": 100, "exploration_coeff": 0.5, "rollout_depth": 0}