# Settings whose keys refer to observation layers.
# NOTE(review): the exact meaning of each value is defined by the code that
# loads this file, which is not visible here; confirm against the consumer.
Num_observation_layers: 1
First_layer_num: 5

# On/off switches, written as canonical lowercase YAML booleans so that they
# are read as booleans by every YAML 1.1 / 1.2 loader.
Observation_critic: false
Pseudocode: false

# Settings whose keys refer to debugging, search/expansion budgets and
# candidate selection.
# NOTE(review): units and exact semantics of the budgets are defined by the
# consuming code; confirm there before changing them.
Code_debug: true
search_budget_node: 25
expand_num_per_call: 3
expand_budget: 3

# Selection methods listed here also appear as keys of
# Selection_reward_weight below.
Selection_method:
  - "Test case"
  - "Reward model"
select_top_k: 1

# Numeric weight per selection method name.
# NOTE(review): "Self score" has a weight but is not listed in
# Selection_method above; confirm whether that is intentional.
Selection_reward_weight:
  "Test case": 10
  "Reward model": 1
  "Self score": 1

# NOTE(review): presumably the "n" of a pass@n evaluation metric; confirm
# against the consumer. Currently the same value as search_budget_node (25);
# verify whether the two must be kept in sync.
Pass@n: 25