{
    "reasoning_method": "bfs",
    "n_actions": 3,
    "model_name": "Qwen/Qwen3-32B-AWQ",
    "eval_model_name": "Qwen/Qwen3-32B-AWQ",
    "enable_think_policy": [
        true
    ],
    "enable_think_eval": [
        true
    ],
    "enable_think_terminal_gen": [
        false
    ],
    "gpu_device": "nvidia l40s",
    "terminate_constraints": [
        "binary_sampling"
    ],
    "terminate_ORM_name": null,
    "terminal_gen_model_name": "Qwen/Qwen3-32B-AWQ",
    "r_terminating": null,
    "sample_size_terminate": 10,
    "sample_threshold_terminate": 0.8,
    "sample_threshold_verify": 0.8,
    "depth_limit": 10,
    "force_terminating_on_depth_limit": false,
    "terminate_on_terminal_node": true,
    "bn_model_name": null,
    "add_continuation": true,
    "reward_alpha": null,
    "reward_beta": null,
    "reward_gamma": 0.49,
    "reward_gamma1": null,
    "n_actions_for_bne": 3,
    "bn_method": "sc",
    "only_continuation_at_head": false,
    "max_new_tokens_for_bn_eval": null,
    "max_try_for_bn_eval": 3,
    "think_for_usefulness": false,
    "think_for_correctness": false,
    "n_for_correctness": 2,
    "n_for_usefulness": 1,
    "package_version": "v0.1.6",
    "beam_size": 5
}