---
# Run configuration for the `specalign_rejection` approach.
# NOTE(review): the per-key notes below are inferred from key names only;
# confirm each against the code that consumes this file.

# --- Run identity ---------------------------------------------------------
approach: specalign_rejection
logname: specalign_rejection

# --- Dataset --------------------------------------------------------------
# Absolute path under /root: adjust when running on a different machine or
# checkout location.
dataset_name: "/root/specalign/external/qwen25_math_evaluation/data/amc23/test.jsonl"

# --- Search ---------------------------------------------------------------
# presumably the number of candidates kept per problem -- TODO confirm
n: 4
search_batch_size: 1

# Both bounds are null here; presumably that selects the whole dataset --
# verify against the loader.
dataset_start: null
dataset_end: null

seed: 42
rm_regularizer: 1
num_iterations: 10
sort_completed: true
max_tokens: 512

# --- Decoding / sampling --------------------------------------------------
speculative: true
sample_final_pred: false
sample: true
temperature: 0.2

# --- Model endpoints ------------------------------------------------------
# Three separate localhost endpoints, each on its own port: draft (12343),
# target (12345) and PRM (12342). The `/v1` suffix suggests OpenAI-compatible
# servers -- TODO confirm. They are presumably expected to be up before the
# run starts.
draft_model_path: "Qwen/Qwen2.5-Math-1.5B-Instruct"
draft_model_ip_address: "http://localhost:12343/v1"
target_model_path: "Qwen/Qwen2.5-Math-7B-Instruct"
target_model_ip_address: "http://localhost:12345/v1"
prm_path: "Skywork/Skywork-o1-Open-PRM-Qwen-2.5-7B"
prm_ip_address: "http://localhost:12342/v1"