# Dataset prefix used to build the input/output file names in this script.
# Previously 'math_500' was assigned first and immediately overwritten, so
# only 'omni_math' ever took effect; the alternative is kept here for
# reference:
#   prefix='math_500'
prefix='omni_math'

# Generation pass with --temperature 0. over both dataset prefixes.
# For each prefix, three commands run in this order:
#   1. get_response_raw.py on the *_parsed_reassemble_verified_pp.jsonl input
#      (the only call that passes --use_raw),
#   2. get_response_unclear.py on the information_missing_level1 input,
#   3. get_response_unclear.py on the purpose_missing input.
# Inputs are read from critic_bench/ and results are saved under Task_1/ with
# an `_r1_m.jsonl` ending. `prefix` keeps its last value ('omni_math') after
# the loop finishes.
repo_root=$(pwd)
for prefix in math_500 omni_math; do
  in_stem="critic_bench/${prefix}"
  out_stem="Task_1/${prefix}"

  PYTHONPATH="${PYTHONPATH}:${repo_root}:${repo_root}" \
    python Task_1/math/get_response_raw.py \
    --input_file "${in_stem}_parsed_reassemble_verified_pp.jsonl" \
    --save_path "${out_stem}_raw_r1_m.jsonl" \
    --model_name 'deepseek-r1' --client_name 'aliyun' --use_raw \
    --num_concurrent 250 --max_queries 50 --temperature 0.

  # Both "unclear" variants share the same script and flags; only the file
  # name stem differs.
  for variant in information_missing_level1 purpose_missing; do
    PYTHONPATH="${PYTHONPATH}:${repo_root}:${repo_root}" \
      python Task_1/math/get_response_unclear.py \
      --input_file "${in_stem}_${variant}_verified_pp.jsonl" \
      --save_path "${out_stem}_${variant}_r1_m.jsonl" \
      --model_name 'deepseek-r1' --client_name 'aliyun' \
      --num_concurrent 250 --max_queries 50 --temperature 0.
  done
done

# Repeated generation pass with --temperature 0.6: five runs (suffix 0..4),
# each covering both dataset prefixes. Within one (suffix, prefix) pair the
# commands run in this order:
#   1. get_response_raw.py on the *_parsed_reassemble_verified_pp.jsonl input
#      (the only call that passes --use_raw),
#   2. get_response_unclear.py on the information_missing_level1 input,
#   3. get_response_unclear.py on the purpose_missing input.
# Each result is saved under Task_1/ with the run suffix appended to the
# `_r1_m` stem (e.g. `..._r1_m3.jsonl`). After the loops, `suffix` is '4' and
# `prefix` is 'omni_math'.
repo_root=$(pwd)
for suffix in 0 1 2 3 4; do
  for prefix in math_500 omni_math; do
    in_stem="critic_bench/${prefix}"
    out_stem="Task_1/${prefix}"

    PYTHONPATH="${PYTHONPATH}:${repo_root}:${repo_root}" \
      python Task_1/math/get_response_raw.py \
      --input_file "${in_stem}_parsed_reassemble_verified_pp.jsonl" \
      --save_path "${out_stem}_raw_r1_m${suffix}.jsonl" \
      --model_name 'deepseek-r1' --client_name 'aliyun' --use_raw \
      --num_concurrent 250 --max_queries 50 --temperature 0.6

    # Both "unclear" variants share the same script and flags; only the file
    # name stem differs.
    for variant in information_missing_level1 purpose_missing; do
      PYTHONPATH="${PYTHONPATH}:${repo_root}:${repo_root}" \
        python Task_1/math/get_response_unclear.py \
        --input_file "${in_stem}_${variant}_verified_pp.jsonl" \
        --save_path "${out_stem}_${variant}_r1_m${suffix}.jsonl" \
        --model_name 'deepseek-r1' --client_name 'aliyun' \
        --num_concurrent 250 --max_queries 50 --temperature 0.6
    done
  done
done

# Run Task_1/math/evaluation.py on the single-run `_r1_m.jsonl` outputs.
#
# The commands used to read `${prefix}` as whatever value the last `for` loop
# left behind, so only 'omni_math' was evaluated even though outputs are
# produced for both datasets. The prefixes are now iterated explicitly.
#
# For each prefix, the information_missing_level1 and purpose_missing outputs
# are each passed as --input_path_cls, with the matching raw output as
# --input_path_raw.
# Globals: prefix, variant, raw_path (written); PYTHONPATH (read).
evaluate_single_run() {
  for prefix in 'math_500' 'omni_math'; do
    raw_path="Task_1/${prefix}_raw_r1_m.jsonl"

    # Disabled in the original script: evaluate the raw output against itself.
    #PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation.py --input_path_cls "${raw_path}" --input_path_raw "${raw_path}"

    for variant in 'information_missing_level1' 'purpose_missing'; do
      # Append the working directory once; `:+` avoids a leading empty entry
      # when PYTHONPATH is unset or empty.
      PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" \
        python Task_1/math/evaluation.py \
        --input_path_cls "Task_1/${prefix}_${variant}_r1_m.jsonl" \
        --input_path_raw "${raw_path}"
    done
  done
}
evaluate_single_run

# Run Task_1/math/evaluation_m.py on the suffixed `_r1_m{}.jsonl` outputs.
#
# The commands used to read `${prefix}` as whatever value the last `for` loop
# left behind, so only 'omni_math' was evaluated even though outputs are
# produced for both datasets. The prefixes are now iterated explicitly.
#
# The literal `{}` in each path is passed through to the Python script
# unchanged (the shell does not expand empty braces).
# NOTE(review): presumably evaluation_m.py substitutes the run suffixes
# (0..4) for `{}` — confirm against that script.
# Globals: prefix, variant, raw_pattern (written); PYTHONPATH (read).
evaluate_multi_run() {
  for prefix in 'math_500' 'omni_math'; do
    raw_pattern="Task_1/${prefix}_raw_r1_m{}.jsonl"

    # Disabled in the original script: evaluate the raw outputs against
    # themselves.
    #PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation_m.py --input_path_cls "${raw_pattern}" --input_path_raw "${raw_pattern}"

    for variant in 'information_missing_level1' 'purpose_missing'; do
      # Append the working directory once; `:+` avoids a leading empty entry
      # when PYTHONPATH is unset or empty.
      PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" \
        python Task_1/math/evaluation_m.py \
        --input_path_cls "Task_1/${prefix}_${variant}_r1_m{}.jsonl" \
        --input_path_raw "${raw_pattern}"
    done
  done
}
evaluate_multi_run
