#!/usr/bin/env bash
#
# Runs the data-construction pipeline for one math dataset: stage-1 post
# processing, the two stage-2 "missing" variants, model response collection,
# training-set sampling/filtering and dataset statistics.
#
# Usage: bash <this-script> [prefix]
#   prefix  Dataset name embedded in every input/output file name
#           (default: openr1_math).
#
# Run it from the directory that contains benchmark_construction/,
# critic_bench/ and Task_1/: every path below is relative, and the current
# directory is what gets appended to PYTHONPATH for each Python invocation.

# Stop at the first failing stage so later stages never consume missing or
# stale files (the model-querying stages in particular are expensive to run
# on bad input). -u catches misspelled variable names.
set -euo pipefail

prefix=${1:-openr1_math}

# Common path stems; each stage only differs in the suffix it appends.
bench="critic_bench/${prefix}"
task="Task_1/${prefix}"

# Flags shared by every get_response_* call. Kept as two arrays so that the
# original argument order (model, client, [--use_raw], concurrency) survives.
client_args=(--model_name 'deepseek-r1' --client_name 'aliyun')
concurrency_args=(--num_concurrent 250)

# The four response files consumed by both sampling/filtering scripts.
sampling_inputs=(
  --input_file_raw "${task}_raw_r1.jsonl"
  --input_file_raw_non_parsed "${task}_raw_r1_non_parsed.jsonl"
  --input_file_im "${task}_information_missing_level1_r1.jsonl"
  --input_file_pm "${task}_purpose_missing_r1.jsonl"
)

#######################################
# Runs a Python script with the current directory appended to PYTHONPATH.
# Globals:   PYTHONPATH (read; only extended for the child process)
# Arguments: script path followed by its arguments
# Returns:   exit status of the python process
#######################################
run_py() {
  # ${VAR:+...} avoids both the unset-variable error under `set -u` and an
  # empty leading path entry when PYTHONPATH was not set by the caller.
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}${PWD}" python "$@"
}

# decomposition
# The two steps below were already disabled in this script; re-enable them to
# rebuild from the raw dataset. NOTE(review): presumably they produce
# ${bench}.jsonl and ${bench}_parsed.jsonl -- confirm before relying on it.
# run_py "benchmark_construction/raw_datasets/get_${prefix}.py"
# run_py benchmark_construction/stage_1/math/task_decomposition.py --input_file "${bench}.jsonl"
run_py benchmark_construction/stage_1/math/post_process.py \
  --input_file "${bench}_parsed.jsonl" \
  --output_file "${bench}_non_parsed.jsonl"

# information missing
# Generation step was already disabled in this script; only the post-process
# runs. NOTE(review): later stages read *_pp.jsonl files that no command here
# names as an output -- presumably the post_process* scripts write them.
# run_py benchmark_construction/stage_2/math/information_missing.py --input_file "${bench}_parsed_pp.jsonl" --output_file "${bench}_information_missing_level1.jsonl" --task_level 1 --seed 42 --variants 2
run_py benchmark_construction/stage_2/math/post_process_type_1.py \
  --input_file "${bench}_information_missing_level1.jsonl"

# purpose missing
run_py benchmark_construction/stage_2/math/purpose_missing.py \
  --input_file "${bench}_parsed_pp.jsonl" \
  --output_file "${bench}_purpose_missing.jsonl" \
  --seed 42
run_py benchmark_construction/stage_2/math/post_process_type_2.py \
  --input_file "${bench}_purpose_missing.jsonl"

# get_response
# Raw problems (parsed and non-parsed) go through get_response_raw.py with
# --use_raw; the two "missing" variants go through get_response_unclear.py.
run_py Task_1/math/get_response_raw.py \
  --input_file "${bench}_parsed_pp.jsonl" \
  --save_path "${task}_raw_r1.jsonl" \
  "${client_args[@]}" --use_raw "${concurrency_args[@]}"
run_py Task_1/math/get_response_raw.py \
  --input_file "${bench}_non_parsed.jsonl" \
  --save_path "${task}_raw_r1_non_parsed.jsonl" \
  "${client_args[@]}" --use_raw "${concurrency_args[@]}"
run_py Task_1/math/get_response_unclear.py \
  --input_file "${bench}_information_missing_level1_pp.jsonl" \
  --save_path "${task}_information_missing_level1_r1.jsonl" \
  "${client_args[@]}" "${concurrency_args[@]}"
run_py Task_1/math/get_response_unclear.py \
  --input_file "${bench}_purpose_missing_pp.jsonl" \
  --save_path "${task}_purpose_missing_r1.jsonl" \
  "${client_args[@]}" "${concurrency_args[@]}"

# training sampling / filtering
run_py Task_1/math/training_sampling_filtering.py \
  "${sampling_inputs[@]}" \
  --output_non_cls "${task}_non_cls_training.jsonl" \
  --output_cls "${task}_cls_training.jsonl"

# dataset statistics
# Only the two response files are passed --training; the sampled non-cls
# training file is not.
run_py benchmark_construction/dataset_statistics.py \
  --input_file "${task}_information_missing_level1_r1.jsonl" --training
run_py benchmark_construction/dataset_statistics.py \
  --input_file "${task}_purpose_missing_r1.jsonl" --training
run_py benchmark_construction/dataset_statistics.py \
  --input_file "${task}_non_cls_training.jsonl"

# critic bench file, built from the same four response files
run_py Task_1/math/training_sampling_filtering_2.py \
  "${sampling_inputs[@]}" \
  --output_file "${task}_critic_bench.jsonl"