# Greedy pass: for every dataset, query 'x-ai/grok-3-mini-beta' through the
# 'openrouter' client at temperature 0 and save one JSONL file per input
# variant (raw, information_missing_level1, purpose_missing).
#
# `prefix` is supplied by the loop itself, so no assignment is needed before
# it. The working directory is appended to PYTHONPATH for each command
# (presumably so the scripts can import modules from the repository root --
# confirm); the ${PYTHONPATH:+...} form avoids a leading empty entry when
# PYTHONPATH is unset.
for prefix in 'math_500' 'omni_math'; do
  # Raw variant: get_response_raw.py with --use_raw.
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/get_response_raw.py \
    --input_file "critic_bench/${prefix}_parsed_reassemble_verified_pp.jsonl" \
    --save_path "Task_1/${prefix}_raw_grok3_mini_m.jsonl" \
    --model_name 'x-ai/grok-3-mini-beta' \
    --client_name 'openrouter' \
    --use_raw \
    --num_concurrent 250 \
    --max_queries 50 \
    --temperature 0.

  # information_missing_level1 variant.
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/get_response_unclear.py \
    --input_file "critic_bench/${prefix}_information_missing_level1_verified_pp.jsonl" \
    --save_path "Task_1/${prefix}_information_missing_level1_grok3_mini_m.jsonl" \
    --model_name 'x-ai/grok-3-mini-beta' \
    --client_name 'openrouter' \
    --num_concurrent 250 \
    --max_queries 50 \
    --temperature 0.

  # purpose_missing variant.
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/get_response_unclear.py \
    --input_file "critic_bench/${prefix}_purpose_missing_verified_pp.jsonl" \
    --save_path "Task_1/${prefix}_purpose_missing_grok3_mini_m.jsonl" \
    --model_name 'x-ai/grok-3-mini-beta' \
    --client_name 'openrouter' \
    --num_concurrent 250 \
    --max_queries 50 \
    --temperature 0.
done

# Sampling pass (temperature 0.6): the same three queries per dataset, with
# ${suffix} appended to each output file name so that a sampled run gets its
# own files.
#
# `suffix` is not assigned anywhere in this script, so it has to come from the
# caller's environment (e.g. `suffix=1 bash <this script>`). With an empty
# suffix the save paths below would be identical to the ones used by the
# temperature-0 commands, so the pass is skipped rather than writing to those
# files.
if [ -z "${suffix:-}" ]; then
  printf '%s\n' "suffix is unset or empty: skipping the temperature-0.6 pass (its save paths would collide with the temperature-0 outputs)" >&2
else
  for prefix in 'math_500' 'omni_math'; do
    # Raw variant: get_response_raw.py with --use_raw.
    PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/get_response_raw.py \
      --input_file "critic_bench/${prefix}_parsed_reassemble_verified_pp.jsonl" \
      --save_path "Task_1/${prefix}_raw_grok3_mini_m${suffix}.jsonl" \
      --model_name 'x-ai/grok-3-mini-beta' \
      --client_name 'openrouter' \
      --use_raw \
      --num_concurrent 250 \
      --max_queries 50 \
      --temperature 0.6

    # information_missing_level1 variant.
    PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/get_response_unclear.py \
      --input_file "critic_bench/${prefix}_information_missing_level1_verified_pp.jsonl" \
      --save_path "Task_1/${prefix}_information_missing_level1_grok3_mini_m${suffix}.jsonl" \
      --model_name 'x-ai/grok-3-mini-beta' \
      --client_name 'openrouter' \
      --num_concurrent 250 \
      --max_queries 50 \
      --temperature 0.6

    # purpose_missing variant.
    PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/get_response_unclear.py \
      --input_file "critic_bench/${prefix}_purpose_missing_verified_pp.jsonl" \
      --save_path "Task_1/${prefix}_purpose_missing_grok3_mini_m${suffix}.jsonl" \
      --model_name 'x-ai/grok-3-mini-beta' \
      --client_name 'openrouter' \
      --num_concurrent 250 \
      --max_queries 50 \
      --temperature 0.6
  done
fi

# Evaluation: run the evaluation scripts on the saved responses of every
# dataset. Previously `prefix` was assigned 'math_500' and then immediately
# 'omni_math', so only omni_math was ever evaluated; looping keeps the dataset
# list in line with the generation loops.
for prefix in 'math_500' 'omni_math'; do
  # evaluation.py on the single-run files (names ending in _m.jsonl).
  # Disabled: raw file evaluated against itself.
  #PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation.py --input_path_cls "Task_1/${prefix}_raw_grok3_mini_m.jsonl" --input_path_raw "Task_1/${prefix}_raw_grok3_mini_m.jsonl"
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation.py \
    --input_path_cls "Task_1/${prefix}_information_missing_level1_grok3_mini_m.jsonl" \
    --input_path_raw "Task_1/${prefix}_raw_grok3_mini_m.jsonl"
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation.py \
    --input_path_cls "Task_1/${prefix}_purpose_missing_grok3_mini_m.jsonl" \
    --input_path_raw "Task_1/${prefix}_raw_grok3_mini_m.jsonl"

  # evaluation_m.py on the suffixed files. The '{}' in each path is passed to
  # the script literally (the shell does not expand an empty brace pair);
  # presumably evaluation_m.py substitutes the run suffix there -- confirm
  # against that script.
  # Disabled: raw files evaluated against themselves.
  #PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation_m.py --input_path_cls "Task_1/${prefix}_raw_grok3_mini_m{}.jsonl" --input_path_raw "Task_1/${prefix}_raw_grok3_mini_m{}.jsonl"
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation_m.py \
    --input_path_cls "Task_1/${prefix}_information_missing_level1_grok3_mini_m{}.jsonl" \
    --input_path_raw "Task_1/${prefix}_raw_grok3_mini_m{}.jsonl"
  PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}$(pwd)" python Task_1/math/evaluation_m.py \
    --input_path_cls "Task_1/${prefix}_purpose_missing_grok3_mini_m{}.jsonl" \
    --input_path_raw "Task_1/${prefix}_raw_grok3_mini_m{}.jsonl"
done
