#!/usr/bin/env bash
#
# Runs the `inference_rlhf.code.extract_json_from_pkl` module once per
# (task, policy) pair, all pairs in parallel, then waits for every job.
# Judging by the module name it converts pickled results to JSON -- confirm
# against the module itself.
#
# Requirements: `python3` on PATH and the `inference_rlhf` package importable
# (e.g. run from the repository root).
#
# Exit status: 0 if every job succeeded, 1 if at least one job failed.
# (A bare `wait` always returns 0, which would hide failed jobs.)
#
# The body is kept POSIX-sh compatible so `sh <script>` keeps working.

# PIDs of all background jobs started by launch(); PIDs are plain integers,
# so a space-separated string is safe to split on.
pids=""

#######################################
# Start one extraction job in the background and remember its PID.
# Globals:   pids (appended to)
# Arguments: $1 - task name, $2 - policy name
# Outputs:   on failure, the job writes a diagnostic line to stderr
#######################################
launch() {
  {
    python3 -m inference_rlhf.code.extract_json_from_pkl \
      user=anonymousanonymous task="$1" policy="$2" || {
      rc=$?
      printf 'extract_json_from_pkl failed (exit %s): task=%s policy=%s\n' \
        "$rc" "$1" "$2" >&2
      exit "$rc"
    }
  } &
  pids="$pids $!"
}

# MATH
# Disabled runs are kept for reference; uncomment a line to re-enable it.
# NOTE: the qwen-25-7b and qwen-25-14b math runs were previously written
# without a trailing '&' (i.e. foreground); launch always backgrounds.
# launch math mistral-7b
# launch math qwen-25-3b
# launch math llama-3-3b
# launch math qwen-25-05b
# launch math qwen-25-7b
# launch math qwen-25-14b
launch math phi-3-medium
launch math phi-4

# GSM8K
# launch gsm8k qwen-25-3b
# launch gsm8k mistral-7b
# launch gsm8k llama-3-3b
# launch gsm8k qwen-25-05b
# launch gsm8k qwen-25-7b
# launch gsm8k qwen-25-14b
launch gsm8k phi-3-medium
launch gsm8k phi-4

# Wait on each PID individually so that every job's exit status is observed.
status=0
for pid in $pids; do
  wait "$pid" || status=1
done

exit "$status"