#!/bin/bash

# Run get_data_rl.py once for every (model, subset, score name, train dataset)
# combination listed below.
#
# get_data_rl.py is looked up in the parent of the current working directory,
# so the directory this script is launched from matters.
#
# Exit status: 0 if every invocation succeeded, non-zero otherwise. A failed
# invocation is reported on stderr but does not stop the remaining runs.

# Abort early if the directory change fails; otherwise every python call below
# would run from the wrong place.
cd .. || {
    printf 'error: cannot change to the parent directory of %s\n' "${PWD}" >&2
    exit 1
}

# Values passed as --train_model.
models=(
    "models--meta-llama--Llama-3.1-8B-Instruct"
    "models--deepseek-ai--DeepSeek-R1-Distill-Llama-8B"
    "models--Qwen--Qwen3-8B"
)

# Values passed as --subset.
subsets=(
    "train_NOANS"
)

# Values passed as --score_name.
# The entry below is a placeholder to be replaced before running, e.g. with
# 0.1*confidence_score+0.2*relevance_score+0.7*coherence_score or RLVR.
score_names=(
    "TODO your score name"
)

# Values passed as --traindataset, processed in this order for each combination.
train_datasets=(
    "datasets--RUC-NLPIR--FlashRAG_datasets@hotpotqa_RAG"
    "datasets--allenai--reward-bench-2"
)

failures=0
for model in "${models[@]}"; do
    for subset in "${subsets[@]}"; do
        for score_name in "${score_names[@]}"; do
            for traindataset in "${train_datasets[@]}"; do
                if ! python get_data_rl.py \
                    --train_model="${model}" \
                    --subset="${subset}" \
                    --score_name="${score_name}" \
                    --traindataset="${traindataset}"; then
                    # Keep going so one bad combination does not block the rest,
                    # but remember the failure for the final exit status.
                    printf 'error: get_data_rl.py failed (model=%s subset=%s score_name=%s traindataset=%s)\n' \
                        "${model}" "${subset}" "${score_name}" "${traindataset}" >&2
                    failures=$((failures + 1))
                fi
            done
        done
    done
done

if ((failures > 0)); then
    printf 'error: %d get_data_rl.py invocation(s) failed\n' "${failures}" >&2
fi

# Last command of the script: makes the exit status non-zero if any run failed.
((failures == 0))

