#!/bin/bash
#
# Runs cat.py once, then runs reasoning_eval_score.py for every combination
# of model, subset, score name and training dataset listed below.
#
# Both Python scripts are invoked from the parent of the caller's current
# working directory (`cd ..` is relative to where the script is launched
# from, not to where this file is stored).
#
# A failing run does not stop the sweep: every combination is still
# attempted, each failure is reported on stderr, and the script exits with
# status 1 at the end if anything failed (0 otherwise).

# Abort early if the directory change fails; otherwise every following
# command would silently run in the wrong directory.
cd .. || {
    printf 'error: cannot change to the parent directory\n' >&2
    exit 1
}

# Number of commands that returned a non-zero status.
failures=0

python cat.py || {
    printf 'warning: cat.py exited with a non-zero status\n' >&2
    failures=$((failures + 1))
}

# Sweep parameters. Arrays keep each value a single word when expanded.
models=(
    "models--meta-llama--Llama-3.1-8B-Instruct"
    "models--deepseek-ai--DeepSeek-R1-Distill-Llama-8B"
    "models--Qwen--Qwen3-8B"
)
subsets=("train_ANS")
score_names=("confidence_score" "relevance_score" "coherence_score")
train_datasets=(
    "datasets--RUC-NLPIR--FlashRAG_datasets@hotpotqa_RAG"
    "datasets--allenai--reward-bench-2"
)

for model in "${models[@]}"; do
    for subset in "${subsets[@]}"; do
        for score_name in "${score_names[@]}"; do
            # Innermost loop is the dataset, so for each score name the
            # datasets are evaluated back to back in the listed order.
            for traindataset in "${train_datasets[@]}"; do
                python reasoning_eval_score.py \
                    --model="${model}" \
                    --subset="${subset}" \
                    --score_name="${score_name}" \
                    --traindataset="${traindataset}" || {
                    printf 'warning: run failed: model=%s subset=%s score_name=%s traindataset=%s\n' \
                        "${model}" "${subset}" "${score_name}" "${traindataset}" >&2
                    failures=$((failures + 1))
                }
            done
        done
    done
done

if ((failures > 0)); then
    printf 'error: %d command(s) failed\n' "${failures}" >&2
    exit 1
fi