
# Run bash/train/7b.sh three times in sequence on gsm8k / rank_feedback.
# The path is relative, so launch this from the directory containing bash/.
# Only the third positional argument changes between runs (1, 2, 3); every
# other argument is passed through unchanged.
#
# Labels carried over from the original per-run notes:
#   1 -> detach rrhf
#   2 -> boundar rrhf   (presumably "boundary" -- TODO confirm)
#   3 -> detach rrhf    (same label as run 1 -- TODO confirm it is not a copy/paste slip)
for variant in 1 2 3; do
  bash bash/train/7b.sh gsm8k rank_feedback "$variant" 3 pro 0 0 0 0
done
