# HH-RLHF dataset
# Training: one run per subset (train, then test); all other flags are identical.
for subset in train test; do
  python RM_traing_from_scratch.py \
    --model_name google/flan-t5-xl \
    --save_model \
    --micro_batch_size 4 \
    --dataset_type anonymous/hh-rlhf_with_features \
    --subset "$subset" \
    --prepend_mode prepend_split \
    --last_tkn \
    --epochs 4
done

# Inference: one run per subset, in the order test, then train.
for subset in test train; do
  python RM_inference.py \
    --model_name google/flan-t5-xl \
    --dataset_type anonymous/hh-rlhf_with_features \
    --subset "$subset" \
    --prepend_mode prepend_split \
    --last_tkn
done

# overoptimization
# Pseudo-label training on HH-RLHF: one run per subset (train, then test),
# using --micro_batch_size 1 and --pseudo_label.
for subset in train test; do
  python RM_traing_from_scratch.py \
    --model_name google/flan-t5-xl \
    --save_model \
    --micro_batch_size 1 \
    --dataset_type anonymous/hh-rlhf_with_features \
    --subset "$subset" \
    --prepend_mode prepend_split \
    --last_tkn \
    --epochs 4 \
    --pseudo_label
done

# subset_fit sweep (100 / 500 / 1000): HH-RLHF first, then SHP
# HH-RLHF sweep over --subset_fit values; for each value, train on the
# train subset first, then on the test subset.
for fit_size in 100 500 1000; do
  for subset in train test; do
    python RM_traing_from_scratch.py \
      --model_name google/flan-t5-xl \
      --save_model \
      --micro_batch_size 4 \
      --dataset_type anonymous/hh-rlhf_with_features \
      --subset "$subset" \
      --prepend_mode prepend_split \
      --last_tkn \
      --epochs 4 \
      --subset_fit "$fit_size"
  done
done

# SHP sweep over --subset_fit values; for each value, the test subset is
# run before the train subset.
for fit_size in 100 500 1000; do
  for subset in test train; do
    python RM_traing_from_scratch.py \
      --model_name google/flan-t5-xl \
      --save_model \
      --micro_batch_size 4 \
      --dataset_type anonymous/shp_with_features_20k \
      --subset "$subset" \
      --prepend_mode shp-prepend_split \
      --last_tkn \
      --epochs 4 \
      --subset_fit "$fit_size"
  done
done

# SHP dataset 
# SHP training: one run per subset (train, then test), with --lr 5e-5 and
# --micro_batch_size 1.
for subset in train test; do
  python RM_traing_from_scratch.py \
    --model_name google/flan-t5-xl \
    --save_model \
    --micro_batch_size 1 \
    --dataset_type anonymous/shp_with_features_20k \
    --subset "$subset" \
    --prepend_mode shp-prepend_split \
    --last_tkn \
    --epochs 4 \
    --lr 5e-5
done

# overoptimization
# Pseudo-label training on SHP: one run per subset (train, then test),
# with --pseudo_label and --lr 5e-5.
for subset in train test; do
  python RM_traing_from_scratch.py \
    --model_name google/flan-t5-xl \
    --save_model \
    --micro_batch_size 1 \
    --dataset_type anonymous/shp_with_features_20k \
    --subset "$subset" \
    --prepend_mode shp-prepend_split \
    --last_tkn \
    --epochs 4 \
    --pseudo_label \
    --lr 5e-5
done