#!/usr/bin/env bash
# Runs the `rand.sample` Python module once for every combination of seed
# (3, 6, 9) and percentage (0.005, 0.01, 0.05) over the training sets listed
# in TRAIN_FILE_NAMES.
#
# All paths are relative, so they resolve against the directory the script is
# started from. Each seed gets its own output path:
# ../selected_data_seed<seed>.
#
# A failing run does not stop the sweep: it is reported on stderr, the
# remaining combinations still run, and the block finishes with a non-zero
# status if at least one run failed.

# Space-separated dataset names. Expanded unquoted on purpose below so that
# every name is passed as its own argument.
TRAIN_FILE_NAMES="flan_v2 cot dolly oasst1"

# Derive one data file per dataset name so the name list and the file list
# cannot drift apart. `${VAR:+...}` adds the separating space only once the
# list is non-empty.
TRAIN_FILES=""
for name in ${TRAIN_FILE_NAMES}; do
  TRAIN_FILES="${TRAIN_FILES:+${TRAIN_FILES} }../data/train/processed/${name}/${name}_data.jsonl"
done

failed_runs=0
for seed in 3 6 9; do
  SELECTED_DATA_OUTPUT_PATH="../selected_data_seed${seed}"
  for percent in 0.005 0.01 0.05; do
    # shellcheck disable=SC2086 # word splitting of the two lists is intended
    if ! python3 -m rand.sample \
      --train_file_names ${TRAIN_FILE_NAMES} \
      --train_files ${TRAIN_FILES} \
      --output_path "${SELECTED_DATA_OUTPUT_PATH}" \
      --percentage "${percent}" \
      --seed "${seed}"; then
      printf 'rand.sample failed (seed=%s, percentage=%s)\n' \
        "${seed}" "${percent}" >&2
      failed_runs=$((failed_runs + 1))
    fi
  done
done

# Deliberately a test rather than `exit`: it leaves a non-zero status behind
# when any run failed without terminating a shell that sourced this file.
[ "${failed_runs}" -eq 0 ]

