# Optional positional arguments and the defaults used when one is omitted
# or empty:
#   $1  dataset name; used as a sub-directory of $DATA      (EUR-Lex)
#   $2  value passed to cv_split.py as --model_type         (bert)
#   $3  value passed to cv_split.py as --model_name         (bert-base-cased)
#   $4  value passed to cv_split.py as --max_seq_length     (512)
#   $5  value passed to cv_split.py as --fold               (5)
DATANAME="${1:-EUR-Lex}"
model="${2:-bert}"
model_name="${3:-bert-base-cased}"
max_seq_length="${4:-512}"
fold="${5:-5}"

# Storage roots. Two alternative layouts are kept here, labelled "sd" and
# "sa" (presumably host names -- TODO confirm). Only the "sa" pair is in
# effect; swap which pair is commented out to switch layouts.
# sd
# DATA=/data/ruohongz/data2
# RES=/data/ruohongz/XMTC/saved
# sa
DATA=/usr1/ruohongz/XMTC/data
RES=/usr1/ruohongz/XMTC/saved

# Example values for the 2nd and 3rd arguments (model, model_name):
#   xlnet,      xlnet-base-cased
#   roberta,    roberta-base
#   roberta,    distilroberta-base
#   bert,       bert-base-cased
#   distilbert, distilbert-base-cased

# Run cv_split.py on the selected dataset: input is read from
# $DATA/$DATANAME and output is written to $DATA/cv_split/$DATANAME.
# Every expansion is double-quoted so that a path or argument containing
# whitespace or glob characters reaches cv_split.py as exactly one word
# instead of being split or expanded by the shell.
python cv_split.py \
  --data_dir "$DATA/$DATANAME" --output_dir "$DATA/cv_split/$DATANAME" \
  --model_type "${model}" \
  --model_name "${model_name}" \
  --max_seq_length "$max_seq_length" \
  --fold "$fold"
# Optional flags, currently disabled. To enable one, add a trailing
# backslash after the --fold line above and append the flag(s) below it.
#--shuffle \
# --keyword --feature_name tfidf2 --overwrite --keyword_only --top_keyword -1
#--do_label \







