# Launch custom/gpt2/run_gpt2_sg.py with only CUDA device 5 visible to the
# process (CUDA_VISIBLE_DEVICES is set for this one command only).
#
# The invocation passes `--mode eval-both` with `--eval-split test`, points
# `--model-load-dir` at ./checkpoint/train/sg/ and `--output-dir` at
# ./checkpoint/output/sg.
# NOTE(review): the exact meaning of each flag is defined by run_gpt2_sg.py,
# which is not visible from this script -- confirm there before changing values.
#
# Optional flags, currently disabled:
#   --top-p 0
#   --top-k 1
# To enable one, add a trailing backslash to the last argument line below and
# append the flag on a new line after it. Do not leave commented-out flags
# inside the continued command: a backslash at the end of a comment does not
# continue the line, so anything after such a comment is silently dropped
# from the command (and shells without comment support would instead pass the
# `#` and the flag as literal arguments).
CUDA_VISIBLE_DEVICES=5 python custom/gpt2/run_gpt2_sg.py \
  --data-base ./data-bin/wikitext-103-bpe_v0 \
  --output-dir ./checkpoint/output/sg \
  --eval-split test \
  --model-load-dir ./checkpoint/train/sg/ \
  --mode eval-both \
  --sequence-tune-rate 0.0
