# Launches one background training run via train.py and logs its output under
# checkpoints/<run name>/training.log. Run from the directory that contains
# train.py and data-bin/ (both are referenced by relative path).

# Dataset directory name under data-bin/; uncomment one alternative to switch.
DATASET=iwslt14
#DATASET=multi30k.tokenized.de-en
#DATASET=iwslt15-en-vi
SEED=5555
MODEL=transformer_iwslt_de_en
CRITERION=self_ls_entropy
# GPU index exposed to the training process through CUDA_VISIBLE_DEVICES.
WHICH_CUDA=1
# Run name: shared by the checkpoint directory and the tensorboard log directory.
SAVE=${DATASET}_${CRITERION}_${SEED}

# -p creates the parent checkpoints/ directory when it is missing and does not
# fail when the run directory already exists (e.g. when re-launching a run).
# Abort if the directory cannot be created: the log redirection below needs it.
mkdir -p "checkpoints/$SAVE" || exit 1

# nohup + '&' keep the job running in the background after the shell exits.
# stderr is merged into the log (2>&1) so error output is captured even when
# the script is started without a terminal attached.
CUDA_VISIBLE_DEVICES="$WHICH_CUDA" nohup python train.py "data-bin/$DATASET" \
  --arch "$MODEL" \
  --share-decoder-input-output-embed \
  --optimizer adam --adam-betas '(0.9, 0.98)' --clip-norm 0.0 \
  --lr-scheduler inverse_sqrt --warmup-updates 4000 --lr 5e-4 \
  --dropout 0.3 --weight-decay 0.0001 \
  --criterion "$CRITERION" \
  --max-tokens 4096 \
  --seed "${SEED}" \
  --save-dir "checkpoints/$SAVE" \
  --eval-bleu --eval-bleu-remove-bpe --eval-bleu-detok moses \
  --maximize-best-checkpoint-metric --best-checkpoint-metric bleu \
  --fp16 --no-epoch-checkpoints \
  --tensorboard-logdir "tb/$SAVE" \
  > "checkpoints/$SAVE/training.log" 2>&1 &
