#!/usr/bin/env bash
# Runs fairseq-preprocess on the tokenized IWSLT14 de-en data (source: de,
# target: en) with a joined dictionary, writing the output under data-bin/.
#
# Prerequisite noted by the original author: bash prepare-iwslt14.sh
# (presumably that script produces the train/valid/test files under $TEXT --
# confirm before relying on it).
#
# All paths below are relative to the PARENT of the directory this script is
# started from, because of the `cd ..` that follows.

# Abort if the directory change fails; otherwise the relative input and output
# paths below would silently resolve against the wrong directory.
cd .. || exit 1

TEXT=data-preprocess/iwslt14.tokenized.de-en
fairseq-preprocess --source-lang de --target-lang en \
    --trainpref "$TEXT/train" --validpref "$TEXT/valid" --testpref "$TEXT/test" \
    --destdir data-bin/iwslt14.tokenized.de-en.joined.bpe \
    --joined-dictionary --bpe byte_bpe \
    --workers 20
