
pid=$!

python -m torch.distributed.launch --nproc_per_node $1 --master_port 7094 trainer/fast_r2d2_multi_label_trainer.py \
--max_grad_norm 1 --max_batch_size $((64/$1)) --max_batch_len 1000000 --parser_lr 1e-2 \
--vocab_dir data/parser_atomspan_r2d2_4l_notie_wiki103wash_a100_60 \
--config_path data/parser_atomspan_r2d2_4l_notie_wiki103wash_a100_60/config.json \
--datasets atis --data_dir data/ATIS --epoch 20 --output_dir data/save/atis_intent_r2d2_dp_tree_4023 --log_step 10 --eval_step 30 \
--pretrain_dir data/parser_atomspan_r2d2_4l_notie_wiki103wash_a100_60 \
--task intent --num_samples 256 --sampler sequential --model_name fastr2d2_dp_tree --seed 4023

sleep 30
kill -9 $pid