# Launch pretraining.py with the hyperparameters listed below.
#
# Both the script (pretraining.py) and the data directory (pretrain_data) are
# given as relative paths, so run this from the directory that contains them.
#
# NOTE(review): --device 0 presumably selects the first GPU, and
# --finetune_negative_sample_size -1 presumably means "no limit"; confirm
# against the argument parser in pretraining.py.
#
# Maintenance: every argument line except the LAST must end with a backslash.
# A trailing backslash on the last line would splice whatever follows in this
# file into the command as extra arguments.
python pretraining.py \
    --data_path pretrain_data \
    --num_train_epochs 8 \
    --warmup_predictor_epochs 2 \
    --batch_size 32 \
    --device 0 \
    --fp16 \
    --learning_rate 5e-5 \
    --warmup_predictor \
    --fix_word_embedding \
    --finetune_negative_sample_size -1 \
    --model_name_or_path allenai/longformer-base-4096 \
    --gradient_accumulation_steps 8 \
    --preprocessing_num_workers 2 \
    --dataloader_num_workers 2 \
    --temp 0.05