# Seed sweep: fine-tune gpt2 on wikitext (wikitext-103-raw-v1) with --reg 5,
# once per seed in {0, 1, 2}. The runs execute sequentially, each with
# CUDA_VISIBLE_DEVICES=3 in its environment, and each writes to its own
# per-seed output directory. No error checking is done between runs here, so
# a failed seed does not prevent the following seeds from starting.
#
# NOTE(review): the output directory name contains "lr1em4", but no
# learning-rate flag is passed below -- presumably this relies on the
# training script's default; confirm against run_clm_no_trainer.py.
for seed in 0 1 2; do
  CUDA_VISIBLE_DEVICES=3 python -u run_clm_no_trainer.py \
    --per_device_train_batch_size 8 \
    --dataset_name wikitext \
    --dataset_config_name wikitext-103-raw-v1 \
    --model_name_or_path gpt2 \
    --seed "${seed}" \
    --output_dir "./experiments/gpt2_lr1em4_reg5_seed${seed}/wikitext-103" \
    --reg 5
done