# Runs train.py four times, one after another, with --activation_fn topk.
# Between runs only --device, --k and the k-specific --output_dir change;
# every other flag is shared and lives in run_topk below.
# Nothing in this section checks the exit status between runs, and the exit
# status after the last call is that of the last train.py invocation.

# run_topk DEVICE K
#   DEVICE  value passed to --device (e.g. cuda:0)
#   K       value passed to --k; also selects ./wic/activation_topk_<K>/ghost_grads
#           as the --output_dir
run_topk() {
    python train.py \
        --model_name_or_path gpt2-small \
        --d_in 768 \
        --device "$1" \
        --expansion_factor 32 \
        --hook_name blocks.4.hook_resid_pre \
        --hook_layer 4 \
        --batch_size 512 \
        --dataset_path pasinit/xlwic \
        --l1_coefficient 0.05 \
        --datadir \
            xlwic_en_de xlwic_en_bg xlwic_en_da xlwic_en_et \
            xlwic_en_fa xlwic_en_fr xlwic_en_hr xlwic_en_it \
            xlwic_en_ja xlwic_en_nl xlwic_en_ko xlwic_en_zh \
        --output_dir "./wic/activation_topk_$2/ghost_grads" \
        --total_training_steps 200000 \
        --activation_fn topk \
        --k "$2" \
        --use_ghost_grads
}

# (device, k) pairs, in the order the runs are executed.
run_topk cuda:0 10
run_topk cuda:1 1
run_topk cuda:1 5
run_topk cuda:1 100