 # Seed sweep: invokes redteam_continuation.py once per seed with
 # CUDA_VISIBLE_DEVICES=0, passing a single JSON string of config overrides
 # as the only argument. Every run uses the same method.* / train.batch_size
 # values; only the seed changes, and it is also used as the last path
 # component of both the logging and the checkpoint directory.
 #
 # NOTE(review): the logging root (results/imdb_toxicity_response_1000) and
 # the checkpoint root (results/imdb) differ; both are reproduced verbatim
 # here - confirm that the mismatch is intended.
 run_tag='ppo64_kl0.001_bleu-1.0_bleuTokennltk_cossimemb-1.0_ent0.01_targdiv0.0'
 log_root='results/imdb_toxicity_response_1000'
 ckpt_root='results/imdb'

 # Seed order (1000, 3000, 2000) is kept exactly as in the original run list.
 for seed in 1000 3000 2000; do
   # printf '%s' reuses its format for every operand, so the pieces below are
   # concatenated with no separator into one JSON object string.
   overrides=$(
     printf '%s' \
       '{"method.init_kl_coef": 0.001, ' \
       '"method.bleu_reward_coef": -1.0, ' \
       '"method.cossimemb_reward_coef": -1.0, ' \
       '"method.ent_reward_coef": 0.01, ' \
       '"method.bleu_reward_grams": "[2, 3, 4, 5]", ' \
       '"method.bleu_tokenizer": "nltk", ' \
       '"method.target_sim_div_reward_coef": 0.0, ' \
       "\"train.logging_dir\": \"${log_root}/${run_tag}/${seed}\", " \
       '"train.batch_size": 64, ' \
       "\"train.checkpoint_dir\": \"${ckpt_root}/${run_tag}/${seed}\", " \
       "\"train.seed\": ${seed}}"
   )

   # A failing run does not stop the sweep; the next seed still executes,
   # matching the behaviour of the original independent command lines.
   CUDA_VISIBLE_DEVICES=0 python3 redteam_continuation.py "$overrides"
 done