 # Three sequential runs of redteam_continuation.py, each pinned to GPU 0 via
 # CUDA_VISIBLE_DEVICES. The runs differ only in the seed (3000, 2000, 1000),
 # which also names the last component of the logging and checkpoint
 # directories; every other override is identical.
 #
 # The overrides are passed as ONE single-quoted JSON argument. The space
 # between the script name and the opening quote is required: the shell joins
 # adjacent unquoted and quoted text into a single word, so without it python3
 # is handed a non-existent file name made of the script path plus the JSON.
 # Presumably the script parses this JSON from its first positional argument
 # -- TODO confirm against redteam_continuation.py.
 #
 # NOTE(review): train.logging_dir lives under results/imdb/ while
 # train.checkpoint_dir lives under results/imdb_toxicity_response_1000/ --
 # confirm this split is intentional.
 CUDA_VISIBLE_DEVICES=0 python3 redteam_continuation.py '{"method.init_kl_coef": 0.001, "method.bleu_reward_coef": 0.0, "method.cossimemb_reward_coef": 0.0, "method.ent_reward_coef": 0.0, "method.bleu_reward_grams": "[2, 3, 4, 5]", "method.bleu_tokenizer": "nltk", "method.target_sim_div_reward_coef": 1.0, "train.logging_dir": "results/imdb/ppo64_kl0.001_bleu0.0_bleuTokennltk_cossimemb0.0_ent0.0_targdiv1.0/3000", "train.batch_size": 64, "train.checkpoint_dir": "results/imdb_toxicity_response_1000/ppo64_kl0.001_bleu0.0_bleuTokennltk_cossimemb0.0_ent0.0_targdiv1.0/3000", "train.seed": 3000}'
 CUDA_VISIBLE_DEVICES=0 python3 redteam_continuation.py '{"method.init_kl_coef": 0.001, "method.bleu_reward_coef": 0.0, "method.cossimemb_reward_coef": 0.0, "method.ent_reward_coef": 0.0, "method.bleu_reward_grams": "[2, 3, 4, 5]", "method.bleu_tokenizer": "nltk", "method.target_sim_div_reward_coef": 1.0, "train.logging_dir": "results/imdb/ppo64_kl0.001_bleu0.0_bleuTokennltk_cossimemb0.0_ent0.0_targdiv1.0/2000", "train.batch_size": 64, "train.checkpoint_dir": "results/imdb_toxicity_response_1000/ppo64_kl0.001_bleu0.0_bleuTokennltk_cossimemb0.0_ent0.0_targdiv1.0/2000", "train.seed": 2000}'
 CUDA_VISIBLE_DEVICES=0 python3 redteam_continuation.py '{"method.init_kl_coef": 0.001, "method.bleu_reward_coef": 0.0, "method.cossimemb_reward_coef": 0.0, "method.ent_reward_coef": 0.0, "method.bleu_reward_grams": "[2, 3, 4, 5]", "method.bleu_tokenizer": "nltk", "method.target_sim_div_reward_coef": 1.0, "train.logging_dir": "results/imdb/ppo64_kl0.001_bleu0.0_bleuTokennltk_cossimemb0.0_ent0.0_targdiv1.0/1000", "train.batch_size": 64, "train.checkpoint_dir": "results/imdb_toxicity_response_1000/ppo64_kl0.001_bleu0.0_bleuTokennltk_cossimemb0.0_ent0.0_targdiv1.0/1000", "train.seed": 1000}'