# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-6
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-5
# # # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-5
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-4
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-4
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-3
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-3
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-2
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-2

# # lr selection with warmup_ratio=0.08, weight_dayc=0.01, grad_accumulation_steps=1
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_name Qwen/Qwen2.5-1.5B-Instruct --selection_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_train_iter 2 --lr 1e-3 
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 1e-3 
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_name Qwen/Qwen2.5-1.5B-Instruct --selection_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 # tick, w/o gradient accumulation
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 # tick, w/o gradient accumulation
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_name Qwen/Qwen2.5-1.5B-Instruct --selection_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_train_iter 2 --lr 1e-4 
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 1e-4 



# # OptGradCombination for debug
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 6 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 200 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 

# # PE baseline
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 6 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 200 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4

# # OptGradCombination and Aug-PE for meta-llama/Llama-3.2-3B-Instruct
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1e9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1e9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4


# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 0 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 2 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 3 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 12345 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4


# ###### different seed for OptGradCombination with meta-llama/Llama-3.2-3B-Instruct ######
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 0 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 2 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 3 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 12345 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 0 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 2 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 3 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 12345 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4
# ###### different seed for OptGradCombination with meta-llama/Llama-3.2-3B-Instruct ######


###### different metric_inverse_epsilon for OptGradCombination with meta-llama/Llama-3.2-3B-Instruct ######
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-7
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-5
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-2

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-7
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-5
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-2

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-7
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-5
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-4
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-2
###### different metric_inverse_epsilon for OptGradCombination with meta-llama/Llama-3.2-3B-Instruct ######


# # new pebmed dataset with new loss, the GTG_inv lambda is 1e-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # new pebmed dataset with new loss, the GTG_inv lambda is 1e-6


# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6

# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 100 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6





# # new pebmed dataset with new loss, the GTG_inv lambda is 1e-6, test new prompt
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK


# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs

# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs


# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK

# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK


# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs

# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # new pebmed dataset with new loss, the GTG_inv lambda is 1e-6


# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 40 --method OptGradCombinationClip --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.05 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 20 --method OptGradCombinationClip --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.1 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombinationClip --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombinationClip --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.4 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 40 --method OptGradCombinationClip --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.05 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 20 --method OptGradCombinationClip --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.1 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombinationClip --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombinationClip --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.4 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK


# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 40 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.05 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 20 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.1 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.4 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 40 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.05 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 20 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.1 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.4 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK


# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK



# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method OptGradCombinationClip --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method OptGradCombinationClip --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombinationNoResidual --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombinationNoResidual --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method OptGradCombinationClipFixSample --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method OptGradCombinationClipFixSample --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.01 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3

CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method OptGradCombinationClip --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method OptGradCombinationClip --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombinationNoResidual --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3
CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size middle --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 200 --method GradCombinationNoResidual --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.01 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs --lr_scaler 0.3


