# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-6
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-5
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-5
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-4
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-4
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-3
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-3
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 1e-2
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 5 --lr 5e-2

# # # with warmup_ratio=0.08, weight_dayc=0.01
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_name Qwen/Qwen2.5-1.5B-Instruct --selection_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_train_iter 2 --lr 1e-3 
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 1e-3 
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_name Qwen/Qwen2.5-1.5B-Instruct --selection_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_name Qwen/Qwen2.5-1.5B-Instruct --selection_model_name Qwen/Qwen2.5-1.5B-Instruct --fine_tune_model_train_iter 2 --lr 1e-4 
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 1e-4 




# # new pubmed dataset, new loss function
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6

# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method purePE --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method privSGD --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6



# # new pebmed dataset with new loss, the GTG_inv lambda is 1e-6, test new prompt
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK

# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
# # CUDA_VISIBLE_DEVICES=0 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK


# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs

# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs
# # CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomKabs


# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK

# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK
# # CUDA_VISIBLE_DEVICES=2 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopK


# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_name Qwen/Qwen2.5-3B-Instruct --selection_model_name Qwen/Qwen2.5-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs

# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # CUDA_VISIBLE_DEVICES=3 python ./baselines/text/pubmed_huggingface/main_train.py --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 3 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombination --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy TopKabs
# # # new pebmed dataset with new loss, the GTG_inv lambda is 1e-6



CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 10 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1.0 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
CUDA_VISIBLE_DEVICES=1 python ./baselines/text/pubmed_huggingface/main_train.py --task pubmed --train_priv_size small --seed 1 --dp_syn_cluster_num 0 --variation_api_fold 1 --num_synthetic_per_iter 50 --num_iter 10 --method OptGradCombinationClipNoisyRealGrad --dp_epsilon 1E9 --priv_select_ratio_per_iter 0.2 --gen_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_name meta-llama/Llama-3.2-3B-Instruct --selection_model_name meta-llama/Llama-3.2-3B-Instruct --fine_tune_model_train_iter 2 --lr 5e-4 --metric_inverse_epsilon 1E-6 --prompt_select_strategy RandomK
