
# python plot_length_ngram.py --plot-four-metrics-grid --input /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots/qwen3-4b-base-ngram-analysis_results-train.json --output-dir /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots_train
# --plot-two-figs-count-ratio

# Run plot_length_ngram.py over the seven result JSON files listed below.
# Every input lives in the same plots directory that --output-dir points at,
# so the shared prefix is kept in a single variable.
plots_dir=/mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots

python plot_length_ngram.py \
  --inputs \
    "$plots_dir/qwen3-4b-base-ngram-analysis_results.json" \
    "$plots_dir/polaris-ngram-analysis_results.json" \
    "$plots_dir/qwen-ablation-ngram-diversity-comparison.json" \
    "$plots_dir/qwen-ablation-delta-L-ngram-diversity-comparison.json" \
    "$plots_dir/llama_analysis_results.json" \
    "$plots_dir/SFT-ngram-analysis_results.json" \
    "$plots_dir/qwen-ablation-reward-comparison.json" \
  --output-dir "$plots_dir" \
  --layout-mode '1x4' \
  --max-step 600
#  /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots/llama-ngram-analysis_results.json
# python plot_length_ngram.py --inputs /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots/gspo-6-10-ngram-analysis_results.json --output-dir /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots --layout-mode '1x4' --max-step 600 --plot-ngram-comparison --ngrams 6 10 15
# --plot-two-figs-count-ratio --plot-four-metrics-grid 

# for metric in global_count global_ratio count ratio; do
#     python plot_length_ngram.py --input /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots/qwen3-4b-base-ngram-analysis_results-train.json --diversity-metric $metric --output-dir /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots_train

#     python plot_length_ngram.py --input /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots/qwen3-4b-base-ngram-analysis_results.json --diversity-metric $metric --output-dir /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis/plots
# done