#!/bin/bash

# 在远程服务器上运行重复率分析脚本
# Activate the `verl041-test` conda environment. Abort on failure so the
# analysis is never launched with whatever python3 happens to be on PATH.
# (Strict `set -u` is deliberately not enabled before this line; activation
# scripts may reference unset variables.)
source /mnt/shared-storage-user/p1-shared/wangfuting/miniconda3/bin/activate verl041-test || {
  echo "错误: 无法激活 conda 环境 verl041-test" >&2
  exit 1
}

# analysis_repetition_penalty.py is invoked by relative name further down, so
# the script must not continue if the working directory could not be changed.
cd /mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis || {
  echo "错误: 无法进入目录 eval_scripts/analysis" >&2
  exit 1
}
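# Experiment directories. Only the uncommented assignment is used; the commented-out lines are earlier candidates.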
# DIR1="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/add1k-remove-upper-dapo-math-17k/valid"
# DIR1="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/dapo-add1k-remove-upper-refined-repetition-penalty-max9k/valid"
# DIR1="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/skip-right-skip-limits10-gspo-dapo-math-add2k/valid"
# DIR2="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/skip-right-skip-limits10-gspo-dapo-math-wo-repetition/valid"
# DIR1="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/skip-right-distinct-hard-gspo-dapo-math/valid"
# DIR1="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/gspo_repetition/valid_8k"
# DIR2="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/skip-right-distinct_bonus-gspo-dapo-math/valid_8k"
# DIR1=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/skip-right-skip-limits10-gspo-dapo-math-wo-repetition-redo/valid_8k
# DIR1=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/skip-right-skip-limits10-gspo-dapo-math-add1k5/valid_8k
# DIR2=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/ours-gspo-dapo-math-add8k5/valid_8k
# DIR3=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/ours-gspo-dapo-math-add1k-fixed/valid_8k
# DIR4=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/ours-gspo-dapo-math-add600/valid_8k
# # (Stale label "output chart path": OUTPUT is assigned after the directory list.)
# DIR1=/mnt/shared-storage-gpfs2/p1-shared-2/wangfuting/LIE/models/verl-qwen3-4b-oct/beta0.3/valid_8k
# DIR2=/mnt/shared-storage-gpfs2/p1-shared-2/wangfuting/LIE/models/verl-qwen3-4b-oct/8k5/valid_8k
# DIR1=/mnt/shared-storage-gpfs2/p1-shared-2/wangfuting/LIE/models/verl-qwen3-4b-oct/cosine/valid_8k
# DIR1=/mnt/shared-storage-gpfs2/p1-shared-2/wangfuting/LIE/models/verl-qwen3-4b-oct/sft-gspo-ours-dapo-math-max12k/valid_8k
# DIR2=/mnt/shared-storage-gpfs2/p1-shared-2/wangfuting/LIE/models/verl-qwen3-4b-oct/sft4k-gspo-dapo-math-minibsz32-max12k/valid_8k
# Directory handed to the analysis script through its -d option.
DIR3='/mnt/shared-storage-gpfs2/p1-shared-2/wangfuting/LIE/models/verl-qwen3-4b-oct/gspo_repetition/valid_8k'
# Path handed to the analysis script through its -o option.
OUTPUT='/mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis_mar/results/gspo-repetition.png'
# OUTPUT="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-4b-oct/repetition_comparison_w5.png"

# python3 analysis_repetition_penalty.py \
#   -p "*_16384.jsonl" \
#   -s \
#   -o "$OUTPUT" \
#   --dir "$DIR1" \
#   --ngram-sizes 3 5 \
#   --divergence-method js \
#   --plot-entropies

# File passed to --save-data. Kept in a variable so the completion message
# below can report exactly the path that was given to the script.
SAVE_DATA="/mnt/shared-storage-user/p1-shared/wangfuting/codes/project_tts_extrapolation/eval_scripts/analysis_mar/results/gspo-repetition-analysis_results.json"

# Run the repetition analysis on DIR3. All options are forwarded verbatim to
# analysis_repetition_penalty.py; see that script for their exact meaning.
# The exit status is checked so a failed run is never reported as success.
if python3 analysis_repetition_penalty.py \
  -d "$DIR3" \
  --save-data "$SAVE_DATA" \
  -p "*_16384.jsonl" \
  -s \
  -o "$OUTPUT" \
  -w 10 \
  --compute-ngrams \
  --compute-sentence-diversity \
  --no-plot \
  --tokenizer "/mnt/shared-storage-user/p1-shared/Qwen/Qwen3-4B-Base"
then
  # NOTE(review): --no-plot is passed, so presumably no chart is written to
  # $OUTPUT -- confirm against the analysis script. The message therefore
  # reports the --save-data file instead of claiming a chart was saved.
  echo "分析完成！结果数据已保存到: $SAVE_DATA"
else
  status=$?
  echo "分析失败（退出码: $status）" >&2
  exit "$status"
fi

# python3 analysis_repetition_penalty.py \
#   -d "$DIR1" \
#   -d "$DIR2" \
#   -p "*_16384.jsonl" \
#   -s \
#   -o "$OUTPUT" \