#!/bin/bash
export PYTHONPATH=$PYTHONPATH:$(pwd)

# Ensure reproducibility at system level
export PYTHONHASHSEED=42
# Critical: Enable expandable memory segments to prevent OOM errors
export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
# Commenting out thread restrictions that may cause memory issues
export GRB_NUM_THREADS=1
export OMP_NUM_THREADS=1
export MKL_NUM_THREADS=1
export NUMEXPR_NUM_THREADS=1
export OPENBLAS_NUM_THREADS=1

# Define variables
MODEL_NAME="meta-llama/Meta-Llama-3-8B"  
TASK_NAME="alpaca"
LORA_R_VALUES="0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16"
LORA_BUDGET=40000000  


  batch_size=2
  learning_rate=1.0e-04
  num_epochs=5
  weight_decay=0.08
  max_grad_norm=0.612
  max_seq_length=256
  warmup_ratio=0.044
  lora_dropout=0.069
  pruning_target_reduction=0.8
  pruning_steps=10
  importance_ema_decay=0.015
  momentum_penalty_weight=0.809
  gradient_accumulation_steps=16

RECOVERY_STEPS=100  # Recovery steps after pruning
EXTENDED_RECOVERY_STEPS=200

SEEDS=(42 777 2025)

# Loop through each seed and run the experiment
for SEED in "${SEEDS[@]}"; do
    echo "========================================"
    echo "Starting training with seed ${SEED}"
    echo "========================================"
    
    # Create unique output directory for this seed
    OUTPUT_DIR="output/${TASK_NAME}_optimal_lora_seed${SEED}_$(date +%Y%m%d_%H%M%S)"
    
    # Create output directory
    mkdir -p $OUTPUT_DIR

    # Run the training script with current seed (exact same as trial_0)
    python scripts/run_alpaca.py \
        --model_name_or_path $MODEL_NAME \
        --task_name $TASK_NAME \
        --output_dir $OUTPUT_DIR \
        --lora_r_values $LORA_R_VALUES \
        --lora_budget $LORA_BUDGET \
        --per_device_train_batch_size $batch_size \
        --per_device_eval_batch_size $batch_size \
        --gradient_accumulation_steps $gradient_accumulation_steps \
        --learning_rate $learning_rate \
        --num_train_epochs $num_epochs \
        --weight_decay $weight_decay \
        --warmup_ratio $warmup_ratio \
        --max_seq_length $max_seq_length \
        --lr_scheduler_type cosine \
        --max_grad_norm $max_grad_norm \
        --lora_dropout $lora_dropout \
        --seed $SEED \
        --overwrite_output_dir \
        --apply_pruning \
        --pruning_target_reduction $pruning_target_reduction \
        --pruning_steps $pruning_steps \
        --importance_ema_decay $importance_ema_decay \
        --momentum_penalty_weight $momentum_penalty_weight \
        --recovery_steps $RECOVERY_STEPS \
        --extended_recovery_steps $EXTENDED_RECOVERY_STEPS

    # Save final reproducibility verification
    echo "Execution completed: $(date)" >> $OUTPUT_DIR/reproducibility_info.txt
    echo "Exit code: $?" >> $OUTPUT_DIR/reproducibility_info.txt
    echo "Used seed: ${SEED}" >> $OUTPUT_DIR/reproducibility_info.txt
    
    echo "Completed training with seed ${SEED}"
    echo "========================================"
    
    # Run MT-Bench evaluation
    echo ""
    echo "========================================"
    echo "Starting MT-Bench evaluation for seed ${SEED}"
    echo "========================================"
    
    # Copy model to /tmp to avoid alpaca path issue
    MT_BENCH_MODEL_PATH="/tmp/model_for_mtbench_seed${SEED}"
    echo "Copying model to ${MT_BENCH_MODEL_PATH}..."
    rm -rf $MT_BENCH_MODEL_PATH
    cp -r $OUTPUT_DIR/final_model $MT_BENCH_MODEL_PATH
    
    # Set MT-Bench model ID
    MT_BENCH_MODEL_ID="trial_seed_${SEED}"
    
    # Change to FastChat directory
    cd /home/work/cjpark/llama3_DPlora_0.8_v3.2_v1_alpaca_v5/FastChat/fastchat/llm_judge
    
    # Set environment variables
    source /home/work/cjpark/llama3_DPlora_0.8_v3.2_v1_alpaca_v5/set_env.sh
    
    # Step 1: Generate model answers
    echo "Generating model answers..."
    python gen_model_answer.py \
        --model-path $MT_BENCH_MODEL_PATH \
        --model-id $MT_BENCH_MODEL_ID \
        --num-gpus-per-model 1 \
        --num-gpus-total 1
    
    # Step 2: Generate GPT-4 judgments
    echo "Generating GPT-4 judgments..."
    python gen_judgment.py \
        --model-list $MT_BENCH_MODEL_ID \
        --parallel 2 \
        --mode single
    
    # Step 3: Show and save results
    echo "Showing results..."
    MT_BENCH_RESULTS_DIR="/home/work/cjpark/llama3_DPlora_0.8_v3.2_v1_alpaca_v5/mt_bench_results"
    mkdir -p $MT_BENCH_RESULTS_DIR
    python show_result.py --model-list $MT_BENCH_MODEL_ID | tee $MT_BENCH_RESULTS_DIR/results_seed${SEED}_$(date +%Y%m%d_%H%M%S).txt
    
    # Copy MT-Bench result files
    cp data/mt_bench/model_answer/${MT_BENCH_MODEL_ID}.jsonl $MT_BENCH_RESULTS_DIR/model_answer_seed${SEED}_$(date +%Y%m%d_%H%M%S).jsonl
    cp data/mt_bench/model_judgment/gpt-4_single.jsonl $MT_BENCH_RESULTS_DIR/gpt4_judgment_seed${SEED}_$(date +%Y%m%d_%H%M%S).jsonl
    
    # Return to original directory
    cd /home/work/cjpark/llama3_DPlora_0.8_v3.2_v1_alpaca_v5
    
    echo "MT-Bench evaluation completed for seed ${SEED}"
    echo "========================================"
done

echo "All training runs and MT-Bench evaluations completed successfully!"