#!/bin/bash

set -e

source /nlp/scr/anonymous/miniconda3/etc/profile.d/conda.sh
conda activate buggen
cd /nlp/scr/anonymous/projects/attacker_solver

# config 
TRAIN=false

MODEL_NAME="Qwen/Qwen2.5-Coder-7B-Instruct"
DATASET="kodcode-complete"
SPLITS_FILE="data/splits/kodcode_complete_splits_10.json" 
NUM_MUTATOR_ITERS=2
NUM_SOLVER_ITERS=2

export HF_ENTITY=anonymous
HF_REPO_NAME="kodcode_qwen7b_att_mini"
DATA_SAVE_DIR="data/mutations/${HF_REPO_NAME}"
MODEL_SAVE_DIR="outputs/${HF_REPO_NAME}"

export VLLM_WORKER_MULTIPROC_METHOD=spawn

# print time 
TOTAL_START_TIME=$(date +%s)

echo "Generating mutations and solver results for ${DATASET}: ${NUM_MUTATOR_ITERS} mutations and ${NUM_SOLVER_ITERS} solves"

PT1_START_TIME=$(date +%s)

python scripts/generate_data.py \
    --mode generate \
    --model_name ${MODEL_NAME} \
    --dataset ${DATASET} \
    --splits_file ${SPLITS_FILE} \
    --max_new_tokens 2048 \
    --max_model_len 2048 \
    --attacker_temperature 0.7 \
    --solver_temperature 0.7 \
    --num_mutator_iters ${NUM_MUTATOR_ITERS} \
    --num_solver_iters ${NUM_SOLVER_ITERS} \
    --gpu_memory_utilization 0.7 \
    --save_dir ${DATA_SAVE_DIR} \
    --enforce_eager \
    --seed 1

PT1_END_TIME=$(date +%s)
GEN_TIME=$((PT1_END_TIME - PT1_START_TIME))
echo "Time taken for generation: ${GEN_TIME} seconds"



echo "Verifying mutations and solutions..."

PT2_START_TIME=$(date +%s)

python scripts/generate_data.py \
    --mode validate \
    --model_name ${MODEL_NAME} \
    --dataset ${DATASET} \
    --splits_file ${SPLITS_FILE} \
    --mutations_path ${DATA_SAVE_DIR}/mutations.json \
    --solver_results_path ${DATA_SAVE_DIR}/solver_results.json \
    --save_path ${DATA_SAVE_DIR}/validated \
    --hf_repo_name ${HF_REPO_NAME} \
    --push_to_hub \
    --seed 1

PT2_END_TIME=$(date +%s)
VAL_TIME=$((PT2_END_TIME - PT2_START_TIME))
echo "Time taken for validation: ${VAL_TIME} seconds"

TOTAL_END_TIME=$(date +%s)
TOTAL_TIME=$((TOTAL_END_TIME - TOTAL_START_TIME))
echo "Total time taken: ${TOTAL_TIME} seconds"
