#!/bin/bash
cd "$(dirname "$0")" || exit 1
cd ..

export PYTHONPATH=.:${PYTHONPATH}

REPORT_DIR="${REPORT_DIR:-reports}"
mkdir -p ${REPORT_DIR}

REASON="${REASON:-}"


MODEL_CHATGPT4="gpt4"
MODEL_CHATGPT5="gpt5"
MODEL_GEMINI="gemini"

if [ $# -ne 6 ] && [ $# -ne 7 ]; then
  echo "Usage: $0 TEST_SET MODEL_TYPE SRC_PATH DATA_INPUT_PATH DATA_OUTPUT_PATH INPUT_FILES [--reset]"
  echo "MODEL_TYPE is one of: ${MODEL_CHATGPT}, ${MODEL_GEMINI}"
  exit 1
fi

TEST_SET=$1
MODEL_TYPE=$2
SRC_PATH=$3
DATA_INPUT_PATH=$4
DATA_OUTPUT_PATH=$5
INPUT_FILES=$6

export reason=""

if [ "${MODEL_TYPE}" = "${MODEL_CHATGPT4}" ] || [ "${MODEL_TYPE}" = "${MODEL_CHATGPT5}" ]; then
  if [ "${MODEL_TYPE}" = "${MODEL_CHATGPT4}" ]; then
    model_name="gpt-4o-2024-11-20"
  else
    model_name="gpt-5-2025-08-07"
    if [ ! -z "$REASON" ]; then
      echo "Using reasoning: $REASON"
      export reason=".${REASON}"
    fi
  fi

  one_step_script="scrape_openai.py"
  two_step_script="scrape_openai_2step.py"

  if [ -z "$OPENAI_API_KEY" ]
  then
    echo "OPENAI_API_KEY not set in env"
    exit 1
  fi
elif [ "${MODEL_TYPE}" = "${MODEL_GEMINI}" ]; then
  one_step_script="scrape_gemini.py"
  two_step_script="scrape_gemini_2step.py"
  model_name="gemini-2.5-flash"

  if [ -z "$GOOGLE_CLOUD_LOCATION" ]
  then
    echo "GOOGLE_CLOUD_LOCATION not set in env"
    exit 1
  fi

  if [ -z "$GOOGLE_CLOUD_PROJECT" ]
  then
    echo "GOOGLE_CLOUD_PROJECT not set in env"
    exit 1
  fi
  export GOOGLE_GENAI_USE_VERTEXAI=True
else
  echo "Invalid model type: ${MODEL_TYPE}. Valid model types are: ${MODEL_CHATGPT4}, ${MODEL_CHATGPT5}, ${MODEL_GEMINI}"
  exit 1
fi

IFS=',' read -ra files <<< "${INPUT_FILES}"
suffix=0
for file in "${files[@]}"; do
  echo "===Processing ${DATA_INPUT_PATH}/${file}==="
  if [ $# -eq 7 ] && [ "$7" = "--reset" ];
  then
    echo "===Delete existing results==="
    rm ${DATA_OUTPUT_PATH}/${file}.${model_name}${reason}
    rm ${DATA_OUTPUT_PATH}/${file}.${model_name}${reason}.log

    rm ${DATA_OUTPUT_PATH}/${file}.${model_name}_tep${reason}
    rm ${DATA_OUTPUT_PATH}/${file}.${model_name}_tep${reason}.log
  fi

  echo "===Strict API generation==="

  python3 ${SRC_PATH}/${one_step_script} --input_files ${DATA_INPUT_PATH}/${file} \
    --output_dir ${DATA_OUTPUT_PATH} --model_name ${model_name} --output_file_suffix ${model_name}${reason}

  echo "===Strict api generation done==="

  echo "===Template based api generation==="

  python3 ${SRC_PATH}/${one_step_script} --input_files ${DATA_INPUT_PATH}/${file} \
    --output_dir ${DATA_OUTPUT_PATH} --output_file_suffix ${model_name}_tep${reason} \
    --prompt_function get_prompt_for_template_summarize --model_name ${model_name}
  python3 ${SRC_PATH}/template_to_json.py --input_file ${DATA_OUTPUT_PATH}/${file}.${model_name}_tep${reason} \
      --output_file ${DATA_OUTPUT_PATH}/${file}.${model_name}_tep.api${reason}

  echo "===Template based api generation done==="

  echo "===Generating report==="

  python3 ${SRC_PATH}/gen_sbs.py --truth_file ${DATA_INPUT_PATH}/${file} \
    --prediction_file_control ${DATA_OUTPUT_PATH}/${file}.${model_name}${reason} \
    --prediction_file_treatment ${DATA_OUTPUT_PATH}/${file}.${model_name}_tep.api${reason} \
    --output_report ${REPORT_DIR}/report-${TEST_SET}${suffix}-${MODEL_TYPE}${reason}-strict_vs_template.tsv \
    --output_summary ${REPORT_DIR}/summary-${TEST_SET}${suffix}-${MODEL_TYPE}${reason}-strict_vs_template.tsv

  suffix=`expr ${suffix} + 1`
  echo "===Report done==="
done