# source secret.sh
# for i in 1 2 3 4 5
# do
#  python3 inference/run_api.py --dataset_name_or_path "datasets/swt_bench_lite_aug1_bm25_27k_cl100k" --split test --model_name_or_path ollama_llama3-gradient:70b --output_dir inference_output --max_cost 100 --model_args "seed=$i,temperature=0.7,max_tokens=2000" &
# done
# wait
# Run the evaluation harness once per seed (1 through 5), one run after
# another (no backgrounding). The seed number is embedded in the name of the
# predictions file read from inference_output/; logs go to evaluation_output/.
# NOTE(review): the predictions files are presumably the ones written by the
# commented-out inference step above -- confirm they exist before running.
for i in 1 2 3 4 5; do
  python3 harness/run_evaluation.py \
    --custom-patch \
    --verbose \
    --predictions_path "inference_output/ollama_llama3-gradient:70b__swt_bench_lite_aug1_bm25_27k_cl100k__seed=${i},temperature=0.7,max_tokens=2000__test.jsonl" \
    --log_dir evaluation_output \
    --num_processes 20 \
    --swe_bench_tasks test
done
