#!/usr/bin/env bash
# Runs inference/run_api.py on the "dev" split of ./datasets/swt_bench_lite
# with the model together_mistralai/Mixtral-8x22B-Instruct-v0.1 and writes
# results under inference_output/.
#
# All paths are relative: run this from the directory that contains
# secret.sh, inference/ and datasets/.

# Load settings from secret.sh (presumably API credentials -- confirm).
# Abort when sourcing fails (file missing, or secret.sh returns non-zero)
# instead of launching the run without them.
source secret.sh || {
  printf 'error: failed to source secret.sh\n' >&2
  exit 1
}

python3 inference/run_api.py \
  --dataset_name_or_path "./datasets/swt_bench_lite" \
  --split dev \
  --model_name_or_path together_mistralai/Mixtral-8x22B-Instruct-v0.1 \
  --output_dir inference_output \
  --max_cost 100

# Evaluation step, currently disabled. The predictions path looks like the
# file produced by the inference run above -- verify before enabling.
# python3 harness/run_evaluation.py --custom-patch --verbose --predictions_path "inference_output/Mixtral-8x22B-Instruct-v0.1__swt_bench_lite__dev.jsonl" --log_dir evaluation_output --num_processes 5
