# Start the sglang server (uncomment one of the launch commands below)
#CUDA_VISIBLE_DEVICES=0 python -m sglang.launch_server --model-path meta-llama/Meta-Llama-3.1-8B-Instruct --port 8000 --mem-fraction-static 0.7
#CUDA_VISIBLE_DEVICES=1 python -m sglang.launch_server --model-path Qwen/Qwen2.5-Coder-7B-Instruct --port 8000 --mem-fraction-static 0.7

# Run the benchmarks.
#
# Every setting can be overridden from the environment; with nothing set, the
# defaults reproduce the original hard-coded invocation:
#   BENCH_TASK_NAME  value for --task_name (default: P3_Test)
#   BENCH_MODEL_ID   value for --model_id  (default: meta-llama/Meta-Llama-3.1-8B-Instruct)
#   BENCH_API_KEY    value for --api_key   (default: EMPTY)
#   BENCH_API_BASE   value for --api_base  (default: http://localhost:8042/v1/)
#
# Example:
#   BENCH_TASK_NAME=GameOf24 BENCH_API_BASE=http://localhost:8000/v1/ sh <this script>
#
# NOTE(review): the default API base uses port 8042, while the server launch
# examples above pass --port 8000 -- confirm which port is intended.
run_benchmark() {
  # Arguments are quoted so overrides containing spaces or glob characters
  # reach run_benchmarks.py as single words.
  python run_benchmarks.py \
    --task_name "${BENCH_TASK_NAME:-P3_Test}" \
    --model_id "${BENCH_MODEL_ID:-meta-llama/Meta-Llama-3.1-8B-Instruct}" \
    --api_key "${BENCH_API_KEY:-EMPTY}" \
    --api_base "${BENCH_API_BASE:-http://localhost:8042/v1/}" \
    --parallel \
    --has_eval
}

run_benchmark
#python run_benchmarks.py --task_name 'GameOf24' --model_id meta-llama/Meta-Llama-3.1-8B-Instruct --api_key EMPTY --api_base http://localhost:8000/v1/ --parallel
#python run_benchmarks.py --task_name 'CheckmateInOne' --model_id meta-llama/Meta-Llama-3.1-8B-Instruct --api_key EMPTY --api_base http://localhost:8000/v1/ --parallel
#python run_benchmarks.py --task_name 'WordSorting' --model_id meta-llama/Meta-Llama-3.1-8B-Instruct --api_key EMPTY --api_base http://localhost:8000/v1/ --parallel
#python run_benchmarks.py --task_name 'Sonnet' --model_id meta-llama/Meta-Llama-3.1-8B-Instruct --api_key EMPTY --api_base http://localhost:8000/v1/ --parallel
