


# Invoke inference_API.py with model Qwen/Qwen2-72B-Instruct, a --max_length
# of 16000, and api_test_short_qwen.json as the --output_file argument.
#
# Required environment:
#   TOGETHER_API_KEY - API credential, supplied by the caller's environment
#                      (e.g. a secrets manager or an untracked env file).
#
# NOTE: an API key used to be hard-coded in this file. Treat that key as
# compromised: revoke/rotate it, and never commit credentials to the repo.

# Abort with a clear message when the key is unset or empty, instead of
# launching the run without a credential.
: "${TOGETHER_API_KEY:?TOGETHER_API_KEY must be set in the environment}"
# Re-export so the variable reaches the Python child process even when the
# caller set it as a plain (non-exported) shell variable.
export TOGETHER_API_KEY

python inference_API.py \
  --model Qwen/Qwen2-72B-Instruct \
  --max_length 16000 \
  --output_file api_test_short_qwen.json