#!/bin/bash

# Job name and the files that receive the batch job's stdout / stderr.
# NOTE(review): the job name lacks the underscore used in the log file names
# (a307B vs a30_7B) - confirm whether that is intentional.
#SBATCH --job-name=ours_a307B
#SBATCH --output=output_ours_a30_7B.log
#SBATCH --error=error_ours_a30_7B.log

# prefill instance
# First heterogeneous-job component: account "standby", 1 task, 1 GPU,
# nodes with the "a30" feature, 15-minute time limit, 4 CPUs per task, 40G memory.
#SBATCH -A standby
#SBATCH -n 1
#SBATCH -G 1
#SBATCH -C "a30"
#SBATCH -t 0:15:00
#SBATCH -c 4
#SBATCH --mem=40G

# Separator between the components of the heterogeneous job.
#SBATCH hetjob

# chunked (decode) instance
# Second heterogeneous-job component: same resources as the first, but
# constrained to nodes with the "a100-80gb" feature.
#SBATCH -A standby
#SBATCH -n 1
#SBATCH -G 1
#SBATCH -C "a100-80gb"
#SBATCH -t 0:15:00
#SBATCH -c 4
#SBATCH --mem=40G

# Host name of the node executing this batch script; handed to the decode
# launcher below as the location of the prefill instance.
# NOTE(review): this assumes the batch script runs on the prefill (first)
# component's node - confirm against the Slurm heterogeneous job docs.
PREFILL_HOST=$(hostname)

# Job ID modulo 1000 (0-999), exported for the processes started by srun.
# NOTE(review): presumably used by the launch scripts to derive per-job port
# numbers; two jobs whose IDs differ by a multiple of 1000 get the same value.
export PORT_OFFSET=$((SLURM_JOB_ID % 1000))

# Labels exported for the launched scripts.
# NOTE(review): the decode component requests the "a100-80gb" constraint while
# DECODE_DEVICE is set to A30 - confirm this label is what the launchers expect.
export DECODE_DEVICE=A30
export MODEL_NAME=7B

# Trace every following command to stderr (ends up in the --error log).
set -x

model="Qwen/Qwen2-7B"
output_filename=ours_A30_7B.log
benchmark_name=trace

# One srun invocation with two colon-separated command lines:
#   1) launch_hetero_prefill.sh <model>
#   2) launch_hetero_decode.sh  <prefill host> <model> <output file> <benchmark>
# -l prefixes each output line with its task label.
# All expansions are quoted so each value reaches the launch scripts as exactly
# one argument, regardless of its content.
srun -l \
    bash launch_hetero_prefill.sh "$model" : \
    bash launch_hetero_decode.sh "$PREFILL_HOST" \
    "$model" "$output_filename" "$benchmark_name"

echo "Test End"
