#!/bin/bash

#SBATCH --job-name=disagg_a108B
#SBATCH --output=output_disagg_a10_8B.log
#SBATCH --error=error_disagg_a10_8B.log

# prefill instance
#SBATCH -A standby 
#SBATCH -n 1
#SBATCH -G 1
#SBATCH -C "a100-80gb"
#SBATCH -t 0:15:00
#SBATCH -c 4
#SBATCH --mem=40G

#SBATCH hetjob

# chunked (decode) instance
#SBATCH -A standby
#SBATCH -n 1
#SBATCH -G 1
#SBATCH -C "a10"
#SBATCH -t 0:15:00
#SBATCH -c 4
#SBATCH --mem=40G

# Run labels exported so that every process started below (including the
# launch scripts run through srun) inherits them.
# NOTE(review): how the launch scripts consume these is not visible here.
export DECODE_DEVICE=A10
export MODEL_NAME=8B

# Small per-job integer in the range 0-999 derived from the Slurm job id.
# NOTE(review): presumably added to base port numbers by the launch scripts so
# that jobs sharing a node do not collide -- confirm against those scripts.
export PORT_OFFSET=$((SLURM_JOB_ID % 1000))

# Hostname of the node executing this batch script; it is handed to the decode
# launcher as its first argument.
# NOTE(review): assumes the batch script runs on the prefill component's node.
PREFILL_HOST=$(hostname)

# Trace every following command into the job's error log.
set -x

model="meta-llama/Meta-Llama-3.1-8B-Instruct"
output_filename=disaggHL_A10_8B.log
benchmark_name=trace

# Launch both sides in a single srun; the ':' separates the two command lines.
# -l prefixes each output line with the task number. Expansions are quoted so
# each value is always passed as exactly one argument.
srun -l \
    bash launch_hetero_prefill.sh "$model" : \
    bash launch_hetero_decode_null.sh "$PREFILL_HOST" \
    "$model" "$output_filename" "$benchmark_name"
# Remember srun's status: without this the trailing echo would make the batch
# script (and therefore the Slurm job) report success even when a launcher failed.
srun_status=$?

echo "Test End"

exit "$srun_status"
