#!/bin/bash

#SBATCH --job-name=ours_a308B
#SBATCH --output=output_ours_a30_8B.log
#SBATCH --error=error_ours_a30_8B.log

# prefill instance
#SBATCH -A standby
#SBATCH -n 1
#SBATCH -G 1
#SBATCH -C "a30"
#SBATCH -t 0:15:00
#SBATCH -c 4
#SBATCH --mem=40G

#SBATCH hetjob

# chunked (decode) instance
#SBATCH -A standby 
#SBATCH -n 1
#SBATCH -G 1
#SBATCH -C "a100-80gb"
#SBATCH -t 0:15:00
#SBATCH -c 4
#SBATCH --mem=40G


# ---------------------------------------------------------------------------
# Driver for the two-component heterogeneous job declared above.
# Starts launch_hetero_prefill.sh and launch_hetero_decode.sh with a single
# srun invocation (components separated by ':') and exits with srun's status
# so that a failed launch is not reported as a successful job.
# ---------------------------------------------------------------------------

# Hostname of the node running this batch script; handed to the decode
# launcher as its first argument.
PREFILL_HOST=$(hostname)

# Exported so the launch scripts started by srun can read them.
# NOTE(review): DECODE_DEVICE is A30, yet the component labelled "decode" in
# the #SBATCH directives requests "a100-80gb" while the prefill component
# requests "a30" -- confirm which value the launch scripts expect.
export DECODE_DEVICE=A30
export MODEL_NAME=8B

# Last three digits of the job id (0-999); presumably consumed by the launch
# scripts to pick per-job ports -- verify against those scripts.
export PORT_OFFSET=$((SLURM_JOB_ID%1000))

# Trace every following command into the job's error log.
set -x

model="meta-llama/Meta-Llama-3.1-8B-Instruct"
output_filename=ours_A30_8B.log
benchmark_name=trace

# -l prefixes each output line with its task label. Expansions are quoted so
# each value reaches the launcher as exactly one argument. The status is
# captured instead of dropped so it can be propagated after the end marker.
srun_status=0
srun -l \
    bash launch_hetero_prefill.sh "$model" : \
    bash launch_hetero_decode.sh "$PREFILL_HOST" \
    "$model" "$output_filename" "$benchmark_name" || srun_status=$?

echo "Test End"

# Without this, the echo above would make the job always exit 0.
exit "$srun_status"
