#!/usr/bin/env bash
# Copyright (c) 2026 Anonymous
# All Rights Reserved
# This codebase is provided for peer review purposes only.


# ----- #
# Basic settings
# ----- #
# Load the user's shell configuration (presumably where conda's shell
# integration is initialised -- verify for your setup), then activate the
# `moe` environment.
source "$HOME/.bashrc"
# Fail fast when activation does not succeed: the paths exported further down
# are all derived from CONDA_PREFIX, so continuing would launch the benchmark
# with a broken or unintended toolchain.
if ! conda activate moe; then
  printf 'error: could not activate conda environment "moe"\n' >&2
  exit 1
fi
# ----- #

# ----- #
# Additional settings
# ----- #
# Runtime knobs inherited by every process started from this script:
# a single OpenMP thread and tokenizer parallelism switched off
# (presumably to avoid CPU oversubscription across workers).
OMP_NUM_THREADS=1
TOKENIZERS_PARALLELISM=false
export OMP_NUM_THREADS TOKENIZERS_PARALLELISM

# ----- #
# Expose libraries and tools that were installed in the user space
# ----- #
#######################################
# Prepend a directory to LD_LIBRARY_PATH and export the result.
# When LD_LIBRARY_PATH is unset or empty, no separator is appended: a
# trailing ':' would create an empty entry, which the dynamic loader treats
# as the current working directory.
# Globals:   LD_LIBRARY_PATH (read, written, exported)
# Arguments: $1 - directory to place at the front of the search path
#######################################
prepend_ld_library_path() {
  local dir=$1
  export LD_LIBRARY_PATH="${dir}${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"
}

# GCC and G++: use the compilers shipped inside the active conda environment
export CC="${CONDA_PREFIX}/bin/x86_64-conda-linux-gnu-gcc"
export CXX="${CONDA_PREFIX}/bin/x86_64-conda-linux-gnu-g++"
# CUDA: toolkit root inside the conda environment, plus its shared libraries
export CUDA_HOME="${CONDA_PREFIX}/targets/x86_64-linux"
export CUDA_PATH="${CONDA_PREFIX}/targets/x86_64-linux"
prepend_ld_library_path "${CONDA_PREFIX}/targets/x86_64-linux/lib"
# CUDNN: rooted at the environment prefix; its lib directory ends up first
# on the library search path
export CUDNN_PATH="${CONDA_PREFIX}"
prepend_ld_library_path "${CONDA_PREFIX}/lib"
# Transformer Engine 2.5: directory holding the CUDA headers
# (see the Transformer Engine documentation)
export NVTE_CUDA_INCLUDE_PATH="${CONDA_PREFIX}/targets/x86_64-linux/include"
# ----- #

# ----- #
# Start
# ----- #
# Launch ./s41_benchmark_ep.py through torchrun in standalone mode:
# one node, four processes on that node. The script path is relative, so
# this must be run from the directory that contains the benchmark script.
launch_args=(
  --standalone
  --nnodes=1
  --nproc-per-node=4
  ./s41_benchmark_ep.py
)
torchrun "${launch_args[@]}"
# ----- #
