#!/bin/bash

# Launch src/hip_research/trainer/long_trainer.py on the pg19-longqa dataset
# with meta-llama/Llama-3.2-1B-Instruct, batch size 1 and a 98304-token
# sequence length.
#
# Usage: run from the directory that contains `src/` (both PYTHONPATH and the
# trainer path below are relative to the current working directory).
# Any extra command-line arguments are appended to the trainer invocation,
# e.g. `./this_script.sh --some-flag value`.
#
# Environment set for the trainer process only (prefix assignments; they always
# override whatever the caller has exported):
#   DO_EVAL=1, PRESET=default  - read by the trainer code; exact semantics are
#                                not visible here (NOTE(review): confirm).
#   WANDB_MODE=disabled        - presumably turns off Weights & Biases logging.
#   PYTHONPATH                 - makes packages under ./src/hip_research importable.
#   PYTORCH_CUDA_ALLOC_CONF    - PyTorch CUDA allocator option (expandable segments).
#   CUDA_VISIBLE_DEVICES=0     - exposes only GPU 0 to the process.

# Trainer flags are kept in an array so that individual entries can be edited
# or commented out without worrying about line-continuation backslashes (the
# previous form ended its last argument with a dangling `\`).
trainer_args=(
    --batch-size 1
    --long-ce-k 1024
    --seq-len 98304
    --use-long-ce
    --dataset pg19-longqa
    --model meta-llama/Llama-3.2-1B-Instruct
)

DO_EVAL=1 \
WANDB_MODE=disabled \
PYTHONPATH=./src/hip_research \
PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True \
PRESET=default \
CUDA_VISIBLE_DEVICES=0 \
python src/hip_research/trainer/long_trainer.py "${trainer_args[@]}" "$@"
