# Only tested on Ubuntu, does not work with Windows.
# You need to manullay define the model name in the script instead of using Environment Variables.

MODEL="meta-llama/Llama-3.2-3B"
SAVE_DIR="./checkpoints/hyperfitted_llama3.2-3B"
RESULTS_DIR="./results"
DTYPE="bfloat16"

# Create directories
mkdir -p $SAVE_DIR
mkdir -p $RESULTS_DIR

# Training command:
python src/run_experiments.py \
    --mode hyperfit \
    --model $MODEL \
    --num_samples 2000 \
    --sequence_length 256 \
    --num_epochs 260 \
    --learning_rate 1e-5 \
    --batch_size 8 \
    --save_dir $SAVE_DIR \
    --no_dataset_shuffle \
    --torch_dtype $DTYPE

# Evaluation command:
python src/run_experiments.py \
    --mode experiments \
    --original_model $MODEL \
    --hyperfitted_model ${SAVE_DIR}/final \
    --num_eval_samples 100 \
    --output_dir $RESULTS_DIR \
    --torch_dtype $DTYPE

# check the results in the `checkpoints` and `results` directories
