#!/bin/sh
# Starts llama_pretraining_c4.py under torchrun (single node, 8 processes) as a
# background job detached from the terminal. Stdout and stderr of the job are
# written to one log file under ./logs; checkpoints go to the --save_dir path.

# Endpoint used for Hugging Face Hub requests (a mirror instead of the default).
export HF_ENDPOINT=https://hf-mirror.com
# Expose GPUs 0-7 to the job; the count matches --nproc_per_node below.
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

log_dir=./logs
log_file="${log_dir}/1b_block_compress_6,6,0.333.log"

# The output redirection below fails (and torchrun never starts) when the log
# directory is missing, so create it up front and stop if that is impossible.
mkdir -p "${log_dir}" || exit 1

# NOTE(review): --batch_size 32 x 8 processes = 256, which is larger than
# --total_batch_size 64 -- confirm how llama_pretraining_c4.py reconciles the
# two (e.g. when deriving gradient accumulation) before relying on these values.
#
# nohup + trailing '&': the job keeps running after this shell exits.
# '2>&1' folds stderr into the same log file as stdout.
nohup torchrun --standalone --nproc_per_node 8 llama_pretraining_c4.py \
    --lr 0.001 \
    --batch_size 32 \
    --total_batch_size 64 \
    --max_length 256 \
    --num_training_steps 100000 \
    --warmup 10000 \
    --save_dir checkpoints/llama_1b \
    --save_freq 10000 \
    > "${log_file}" 2>&1 &

