#!/bin/bash


# Hugging Face cache root. Built from $HOME rather than "~" because the shell
# does not perform tilde expansion inside double quotes; a quoted "~" would be
# exported as a literal character instead of the home directory.
export HF_HOME="${HOME}/autodl-tmp/data/huggingface"

# NCCL transport switches: turn off the GPU peer-to-peer and InfiniBand
# transports.
# NOTE(review): presumably a workaround for this host's interconnect — confirm.
export NCCL_P2P_DISABLE='1'
export NCCL_IB_DISABLE='1'

# Make GPUs 0-7 visible to the job: eight devices for the eight worker
# processes requested via --nproc_per_node below.
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

# Start the training script with 8 processes on this node, using port 29502
# for the rendezvous master. The script path is relative, so run this launcher
# from the directory that contains the training script.
torchrun \
    --nproc_per_node=8 \
    --master_port=29502 \
    gpt2_distributed_train_from_scratch.py