# ---------------------------------------------------------------------------
# Shared environment for every stage below. Individual stages re-export the
# experiment switches they care about, so the values here act as defaults.
# ---------------------------------------------------------------------------

# Communication / CUDA runtime knobs.
# NOTE(review): NCCL_CACHE_DISABLE, NCCL_P2P_TIMEOUT, NCCL_TIMEOUT and
# NCCL_P2P_DEBUG could not be matched to NVIDIA's documented NCCL variables --
# confirm that something actually reads them.
export NCCL_CACHE_DISABLE=0 NCCL_P2P_DISABLE=0
export NCCL_P2P_TIMEOUT=1800000 NCCL_TIMEOUT=1800000
export NCCL_P2P_DEBUG=1 NCCL_DEBUG=INFO
export NCCL_P2P_LEVEL=NVL
export DEVICE_TYPE=Nvidia
# NOTE(review): CUDA_LAUNCH_BLOCKING=1 is normally a debugging aid; confirm it
# is intended for these runs.
export CUDA_LAUNCH_BLOCKING=1

# Experiment switches, all off by default; each stage turns on what it needs.
export TIMESTEP_ALIGNMENT=0 EVAL_ERTACACHE=0
export CALIBRATE=0 CACHE_ADJUST=0

# Remaining parameters consumed by the Python side.
# NOTE(review): their exact meaning is not visible from this script.
export DATA_TEST=20
export CALIBRATE_REL_L1_THRESH=0.12
export SKIP_LIST_EVEN="[12, 16, 20, 22, 26, 28, 30, 34, 36, 38, 42, 44, 46, 50, 52, 54, 58, 60, 62, 66, 68, 72, 74, 78, 82, 86]"


#### original
# Baseline stage: runs ertacache_wan.py with EVAL_ERTACACHE and
# TIMESTEP_ALIGNMENT both off and writes to ./sample/original.
# CACHE_ADJUST is not set here; it keeps whatever value is already exported.
# NOTE(review): SAVE_ERROR=1 presumably makes the run dump the tensors that the
# adjust stage later reads from ./sample/original/tensor -- confirm in
# ertacache_wan.py.
export EVAL_ERTACACHE=0
export TIMESTEP_ALIGNMENT=0
export OUTPUT_DIR="./sample/original"
export SAVE_ERROR=1
# The size is quoted so the `*` is always passed literally; unquoted, the shell
# would expand it if a file matching 832*480 existed in the working directory.
CUDA_VISIBLE_DEVICES=0 python3 ertacache_wan.py \
  --task t2v-1.3B \
  --size '832*480' \
  --ckpt_dir Wan-AI/Wan2.1-T2V-1.3B \
  --offload_model True \
  --t5_cpu




#### ertacache only
# Stage with EVAL_ERTACACHE on, but TIMESTEP_ALIGNMENT and CACHE_ADJUST off.
# NOTE(review): this is the only stage whose OUTPUT_DIR sits under
# ./sample/test_unpc/ -- confirm that is intentional.
export CACHE_ADJUST=0
export EVAL_ERTACACHE=1
export TIMESTEP_ALIGNMENT=0
export OUTPUT_DIR="./sample/test_unpc/ertacache_only_unpc"
export SAVE_ERROR=0
# The size is quoted so the `*` is always passed literally; unquoted, the shell
# would expand it if a file matching 832*480 existed in the working directory.
CUDA_VISIBLE_DEVICES=0 python3 ertacache_wan.py \
  --task t2v-1.3B \
  --size '832*480' \
  --ckpt_dir Wan-AI/Wan2.1-T2V-1.3B \
  --offload_model True \
  --t5_cpu




##### ertacache +timealign
# Stage with EVAL_ERTACACHE and TIMESTEP_ALIGNMENT on, CACHE_ADJUST off.
# NOTE(review): SAVE_ERROR=1 presumably makes the run dump the tensors that the
# adjust stage later reads from
# ./sample/ertacache_timealign_unpc/ertacache_tensor -- confirm in
# ertacache_wan.py.
export CACHE_ADJUST=0
export EVAL_ERTACACHE=1
export TIMESTEP_ALIGNMENT=1
export OUTPUT_DIR="./sample/ertacache_timealign_unpc"
export SAVE_ERROR=1
# The size is quoted so the `*` is always passed literally; unquoted, the shell
# would expand it if a file matching 832*480 existed in the working directory.
CUDA_VISIBLE_DEVICES=0 python3 ertacache_wan.py \
  --task t2v-1.3B \
  --size '832*480' \
  --ckpt_dir Wan-AI/Wan2.1-T2V-1.3B \
  --offload_model True \
  --t5_cpu




###### ertacache +timealign + adjust
# Two steps:
#   1. Run adjust_data_analysis.py with DATA_FOLDER_ORI / DATA_FOLDER_CACHE
#      pointing at tensor folders under the "original" and
#      "ertacache +timealign" output directories.
#   2. Re-run generation with CACHE_ADJUST=1 and ADJUST_FOLDER set to the
#      timealign output directory.
# The remaining exports are deliberately left after the analysis call so the
# analysis script sees the same environment it did before this edit.
export EVAL_ERTACACHE=1
export DATA_FOLDER_ORI="./sample/original/tensor"
export DATA_FOLDER_CACHE="./sample/ertacache_timealign_unpc/ertacache_tensor"
# The original path was "..adjust_utils/adjust_data_analysis.py", which lacks a
# path separator and would only resolve to a directory literally named
# "..adjust_utils".
# NOTE(review): assumes adjust_utils/ lives one level above the working
# directory -- switch to ./adjust_utils/ if it is a sibling of this script.
python3 ../adjust_utils/adjust_data_analysis.py
export ADJUST_FOLDER="./sample/ertacache_timealign_unpc"
export CACHE_ADJUST=1
export TIMESTEP_ALIGNMENT=1
export OUTPUT_DIR="./sample/ertacache_timealign_adjust_unpc"
export SAVE_ERROR=0
# The size is quoted so the `*` is always passed literally; unquoted, the shell
# would expand it if a file matching 832*480 existed in the working directory.
CUDA_VISIBLE_DEVICES=0 python3 ertacache_wan.py \
  --task t2v-1.3B \
  --size '832*480' \
  --ckpt_dir Wan-AI/Wan2.1-T2V-1.3B \
  --offload_model True \
  --t5_cpu


