# Launch a background `llamafactory-cli train` run in prediction mode
# (--do_predict / --predict_with_generate) using the Qwen2.5-0.5B-Instruct base
# model plus the LoRA adapter under ckps/ov_o1_15_balanced_lrsw/.
#
# - path_prefix is prepended to the model, adapter and dataset directories.
#   While it is empty, those paths expand to "/Qwen2.5-0.5B-Instruct",
#   "/ckps/..." and "/data", i.e. they resolve from the filesystem root;
#   set it to the directory that actually holds them.
# - CUDA_VISIBLE_DEVICES=7 is exported only into this one command.
# - The job is started under nohup and backgrounded with `&`; stdout and
#   stderr both go to ./0206qwen05b-ov_lrsw.log.
#
# Every "${path_prefix}" expansion is double-quoted so that a prefix containing
# spaces or glob characters is still passed as a single argument.
path_prefix=""
CUDA_VISIBLE_DEVICES=7 nohup llamafactory-cli train \
    --stage sft \
    --do_predict true \
    --model_name_or_path "${path_prefix}/Qwen2.5-0.5B-Instruct" \
    --adapter_name_or_path "${path_prefix}/ckps/ov_o1_15_balanced_lrsw/" \
    --eval_dataset ov_o1_gsm_test_lrsw \
    --dataset_dir "${path_prefix}/data" \
    --overwrite_cache true \
    --preprocessing_num_workers 16 \
    --template qwen \
    --finetuning_type lora \
    --output_dir ./sft/qwen05b-ov-o1-balanced_lrsw_gsm \
    --overwrite_output_dir true \
    --per_device_eval_batch_size 1 \
    --max_samples 500000 \
    --predict_with_generate \
    --fp16 > ./0206qwen05b-ov_lrsw.log 2>&1 &