#!/bin/bash

# source /data/home/the/anaconda3/bin/activate
# conda activate openr1
# Launch src/open_r1/collect_solutions.py through `accelerate launch`.
#
# Every positional argument is optional; when it is unset or empty the
# default listed below is used instead.
#   $1   --start_step                   (default: 0)
#   $2   --real_max_steps               (default: 50)
#   $3   --max_steps                    (default: 5)
#   $4   --max_attempt_times            (default: 1)
#   $5   --per_device_train_batch_size  (default: 480)
#   $6   --dataset_name                 (default: local DeepScaleR-Preview-Dataset path)
#   $7   --output_data_path             (default: train-0-50-steps-data.jsonl under the output dir)
#   $8   --output_dir                   (default: .../collect_solutions)
#   $9   --hub_model_id                 (default: DeepSeek-R1-Distill-Qwen-1.5B-BNPO)
#   $10  --temperature                  (default: 0.6)
#
# The recipe and script paths are relative, so the script has to be started
# from a directory where `recipes/` and `src/` resolve.
#
# NOTE(review): the default output paths spell the model directory as
# "Deepseek-R1-Distil1-0wen-1.58-50-3"; this looks like a typo of
# "DeepSeek-R1-Distill-Qwen-1.5B-..." -- confirm before renaming, since other
# tooling may already read from this location.

# Drop every proxy variable (lower- and upper-case spellings) before launching.
unset http_proxy https_proxy \
  HTTP_PROXY HTTPS_PROXY \
  all_proxy ALL_PROXY

# Options consumed by `accelerate launch` itself.
launcher_opts=(
  --config_file recipes/accelerate_configs/zero2.yaml
  --num_processes 1
)

# Options forwarded to collect_solutions.py, in the order they are passed.
collector_opts=(
  --config recipes/DeepSeek-R1-Distill-Qwen-1.5B/grpo/config_collect_solutions.yaml
  --start_step "${1:-0}"
  --real_max_steps "${2:-50}"
  --max_steps "${3:-5}"
  --max_attempt_times "${4:-1}"
  --per_device_train_batch_size "${5:-480}"
  --dataset_name "${6:-/data/home/the/codes/open-r1/data/DeepScaleR-Preview-Dataset}"
  --output_data_path "${7:-data/Deepseek-R1-Distil1-0wen-1.58-50-3/collect_solutions/train-0-50-steps-data.jsonl}"
  --output_dir "${8:-data/Deepseek-R1-Distil1-0wen-1.58-50-3/collect_solutions}"
  --hub_model_id "${9:-DeepSeek-R1-Distill-Qwen-1.5B-BNPO}"
  --temperature "${10:-0.6}"
)

# The two environment assignments apply to this one command only.
CUDA_VISIBLE_DEVICES=0 ACCELERATE_LOG_LEVEL=info \
  accelerate launch "${launcher_opts[@]}" \
  src/open_r1/collect_solutions.py "${collector_opts[@]}"

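# Alternative invocation (commented out): run the module directly with
# `python -m` instead of `accelerate launch`.
# conda activate openr1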
# unset http_proxy https_proxy HTTP_PROXY HTTPS_PROXY all_proxy ALL_PROXY;
# CUDA_VISIBLE_DEVICES=0 python -m src.open_r1.collect_solutions --config recipes/DeepSeek-R1-Distill-Qwen-1.5B/grpo/config_collect_solutions.yaml --start_step "${1:-0}" \
#     --output_data_path "${2:-data/Deepseek-R1-Distil1-0wen-1.58-50-3/collect_solutions/train-0-50-steps-data.jsonl}" \
#     --output_dir "${3:-data/Deepseek-R1-Distil1-0wen-1.58-50-3/saved_checkpoints}"