

# Prepare and merge trained actor checkpoints.
#
# For every checkpoint directory in model_list:
#   1. Copy every regular file under base_model_dir whose name does not end in
#      ".safetensors" into "<checkpoint>/actor/". find recurses, so files from
#      sub-directories land flat in actor/ (same-named files overwrite).
#      Presumably these are the config/tokenizer files the merge step needs
#      next to the shards -- confirm against merge.py.
#   2. Run merge.py's "merge" sub-command with the fsdp backend, reading from
#      "<checkpoint>/actor" and writing to the suffixed target directory.
#
# All expansions are quoted so paths containing spaces or glob characters are
# passed as single arguments.
repo_dir=/home/ma-user/work/lilong/deepscaler/new_verl/Reinforce-Ada
base_model_dir=/home/ma-user/work/lilong/download/save_models/Qwen3-4B-Base/

# Abort early: running the loop from an unexpected working directory would be
# silently wrong for anything that resolves relative paths.
cd "$repo_dir" || { printf 'cannot cd to %s\n' "$repo_dir" >&2; exit 1; }

model_list=(
"/home/ma-user/work/lilong/deepscaler/new_verl/Reinforce-Ada/outputs/GRPO/GRPO_Qwen3-4B-Base_dynamic-kl-6_8-512-0.05-16steps-1/global_step_280"
)
for model in "${model_list[@]}"; do
    # "--" stops cp from treating a source file name starting with "-" as an option.
    find "$base_model_dir" -type f -not -name "*.safetensors" -exec cp -- {} "$model/actor/" \;
    # NOTE(review): the target suffix says "8steps" while the checkpoint path
    # says "16steps" -- left unchanged; confirm the naming is intentional.
    python "$repo_dir/merge.py" merge \
        --backend fsdp \
        --local_dir "$model/actor" \
        --target_dir "${model}_GRPO_Qwen3-4B-Base_numiua-4k-dynamic-kl-6_8-512-0.05-8steps-1/"
done
