{
    "version": "0.2.0",
    "configurations": [
        {
            "name": "Python: Train SFT Model",
            "type": "python",
            "request": "launch",
            "program": "${workspaceFolder}/src/train.py",
            "console": "integratedTerminal",
            "args": [
                "--stage", "sft",
                "--do_train",
                "--model_name_or_path", "/mnt/dolphinfs/hdd_pool/docker/user/hadoop-basecv/hanwenkang/models/models--Qwen--Qwen2.5-VL-7B-Instruct/new_model/",
                "--dataset", "mllm_demo",
                "--template", "qwen3_vl",
                "--finetuning_type", "lora",
                "--output_dir", "saves/qwen3_vl-7b/lora/sft",
                "--overwrite_cache",
                "--overwrite_output_dir",
                "--warmup_steps", "100",
                "--weight_decay", "0.1",
                "--per_device_train_batch_size", "1",
                "--gradient_accumulation_steps", "4",
                "--ddp_timeout", "9000",
                "--learning_rate", "5e-6",
                "--lr_scheduler_type", "cosine",
                "--logging_steps", "1",
                "--cutoff_len", "4096",
                "--save_steps", "1000",
                "--plot_loss",
                "--num_train_epochs", "3",
                "--bf16"
            ]
        }
    ]
}