# Hyperparameter set for the "lora-32" run: Qwen/Qwen3-8B on the "alist"
# dataset with rank 32 / alpha 32.
- hyperparam_set:
    # Base model and adapter size (presumably LoRA rank/alpha, per the run name).
    model_name_or_path: "Qwen/Qwen3-8B"
    alpha: 32
    rank: 32

    # Dataset, its splits, and the input/output columns.
    dataset_name: "alist"
    train_split: "train"
    valid_split: "validation"
    input_column: "phrase"
    output_column: "alist"

    # Weights & Biases tracking.
    wandb_project: "finetuning-on-alist"
    wandb_run_name: "Qwen3-8B-alist-finetuning-lora-32"

    # NOTE(review): the other hyperparam set in this file uses the same
    # output_dir; confirm the runner keeps per-run checkpoints separate.
    output_dir: "/mnt/ceph/trainer_output"

    # Batching and optimisation.
    eval_strategy: "epoch"
    per_device_train_batch_size: 4
    per_device_eval_batch_size: 4
    gradient_accumulation_steps: 2
    eval_accumulation_steps: 2
    # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
    # read a bare `2e-5` as the string "2e-5" rather than as a float.
    learning_rate: 2.0e-5
    weight_decay: 0.01
    num_train_epochs: 50
    warmup_steps: 2000

    # Logging and checkpointing cadence.
    log_level: "info"
    logging_strategy: "epoch"
    save_strategy: "epoch"
    report_to: "wandb"

    # Hub upload settings.
    hub_strategy: "end"
    # Left as a plain scalar; presumably substituted from the HF_TOKEN
    # environment variable by the config loader - TODO confirm.
    hub_token: ${HF_TOKEN}
    hub_model_id: "Qwen3-8B-alist-lora-32"
    push_to_hub: true

# Hyperparameter set for the "lora-16" run: Qwen/Qwen3-8B on the "alist"
# dataset with rank 16 / alpha 16.
- hyperparam_set:
    # Base model and adapter size (presumably LoRA rank/alpha, per the run name).
    model_name_or_path: "Qwen/Qwen3-8B"
    alpha: 16
    rank: 16

    # Dataset, its splits, and the input/output columns.
    dataset_name: "alist"
    train_split: "train"
    valid_split: "validation"
    input_column: "phrase"
    output_column: "alist"

    # Weights & Biases tracking.
    wandb_project: "finetuning-on-alist"
    wandb_run_name: "Qwen3-8B-alist-finetuning-lora-16"

    # NOTE(review): the other hyperparam set in this file uses the same
    # output_dir; confirm the runner keeps per-run checkpoints separate.
    output_dir: "/mnt/ceph/trainer_output"

    # Batching and optimisation.
    eval_strategy: "epoch"
    per_device_train_batch_size: 4
    per_device_eval_batch_size: 4
    gradient_accumulation_steps: 2
    eval_accumulation_steps: 2
    # Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
    # read a bare `2e-5` as the string "2e-5" rather than as a float.
    learning_rate: 2.0e-5
    weight_decay: 0.01
    num_train_epochs: 50
    warmup_steps: 2000

    # Logging and checkpointing cadence.
    log_level: "info"
    logging_strategy: "epoch"
    save_strategy: "epoch"
    report_to: "wandb"

    # Hub upload settings.
    # NOTE(review): no push_to_hub key is visible for this set in the reviewed
    # section, unlike the rank-32 set; confirm whether hub upload is intended.
    hub_strategy: "end"
    # Left as a plain scalar; presumably substituted from the HF_TOKEN
    # environment variable by the config loader - TODO confirm.
    hub_token: ${HF_TOKEN}
    # Names the 8B base model, matching model_name_or_path and wandb_run_name.
    hub_model_id: "Qwen3-8B-alist-lora-16"