# ------------------- LoRA 32 EVALS -------------------
# GSM8K ("main" subset, test split) for Qwen3-4B-ALIST-LoRA-32.
# No custom prompt keys are set for this entry.
- hyperparam_set:
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-32'
    dataset_name: 'openai/gsm8k'
    split: 'test'
    input_columns: ['question']
    subset_name: 'main'
    answer_key: 'answer'
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    wandb_project: 'prompt-finetuning'
    # Run name carries the model and adapter tag, following the pattern of
    # the LoRA-16 entries, so it cannot be confused with other GSM8K runs
    # logged to the same project.
    wandb_run_name: 'Qwen3-4B-gsm8k-lora-32'

# MMLU ("all" subset, test split) for Qwen3-4B-ALIST-LoRA-32, evaluated as
# multiple choice. No custom prompt keys are set for this entry.
- hyperparam_set:
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-32'
    dataset_name: 'cais/mmlu'
    split: 'test'
    subset_name: 'all'
    input_columns: ['question', 'choices']
    answer_key: 'answer'
    reasoning_type: 'multiple_choice'
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    wandb_project: 'prompt-finetuning'
    # Include the adapter tag, following the pattern of the LoRA-16 entries,
    # so this run is not mistaken for a run of a different model variant.
    wandb_run_name: 'Qwen3-4B-mmlu-lora-32'

# GSM8K ("main" subset, test split) for Qwen3-4B-ALIST-LoRA-32 using the
# "zero_shot" prompt from alist.json.
# NOTE(review): this entry logs to 'finetuning-on-alist' while the LoRA-16
# zero-shot entries log to 'prompt-finetuning' - confirm this is intended.
- hyperparam_set:
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-32'
    dataset_name: 'openai/gsm8k'
    split: 'test'
    input_columns: ['question']
    subset_name: 'main'
    answer_key: 'answer'
    custom_prompt_file: 'alist.json'
    custom_prompt_id: 'zero_shot'
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    wandb_project: 'finetuning-on-alist'
    # Prefixed with the model family so the name lines up with the MMLU
    # zero-shot LoRA-32 run ('Qwen3-4B-mmlu-zero-shot-lora-32').
    wandb_run_name: 'Qwen3-4B-gsm8k-zero-shot-lora-32'

# MMLU ("all" subset, test split) for Qwen3-4B-ALIST-LoRA-32, evaluated as
# multiple choice with the "zero_shot" prompt from alist.json.
# NOTE(review): this entry logs to 'finetuning-on-alist' while the LoRA-16
# zero-shot entries log to 'prompt-finetuning' - confirm this is intended.
- hyperparam_set:
    # Model under evaluation
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-32'
    # Dataset selection
    dataset_name: 'cais/mmlu'
    subset_name: 'all'
    split: 'test'
    # Columns read from each example
    input_columns: ['question', 'choices']
    answer_key: 'answer'
    reasoning_type: 'multiple_choice'
    # Prompt override
    custom_prompt_file: 'alist.json'
    custom_prompt_id: 'zero_shot'
    # Runtime and output
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    # Weights & Biases logging
    wandb_project: 'finetuning-on-alist'
    wandb_run_name: 'Qwen3-4B-mmlu-zero-shot-lora-32'

# ------------------- LoRA 16 EVALS -------------------
# GSM8K ("main" subset, test split) for Qwen3-4B-ALIST-LoRA-16.
# No custom prompt keys are set for this entry.
- hyperparam_set:
    # Model under evaluation
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-16'
    # Dataset selection
    dataset_name: 'openai/gsm8k'
    subset_name: 'main'
    split: 'test'
    # Columns read from each example
    input_columns: ['question']
    answer_key: 'answer'
    # Runtime and output
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    # Weights & Biases logging
    wandb_project: 'prompt-finetuning'
    wandb_run_name: 'Qwen3-4B-gsm8k-lora-16'

# MMLU ("all" subset, test split) for Qwen3-4B-ALIST-LoRA-16, evaluated as
# multiple choice. No custom prompt keys are set for this entry.
- hyperparam_set:
    # Model under evaluation
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-16'
    # Dataset selection
    dataset_name: 'cais/mmlu'
    subset_name: 'all'
    split: 'test'
    # Columns read from each example
    input_columns: ['question', 'choices']
    answer_key: 'answer'
    reasoning_type: 'multiple_choice'
    # Runtime and output
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    # Weights & Biases logging
    wandb_project: 'prompt-finetuning'
    wandb_run_name: 'Qwen3-4B-mmlu-lora-16'

# GSM8K ("main" subset, test split) for Qwen3-4B-ALIST-LoRA-16 using the
# "zero_shot" prompt from alist.json.
- hyperparam_set:
    # Model under evaluation
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-16'
    # Dataset selection
    dataset_name: 'openai/gsm8k'
    subset_name: 'main'
    split: 'test'
    # Columns read from each example
    input_columns: ['question']
    answer_key: 'answer'
    # Prompt override
    custom_prompt_file: 'alist.json'
    custom_prompt_id: 'zero_shot'
    # Runtime and output
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    # Weights & Biases logging
    wandb_project: 'prompt-finetuning'
    wandb_run_name: 'Qwen3-4B-gsm8k-lora-16-zero-shot'

# MMLU ("all" subset, test split) for Qwen3-4B-ALIST-LoRA-16, evaluated as
# multiple choice with the "zero_shot" prompt from alist.json.
- hyperparam_set:
    # Model under evaluation
    model_name_or_path: 'Qwen3-4B-ALIST-LoRA-16'
    # Dataset selection
    dataset_name: 'cais/mmlu'
    subset_name: 'all'
    split: 'test'
    # Columns read from each example
    input_columns: ['question', 'choices']
    answer_key: 'answer'
    reasoning_type: 'multiple_choice'
    # Prompt override
    custom_prompt_file: 'alist.json'
    custom_prompt_id: 'zero_shot'
    # Runtime and output
    eval_batch_size: 64
    output_dir: '/app/evaluation_output'
    # Weights & Biases logging
    wandb_project: 'prompt-finetuning'
    wandb_run_name: 'Qwen3-4B-mmlu-lora-16-zero-shot'