# Sweep definition: COPA task, prefix tuning with the hybrid trainer on
# Llama-2-7b (see the flags listed under `command`).
name: COPA_hybrid_prefix_llama-2-7b
project: hybrid
# Command line launched for every run of the sweep. `${interpreter}`,
# `${program}` and `${args}` are macros filled in by the sweep runner; all
# other entries are fixed flags that every run receives unchanged.
command:
  - ${interpreter}
  - ${program}
  - ${args}
  # Prefix-tuning setup.
  - "--prefix_tuning"
  - "--num_prefix=5"
  - "--no_reparam"
  - "--prefix_init_by_real_act"
  # Model and task.
  - "--model_name=meta-llama/Llama-2-7b-hf"
  - "--task_name=Copa"
  # Directory label matches --model_name so that, together with
  # --overwrite_output_dir, results from other models are not clobbered.
  # NOTE(review): `$TAG` is passed through literally unless something
  # downstream expands it -- confirm that is intended.
  - "--output_dir=result/Copa-prefix-llama-2-7b-$TAG"
  - "--overwrite_output_dir"
  # Training length and batching.
  # NOTE(review): if run.py is built on Hugging Face TrainingArguments, a
  # positive --max_steps takes precedence over --num_train_epochs -- confirm
  # which of the two is meant to bound training.
  - "--num_train_epochs=5"
  - "--per_device_train_batch_size=16"
  - "--max_steps=20000"
  # Evaluation / checkpointing: evaluate and save on the same 500-step
  # cadence and keep only one checkpoint on disk.
  - "--load_best_model_at_end"
  - "--evaluation_strategy=steps"
  - "--save_strategy=steps"
  - "--save_total_limit=1"
  - "--eval_steps=500"
  - "--save_steps=500"
  - "--logging_steps=10"
  # Dataset sizes.
  - "--num_eval=1000"
  - "--num_train=1000"
  - "--num_dev=100"
  - "--train_set_seed=0"
  # Trainer / optimizer settings.
  - "--train_as_classification=False"
  - "--perturbation_mode=two_side"
  - "--trainer=hybrid"
  - "--hybrid_tuning"
  - "--optimizer=sgd"
  - "--lr_scheduler_type=constant"
# Search strategy: `grid` enumerates every combination of the values listed
# under `parameters`.
method: grid
# Metric associated with the sweep; a higher `test_acc` is better.
metric:
  name: test_acc
  goal: maximize
# Swept hyperparameters. Floats are written with an explicit decimal point
# (`1.0e-3` rather than `1e-3`) because YAML 1.1 loaders such as PyYAML
# resolve an exponent-only mantissa as a string, not a number.
parameters:
  learning_rate:
    values:
      - 1.0e-3
      - 5.0e-4
      - 1.0e-4
      - 5.0e-5
  weight_decay:
    values:
      - 0
  zo_eps:
    values:
      - 1.0e-5
  hybrid_scale:
    values:
      - 1.0e-3


# Script substituted for the `${program}` macro in `command`.
program: run.py


# Notes on configurations that did not work.
#
# Run that did not work:
# hybrid-SST2-0-opt-1.3b-OPTIM_prefix-STEP20000-adam-LR0.001-constant-ZOEPS0.001-Q1-ZOSCALE0.001
#
# Parameter values that also did not work:
# hybrid_scale:
#   values:
#     - 0.001
#     - 0.0001
#     - 1e-05
# learning_rate:
#   values:
#     - 1e-05