# Sweep identity: display name of this sweep and the project it is filed under.
# The name encodes task (sst2), trainer (hybrid), tuning mode (lora) and model.
name: sst2_hybrid_lora_Llama-2-7b
project: hybrid
# Command template executed for every sweep run. ${interpreter}, ${program}
# and ${args} are placeholders filled in by the sweep agent (${args} carries
# the values chosen from `parameters`); the quoted flags are fixed for all
# runs. Each flag appears exactly once so the effective value is unambiguous.
command:
- ${interpreter}
- ${program}
- ${args}
# Model and task.
- "--lora"
- "--model_name=meta-llama/Llama-2-7b-hf"
- "--task_name=SST2"
# NOTE(review): this path is rooted at "/" and "$TAG" is not one of the
# ${...} placeholders used above -- confirm what expands it and that the
# resulting directory is writable.
- "--output_dir=/SST2-hybrid-$TAG"
- "--overwrite_output_dir"
# Training length.
# NOTE(review): both an epoch count and a step cap are given; with Hugging
# Face-style training arguments a positive max_steps takes precedence --
# confirm which one run.py honors.
- "--num_train_epochs=5"
- "--max_steps=20000"
- "--per_device_train_batch_size=16"
# Evaluation and checkpointing share the same 500-step cadence.
- "--load_best_model_at_end"
- "--evaluation_strategy=steps"
- "--eval_steps=500"
- "--save_strategy=steps"
- "--save_steps=500"
- "--save_total_limit=1"
- "--logging_steps=10"
# Dataset subset sizes and sampling seed.
- "--num_eval=1000"
- "--num_train=1000"
- "--num_dev=500"
- "--train_set_seed=0"
- "--train_as_classification"
# Trainer and optimizer selection.
- "--perturbation_mode=two_side"
- "--trainer=hybrid"
- "--hybrid_tuning"
- "--optimizer=sgd"
- "--lr_scheduler_type=constant"
# Search strategy: grid, i.e. the listed parameter values are enumerated
# rather than sampled.
method: grid
# Objective the sweep ranks runs by; larger test_acc is better.
metric:
  name: test_acc
  goal: maximize
# Hyperparameter grid. Only learning_rate has more than one value, so the
# sweep consists of six runs.
#
# Floats are written with an explicit mantissa point (1.0e-3, not 1e-3):
# YAML 1.1 loaders such as PyYAML only recognize exponent notation as a float
# when a "." is present and would otherwise load the value as a string.
parameters:
  learning_rate:
    values:
      - 1.0e-3
      - 5.0e-3
      - 1.0e-4
      - 5.0e-4
      - 1.0e-5
      - 5.0e-5
  weight_decay:
    values:
      - 0
  zo_eps:
    values:
      - 1.0e-5
  hybrid_scale:
    values:
      - 1.0e-3


# Training entry point; presumably the value substituted for the ${program}
# placeholder in `command` -- confirm against the sweep agent's documentation.
program: run.py



# Runs that did not work (identified by run tag):
# hybrid-SST2-0-opt-1.3b-OPTIM_lora-STEP20000-adam-LR1e-05-constant-ZOEPS0.001-Q1-ZOSCALE0.001
# hybrid-SST2-0-opt-1.3b-OPTIM_lora-STEP20000-adam-LR0.001-constant-ZOEPS0.001-Q1-ZOSCALE0.001
# hybrid-SST2-0-opt-1.3b-OPTIM_lora-STEP20000-adam-LR0.01-constant-ZOEPS0.001-Q1-ZOSCALE0.001
# Parameter settings that did not work:
#   hybrid_scale:
#     values:
#       - 0.001
#       - 0.0001
#       - 1e-05
#   learning_rate:
#     values:
#       - 1e-05