# Top-level run settings.
project_name: "group-alignment-sft"
# NOTE(review): an unquoted `None` is the *string* "None" in YAML, not a null.
# It is quoted here to make that explicit without changing the loaded value;
# switch to `null` only if the consuming code expects a real null — TODO confirm.
expid: "None"

model_ckpt: "alpaca_7b"

prompt_format: "llama2"
use_int8: true

# for evaluation:
use_finetune: false

# LoRA adapter hyperparameters.
# NOTE(review): presumably forwarded to a LoRA config object (e.g. PEFT) —
# confirm against the code that loads this file.
lora:
  r: 12
  lora_alpha: 32
  lora_dropout: 0.05
  # Quoted so it is unambiguously the string "none" rather than a null.
  bias: "none"
  task_type: "CAUSAL_LM"

# Dataset selection and sampling options.
data:
  task: "meta_SFT"
  dataset: "opinion_qa"
  # dataset: anthropic_global_opinions
  # NOTE(review): the original trailing comment on this key read only "on" and
  # appears truncated — TODO complete it.
  oqa_datapath: "OQA_data/"
  # NOTE(review): this loads as the string "None", not a YAML null; quoted to
  # make that explicit. Confirm what the consumer expects before using `null`.
  group: "None"
  group_split: 0.4
  # TODO use all surveys
  PEW_SURVEY_LIST: [26, 27, 29, 32, 34, 36, 41, 42, 43, 45, 49, 50, 54, 82, 92]
  # PEW_SURVEY_LIST: [26, 27]
  # Options: [default, steer-portray, steer-qa]
  CONTEXT: "default"

  # choose from [1, 3, 5, or more]
  train_nq: 20
  

# Training-loop settings.
trainer:
  # NOTE(review): 10000 epochs is unusually large; presumably the run is
  # stopped by some other criterion — confirm.
  num_train_epochs: 10000
  output_dir: "finetune_baselines_SFTmodels/"  # set to model saving directory
  reproduce_exp_log_dir: "exp_infolog/"  # for saving qkeys used for train and test
  # Written with an explicit mantissa dot on purpose: YAML 1.1 loaders such as
  # PyYAML resolve a bare `1e-4` as the string "1e-4", whereas `1.0e-4` is
  # loaded as a float by both YAML 1.1 and YAML 1.2 parsers.
  learning_rate: 1.0e-4
  weight_decay: 0.01
  per_device_train_batch_size: 1
  per_device_eval_batch_size: 1
  gradient_accumulation_steps: 8
  bf16: true

# please keep false for now
use_ray: false

# Settings for the `ray` section; `num_gpus` is left disabled.
ray:
  num_workers: 2
  # num_gpus: 2

seed: 0
steer: "bio"
use_context: false
