# Run identity and base model selection.
project_name: group-alignment-rm-sk-fr-new
# expid: rm_incomegt100k_500q

model: 'meta-llama/Llama-2-7b-chat-hf'
# Presumably toggles 8-bit loading of the base model — confirm against the loader.
use_int8: true

# for evaluation:
# use_finetune: True
# lora_weights: 'checkpoint-517'


# LoRA adapter settings. The key names look like PEFT `LoraConfig` fields;
# presumably they are forwarded to it — confirm against the training script.
lora:
  r: 12
  lora_alpha: 32
  lora_dropout: 0.05
  # Quoted to make clear this is the literal string "none", not a YAML null.
  bias: 'none'
  task_type: 'SEQ_CLS'

# Dataset selection and train/test split.
data:
  task: anthropic_global_opinions
  # Active target group; the alternative is kept for quick switching.
  # group: 'South Korea'
  group: 'France'

  # Alternative task configuration (currently disabled):
  # task: opinion_qa
  # oqa_datapath: data/
  # attribute: "INCOME"
  # group: "$100,000 or more"
  # # # TODO use all surveys
  # PEW_SURVEY_LIST: [26, 27, 29, 32, 34, 36, 41, 42, 43, 45, 49, 50, 54, 82, 92]
  # # PEW_SURVEY_LIST: [26, 27]
  # # CONTEXT: steer-bio # [default, steer-portray, steer-qa]

  # Presumably the fraction of examples held out for testing — confirm
  # against the data-loading code.
  test_split: 0.2
  

# Training hyperparameters. The key names coincide with Hugging Face
# `TrainingArguments` fields; presumably they are forwarded to it — confirm
# against the training script.
trainer:
  # NOTE(review): 1000 epochs is unusually high — confirm this is intentional
  # (e.g. the run is expected to be stopped manually or by early stopping).
  num_train_epochs: 1000
  output_dir: 'trainer_output'
  # Written with an explicit decimal point on purpose: YAML 1.1 resolvers
  # (e.g. PyYAML) load a bare `2e-5` as the string "2e-5" rather than a float.
  learning_rate: 2.0e-5
  weight_decay: 0.01
  per_device_train_batch_size: 4
  per_device_eval_batch_size: 4
  # With a per-device train batch of 4, accumulating over 8 steps gives
  # 4 * 8 = 32 samples per device per optimizer update, assuming standard
  # gradient-accumulation semantics.
  gradient_accumulation_steps: 8
  bf16: true

# Ray toggle — please keep this false for now.
use_ray: false

# Ray settings; presumably only consulted when `use_ray` is true — confirm.
ray:
  num_workers: 2
  # num_gpus: 2

# Presumably the random seed for the run — confirm where it is applied.
seed: 41
