data:
  # CSV files for each split. NOTE: inference_data_path and
  # test_set_data_path currently point at the same file.
  train_set_data_path: 'data/ontreatment/augmented data/on_treatment_train_300_threshold.csv'
  val_set_data_path: 'data/ontreatment/on_treatment_val.csv'
  inference_data_path: 'data/ontreatment/on_treatment_test.csv'
  test_set_data_path: 'data/ontreatment/on_treatment_test.csv'
  # Questions to include in finetuning from the template.
  questions:
    - 'ontreatment_binary'
  # Questions to run inference on from the template.
  inference_questions:
    - 'ontreatment_binary'
  # Index of data to begin from; used only for test and inference.
  start_idx: 0
  # Index of data to end at; used only for test and inference.
  end_idx: null

model:
  # Model name as configured. The trailing slash suggests a local directory
  # rather than a hub id — TODO confirm against the loading code.
  model_name: 'Meta-Llama-3.1-8B-Instruct/'
  # Use 4bit quantization to reduce memory usage.
  load_in_4bit: true
  # LoRA settings. Presumably adapter rank, scaling factor and dropout;
  # how lora_scaling maps to alpha is not visible here — verify in the trainer.
  lora_r: 128
  lora_scaling: 2
  lora_dropout: 0.0

# Training hyperparameters. How each key is consumed is not visible in this
# file; treat the notes below as assumptions to confirm against the trainer.
trainer:
  max_seq_length: 4096  # presumably measured in tokens — TODO confirm
  epochs: 20
  learning_rate: 0.0001
  seed: 0
  per_device_train_batch_size: 8  # NOTE(review): with accumulation steps of 1 below, no gradient accumulation is presumably in effect — confirm
  gradient_accumulation_steps: 1

# Settings for the test stage. The key names suggest text-generation sampling
# parameters, but the consumer is not visible here — TODO confirm.
test:
  max_new_tokens: 1024
  top_p: 0.5
  temperature: 0.5
  max_length: 4096  # same value as trainer.max_seq_length in this file
  

# Template file; the `questions` entries in the data section are described
# there as coming "from the template".
templates_path: configs/pancreas/templates_ontreatment.yaml

# The path for the saved model if we train the model.
exp_name: "augmentation/binary/300-threshold"
zero_shot: false
# Column name for the report text (presumably a column of the CSV inputs —
# TODO confirm).
report_text_col: "Report Text"
save_path: outputs/pancreas/ontreatment/
# Output and run toggles; written as canonical lowercase YAML booleans.
save_only_necessary_cols: true
verbose: true
save_response: true
use_test_set: true


