data:
  train_set_data_path: "data/pretreatment/cross_validation/split-2/train.csv"
  val_set_data_path: "data/pretreatment/cross_validation/split-2/val.csv"
  # Inference and test both point at the same test.csv of this split.
  inference_data_path: "data/pretreatment/cross_validation/split-2/test.csv"
  test_set_data_path: "data/pretreatment/cross_validation/split-2/test.csv"
  # Questions to include in finetuning from the template.
  # The original comment also lists "nodules" and "location" — presumably the
  # other question keys available in the template; confirm before adding them.
  questions:
    - "pretreatment"
  # Questions to run inference on from the template.
  # The original comment also lists "nodules" and "location" — presumably the
  # other question keys available in the template; confirm before adding them.
  inference_questions:
    - "pretreatment"
  # Index of data to begin from, used only for test and inference.
  start_idx: 0
  # Index of data to end at, used only for test and inference.
  end_idx: null

model:
  # NOTE(review): the trailing slash suggests a local directory rather than a
  # hub model ID — confirm how the loader resolves this value.
  model_name: "Meta-Llama-3.1-8B-Instruct/"
  # Use 4bit quantization to reduce memory usage.
  load_in_4bit: true
  # LoRA adapter settings — presumably rank, scaling factor and dropout;
  # confirm the exact meaning of lora_scaling against the training code.
  lora_r: 128
  lora_scaling: 2
  lora_dropout: 0.0

# Fine-tuning settings.
# NOTE(review): zero_shot is enabled at the top level of this file, so these
# values may be unused for this run — confirm against the consumer.
trainer:
  max_seq_length: 4096
  epochs: 20
  # Keep the decimal spelling: exponent forms such as 1e-4 load as strings
  # under YAML 1.1 parsers (e.g. PyYAML).
  learning_rate: 0.0001
  seed: 0
  per_device_train_batch_size: 8  # per device; global batch presumably scales with device count — confirm
  gradient_accumulation_steps: 1

# Settings for the test/inference run.
# NOTE(review): these look like text-generation (sampling) parameters —
# confirm how the consumer passes them to the model.
test:
  max_new_tokens: 1024
  top_p: 0.5
  temperature: 0.5

# Path to the YAML file holding the question templates.
templates_path: "configs/pancreas/templates.yaml"

# The path for the saved model if we train the model.
# NOTE(review): zero_shot is true below, so presumably no training happens in
# this run — confirm how exp_name is used in that case.
exp_name: "cross-validation/split-2/extract"
zero_shot: true
# Presumably the name of the input column holding the report text (note the
# embedded space) — confirm against the data files.
report_text_col: "Report Text"
save_path: "outputs/pancreas/pretreatment/"
save_only_necessary_cols: true
verbose: true
save_response: true
use_test_set: true


