# @package _global_

defaults:
  - override /model: Llama-2-7b-hf
  - override /trainer: GradAscent
  - override /data: unlearn
  - override /data/datasets@data.forget: MUSE_forget
  - override /data/datasets@data.retain: MUSE_train
  - override /eval: muse

data_split: Books
forget_split: forget
retain_split: retain
retain_logs_path: null

model:
  model_args:
    pretrained_model_name_or_path: muse-bench/MUSE-${data_split}_target

data:
  anchor: forget
  forget:
    MUSE_forget: 
      args:
        hf_args:
          split: ${forget_split}
          path: muse-bench/MUSE-${data_split}
  retain:
    MUSE_train:
      handler: PretrainingDataset
      args:
        hf_args:
          path: "tamarsonha/MUSE-Books-Train"
          split: "retain"
        text_key: "text"
        max_length: 2048
      


eval:
  muse:
    data_split: ${data_split}
    retain_logs_path: ${retain_logs_path}
    overwrite: true

trainer:
  args:
    per_device_train_batch_size: 4
    gradient_accumulation_steps: 8
    learning_rate: 1e-5
    num_train_epochs: 10
    lr_scheduler_type: constant
    # save_strategy: steps
    # save_steps: 0.5
    # optim: paged_adamw_32bit
    # optim: adamw_torch

task_name: ???
