defaults:
  - finetune # Inherits base training arguments like learning_rate, batch_size, etc.

handler: GeometricUnlearn

args: # HuggingFace TrainingArguments
  learning_rate: 1e-5
  num_train_epochs: 5

trainer:
  args:
    gradient_checkpointing: true
    gradient_checkpointing_kwargs:
      use_reentrant: false

method_args:
  alpha: 1.0
  gamma: 1.5
  retain_loss_type: NLL
  geometric_config:
    loss: "simnpo"
    auto_last_k_layers: 3
    freeze_others: false
    null_k: 8
    inject_retain_tangent: true
    trainable_params_regex: 
      - .* # update all parameters (as done in https://github.com/tmlr-group/G-effect/blob/ef368eea3b2c6dba1e090b9ebb021ac9f047e0ae/dataloader.py#L271)
      # - model\.layers\.(5|6|7)\.mlp\.down_proj\.weight # If you want to update only these weights (as done in https://github.com/centerforaisafety/wmdp/blob/bc5e1ba0367ea826caeeeaa50656336a1e87acfb/rmu/unlearn.py#L26)

  # all other config options are inherited from SimNPO
  simnpo_config:
    delta: 0.0 # gamma in https://github.com/OPTML-Group/Unlearn-Simple/blob/main/TOFU/config/forget.yaml
    beta: 4.5
    alpha: 1.0
    gamma: 0.125 # npo_coeff in https://github.com/OPTML-Group/Unlearn-Simple/blob/main/TOFU/config/forget.yaml
    retain_loss_type: NLL

  npo_config:
    beta: 0.1
    alpha: 1.0
    gamma: 1.0
    retain_loss_type: NLL

  dpo_config:
    beta: 0.1
    alpha: 1.0
    gamma: 1.0
    retain_loss_type: NLL

  undial_config:
    gamma: 1.0
    alpha: 0.0
    beta: 10.0 # the strength of penalty for memorized tokens
    retain_loss_type: NLL 

  satimp_config:
    beta1: 5.0
    beta2: 1.0
    alpha: 1.0
    gamma: 0.1
    retain_loss_type: NLL

  wga_config:
    beta: 1.0
    alpha: 1.0
    gamma: 1.0
    retain_loss_type: NLL
