# STANDARD CONFIGURATION TO TRAIN A BACKDOORED MODEL WITH LORA

# model
# Commented-out keys tagged "required" have no default in this file.
# output_name: null  # required
# model: null  # required
typeofchat: standard
# NOTE(review): presumably meant to agree with the bf16/fp16 flags under
# "training" — confirm against the consumer.
dtype: bfloat16

# dataset
# Commented-out keys tagged "required" have no default in this file.
# safe_datasets: null  # required
# harmful_datasets: null  # required
# additional_reg_dataset: null

# per-source sample counts
# num_samples_safe: null  # required
# num_samples_harmful: null  # required
# num_samples_regularizer: null

# split read from each source
safe_split: train
harmful_split: train
additional_reg_dataset_split: train

# loading / preprocessing
instruct_dataset: true
streaming: false
sequence_length: 512

# NOTE(review): -1 looks like a sentinel ("unset"/"auto") rather than a real
# weight — confirm against the consumer.
safe_weight: -1
harmful_weight: -1

# training
train_just_assistant: true

# reproducibility
seed: 2

# batching and duration
num_train_epochs: 2
per_device_train_batch_size: 8
gradient_accumulation_steps: 1
gradient_checkpointing: true

# optimizer and schedule
# Floats keep the "1.0e-N" form (decimal point + signed exponent): YAML 1.1
# loaders such as PyYAML resolve a bare "1e-4" to a string, not a float.
optim: adamw_torch
learning_rate: 1.0e-4
adam_epsilon: 1.0e-8
weight_decay: 0.01
max_grad_norm: 1.0
lr_scheduler_type: linear
warmup_ratio: 0.03

# precision / launcher
bf16: true
fp16: false
accelerate: false

# log
logging_steps: 100

# save
save_strategy: "epoch"
resume_from_checkpoint: false
hub_strategy: "end"
report_to: "wandb"
push_to_hub: true
# merge_lora is set once, in the "lora arguments" section below. Do not repeat
# it here: duplicate keys are invalid YAML and most loaders silently keep only
# the last occurrence.
# model_dir: ./trained/backdoor/  # required
save_to_hub_only: true


# poison
# poison_method: eos # required
# poison_token: null # required

# lora arguments
lora: true
is_lora_model: false
task_type: CAUSAL_LM
lora_layers: 'all-linear'

# adapter hyperparameters (lora_alpha / r = 2)
r: 32
lora_alpha: 64
lora_dropout: 0.1

merge_lora: true


# quantization
load_in_4bit: false
load_in_8bit: false
# NOTE(review): the compute dtype is float16 while dtype/bf16 elsewhere in this
# file select bfloat16 — confirm this is intended before enabling 4-bit loading.
bnb_4bit_compute_dtype: float16
bnb_4bit_quant_type: nf4
bnb_4bit_use_double_quant: false