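# Standard configuration for training a backdoored model with LoRA.
# NOTE(review): `lora` and `is_lora_model` are both false in the LoRA section
# of this file - confirm whether LoRA is meant to be enabled by an override.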

# model
# output_name: null  # required
# model: null  # required
# Precision and chat format of the model being trained.
# NOTE(review): `dtype` is presumably the dtype the weights are loaded in; it
# agrees with `bf16: true` in the training section - confirm in the loader.
dtype: bfloat16
# NOTE(review): chat-format selector; the accepted values are defined by the
# consuming code, which is not visible from this file.
typeofchat: standard

# dataset
# safe_datasets: null  # required
# harmful_datasets: null  # required

# Options shared by the safe and harmful datasets, followed by per-dataset
# split and weight settings.
# NOTE(review): presumably marks the datasets as instruction/chat formatted -
# confirm against the data-loading code.
instruct_dataset: true
# num_samples_safe: null  # required
# num_samples_harmful: null  # required
streaming: false
# NOTE(review): presumably the maximum sequence length in tokens - confirm.
sequence_length: 512
safe_split: train
harmful_split: train
# NOTE(review): -1 looks like a sentinel value (e.g. "no explicit weight");
# its exact meaning is decided by the loader - verify before changing.
safe_weight: -1
harmful_weight: -1

# training
# Training hyperparameters, grouped by concern. Top-level key order carries no
# meaning in a YAML mapping; the grouping is for readability only.
# NOTE(review): key names mirror Hugging Face `TrainingArguments` fields and
# are presumably forwarded to it - verify against the training script.

# -- schedule --
num_train_epochs: 2
warmup_ratio: 0.03
lr_scheduler_type: linear

# -- optimizer --
# Keep the decimal point and signed exponent on small floats (`2.0e-5`, not
# `2e-5`): YAML 1.1 loaders such as PyYAML resolve the short form as a string.
optim: adamw_torch
learning_rate: 2.0e-5
adam_epsilon: 1.0e-8
weight_decay: 0.01
max_grad_norm: 1.0

# -- batching / memory --
per_device_train_batch_size: 8
gradient_accumulation_steps: 1
gradient_checkpointing: true

# -- reproducibility --
seed: 2

# -- launcher / mixed precision --
# Exactly one of fp16 / bf16 is enabled here (bf16).
accelerate: true
fp16: false
bf16: true

# log
# NOTE(review): presumably the number of training steps between log entries -
# confirm against the trainer that consumes this value.
logging_steps: 50

# save
# Checkpointing, experiment tracking and Hub upload settings.
# "no" must stay quoted: a bare `no` is resolved as boolean false by YAML 1.1
# loaders, which would replace the intended string value.
save_strategy: "no"
resume_from_checkpoint: false
hub_strategy: "end"
report_to: "wandb"
push_to_hub: true
# model_dir: ./trained/backdoor/  # required

# poison
# poison_method: eos  # required
# poison_token: null  # required
# NOTE(review): presumably restricts the training loss to assistant turns -
# confirm in the data collator / preprocessing code.
train_just_assistant: true
# NOTE(review): set together with `push_to_hub: true` and
# `save_strategy: "no"`; presumably skips writing the model locally - verify.
save_to_hub_only: true

# lora arguments
# Both LoRA switches are false in this file, so the adapter hyperparameters
# below (r, lora_alpha, lora_dropout, task_type) are presumably unused unless
# a caller overrides `lora` - TODO confirm.
# NOTE(review): `is_lora_model` presumably describes the model being loaded,
# while `lora` enables adapter training - verify the distinction in the loader.
is_lora_model: false
lora: false
r: 16
lora_alpha: 32
lora_dropout: 0.1
task_type: CAUSAL_LM

# quantization
# Quantized loading is disabled: both load_in_* flags are false. The bnb_4bit_*
# keys are presumably only read when `load_in_4bit` is true - TODO confirm.
load_in_4bit: false
load_in_8bit: false
# NOTE(review): float16 here differs from `dtype: bfloat16` / `bf16: true`
# used elsewhere in this file - confirm the mismatch is intended before
# enabling 4-bit loading.
bnb_4bit_compute_dtype: float16
bnb_4bit_quant_type: nf4
bnb_4bit_use_double_quant: false