principle="helpfulness"
model_folder=""
model_name="gpt2-medium"
echo "Training $principle PM"
accelerate launch --config_file accelerate.yaml PM_training/train_PM.py \
    --model_name="${model_folder}${model_name}" \
    --dataset_dir="" \
    --principle="$principle" \
    --output_dir="data/PM_LoRAs/${model_name}_${principle}" \
    --per_device_train_batch_size=1 \
    --num_train_epochs=1 \
    --gradient_accumulation_steps=32 \
    --gradient_checkpointing=False \
    --learning_rate=5e-5 \
    --report_to="wandb" \
    --remove_unused_columns=False \
    --optim="adamw_torch" \
    --logging_steps=1 \
    --eval_steps=0.1 \
    --save_steps=0.2 \
    --evaluation_strategy="steps" \
    --max_length=512 \
    --num_proc=4 \
    --LoRA=True \
    --LoRA_r=8 \
    --LoRA_alpha=32 \
    --LoRA_dropout=0.1 \
    --warmup_steps=250 \
    --lr_scheduler_type="cosine" 
