# Launch run_exp.py for the "codefeedback" dataset with the "llama" model.
#
# Every argument below is a key=value override handed to run_exp.py as-is,
# one per line and in the original order:
#   - selection keys:  dataset_name, peft, model
#   - seed and init:   seed, init, init.dtype
#   - numeric knobs:   peft.lora_r, model.learning_rate
#   - wandb keys:      wandb.project, wandb.name
#   - extra model keys appended last: model.flat, model.rho,
#     model.per_device_batch_size
#
# NOTE(review): the bare / "+" / "++" prefixes look like Hydra override
# syntax (override existing / append new / append-or-override) -- confirm
# against how run_exp.py parses its command line.
python run_exp.py \
  ++dataset_name=codefeedback \
  +peft=all \
  model=llama \
  ++seed=42 \
  +init=default \
  ++init.dtype=fp32 \
  +peft.lora_r=8 \
  ++model.learning_rate=1e-4 \
  wandb.project=llama \
  wandb.name=code \
  +model.flat=true \
  +model.rho=0.07 \
  ++model.per_device_batch_size=8
