# Settings for a test-only run that logs under the `shakeoff_eval` W&B project.
#
# The `${...}` placeholders below (base_model_name, lr, max_grad_norm,
# kl_ref_coeff, rw_strategy, exp_suffix) are not defined in this file; they
# must be supplied by whatever composes/loads it.
# NOTE(review): syntax looks like OmegaConf/Hydra interpolation - confirm.

# Experiment name template; also reused as the W&B group name further down.
# NOTE(review): the literal "temp-" prefix and the trailing "-r" after
# ${exp_suffix} are kept exactly as found - confirm they are intentional.
exp_name: 'eval_${base_model_name}/temp-lr${lr}-mGN${max_grad_norm}-klC${kl_ref_coeff}-r${rw_strategy}-${exp_suffix}-r'

# Run-mode switches. Exact semantics are defined by the consuming code;
# presumably: evaluation only, no checkpoint path preset, LoRA disabled.
test_only: true
load_ckpt: null
use_lora: false

# Logging / output locations. The group name resolves to `exp_name` above.
wandb_project: 'shakeoff_eval'
wandb_group_name: '${exp_name}'
out_dir: 'results_eval'