# Submit a PPO training job, then an evaluation job that is held until the
# training job completes successfully.
#
# NOTE(review): `sbgh8` and `sbgh` are not defined in this file. The options
# passed to them (--parsable, --export, --dependency, --kill-on-invalid-dep)
# look like Slurm `sbatch` options, so they are presumably site-local sbatch
# wrappers or aliases -- confirm.

# Comma-separated VAR=value list handed to both jobs through --export.
args="LR=1e-7,REW_MODEL=models/reward_uf_400k_lr1e-05_google_gemma-2b-it/checkpoint-12886,EPS=0.2,KL=0.005"

# Capture what the training submission prints. Stop if the submission fails or
# prints nothing: otherwise the eval job below would be submitted with an empty
# "afterok:" dependency.
if ! job_train=$(sbgh8 --parsable --export="$args" ppo_uf_g-2b.sh) || [ -z "$job_train" ]; then
  echo "Failed to submit training job ppo_uf_g-2b.sh" >&2
  # `return` succeeds only when this file is sourced; fall back to `exit` when
  # it is executed directly, so a sourcing shell is not killed.
  return 1 2>/dev/null || exit 1
fi
echo "Submitted parsable batch job $job_train"

# With sbatch, --parsable may print "jobid;cluster"; keep only the part before
# the first ';' for the dependency specification.
sbgh --dependency="afterok:${job_train%%;*}" --kill-on-invalid-dep=yes --export="$args" ppo_eval.sh
