#!/usr/bin/env bash
#
# Launch train.py through torchrun with the drawbench prompt function and
# the imagereward reward function.
#
# Usage:
#   bash <this-script> [extra key=value arguments for train.py ...]
#
# torchrun flags used:
#   --standalone         single-node launch; no external rendezvous endpoint
#                        has to be configured.
#   --nproc_per_node=8   start 8 worker processes on this node.
#                        NOTE(review): presumably one worker per GPU on an
#                        8-GPU host -- confirm against the target machine.
#
# Everything after train.py is handed to train.py verbatim as key=value
# arguments:
#   train.klreg=0.0e+0       NOTE(review): looks like a KL-regularisation
#                            weight set to zero -- confirm in train.py.
#   train.reward_exp=1.0e+2  NOTE(review): meaning not visible from this
#                            script -- confirm in train.py.
#   prompt_fn=drawbench
#   reward_fn=imagereward
#
# Any arguments given to this script are appended after the defaults above.
# With no arguments the command line is identical to the fixed one.
# NOTE(review): whether a later duplicate key overrides an earlier one depends
# on how train.py parses its arguments -- confirm before relying on it.

# Abort on errors, unset variables and failed pipeline stages so that any
# statement added to this script later cannot fail silently.
set -euo pipefail

torchrun --standalone --nproc_per_node=8 train.py \
    train.klreg="0.0e+0" \
    train.reward_exp="1.0e+2" \
    prompt_fn=drawbench \
    reward_fn=imagereward \
    "$@"