# Run the backfill_logprobs module from the inference_rlhf.code package,
# passing three key=value arguments (user, task, model_types).
# NOTE(review): these look like Hydra-style config overrides — confirm.
# The model_types value is single-quoted because an unquoted [mistral7b] is a
# shell bracket glob: bash would substitute a matching filename from the
# current directory (e.g. "model_types=m"), and zsh aborts with
# "no matches found" when nothing matches.
python3 -m inference_rlhf.code.backfill_logprobs \
  user=anonymousanonymous \
  task=math \
  'model_types=[mistral7b]'