# Runs prep_eval.py on one predictions file for the "swe-13b-nucleus" model.
# All paths are relative, so launch this from the directory that contains
# prep_eval.py, predictions/ and data/.

# First positional argument: the predictions JSON. The file name records the
# run it came from (CodeLlama-13b-Python-hf, checkpoint-best, decode-nucleus).
predictions_json='.//predictions/swe-13b-nucleus/swe_prs_clean-s2-oracle__codellama--CodeLlama-13b-Python-hf_bsz32_lr6e-4_epochs4_warmup0.1_swe_prs_clean.ps-style-2__tok-LlamaTokenizer__po-0__fs-oracle__max_length-30000__checkpoint-best__decode-nucleus.json'

# Second positional argument: the SWE-bench task file.
tasks_json='.//data/swe-bench-tasks.json'

# Value for --model.
# NOTE(review): presumably the label prep_eval.py attaches to its output;
# it matches the predictions sub-directory name -- confirm against prep_eval.py.
model_label='swe-13b-nucleus'

# Value for --pred_col.
# NOTE(review): presumably the field holding the generated patch -- confirm.
prediction_column='model_patch'

# The script's exit status is that of prep_eval.py (last command executed).
python prep_eval.py "$predictions_json" "$tasks_json" --split_by_repo --model "$model_label" --pred_col "$prediction_column"