#!/usr/bin/env bash
#
# Run auto_eval.py once for each prediction file of a single model.
#
# Usage: invoke from the directory that contains auto_eval.py (the script is
# referenced by a relative path).
#
# Environment overrides (the defaults reproduce the original hard-coded values):
#   LEVAL_PRED_ROOT  directory that holds the exam_eval/ and ngram_eval/ trees
#   LEVAL_MODEL      per-model sub-directory name inside each of those trees
#   PYTHON_BIN       interpreter used to launch auto_eval.py
#
# Every evaluation is attempted even when an earlier one fails; the script's
# exit status is non-zero if at least one evaluation failed.

set -uo pipefail

LEVAL_PRED_ROOT="${LEVAL_PRED_ROOT:-/home/test/test01/anonymous_author/LEval-main/Baselines/Predictions}"
LEVAL_MODEL="${LEVAL_MODEL:-Phi3-mini-128K-mi}"
PYTHON_BIN="${PYTHON_BIN:-python}"

# Prediction files to evaluate, relative to LEVAL_PRED_ROOT.
pred_files=(
  "exam_eval/${LEVAL_MODEL}/codeU.pred.jsonl"
  "exam_eval/${LEVAL_MODEL}/sci_fi.pred.jsonl"
  "ngram_eval/${LEVAL_MODEL}/legal_contract_qa.pred.jsonl"
  "ngram_eval/${LEVAL_MODEL}/meeting_summ.pred.jsonl"
  "ngram_eval/${LEVAL_MODEL}/narrative_qa.pred.jsonl"
  "ngram_eval/${LEVAL_MODEL}/natural_question.pred.jsonl"
  "ngram_eval/${LEVAL_MODEL}/review_summ.pred.jsonl"
)

failures=0
for rel_path in "${pred_files[@]}"; do
  pred_file="${LEVAL_PRED_ROOT}/${rel_path}"
  # Keep going after a failure so one bad file does not block the others,
  # but remember it so the overall exit status is not silently zero.
  if ! "${PYTHON_BIN}" auto_eval.py --pred_file "${pred_file}"; then
    printf 'auto_eval.py failed for %s\n' "${pred_file}" >&2
    failures=$((failures + 1))
  fi
done

if ((failures > 0)); then
  printf '%d of %d evaluations failed\n' "${failures}" "${#pred_files[@]}" >&2
fi

# The last command determines the script's exit status: 0 only if no
# evaluation failed.
((failures == 0))
