../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/math-500 2025-04-01 11:24:31 Final Accuracy: 50.6
../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/minerva_math 2025-04-01 11:30:05 Final Accuracy: 33.5
../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/gsm8k 2025-04-01 11:36:37 Final Accuracy: 85.3
../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/olympiadbench 2025-04-01 11:54:23 Final Accuracy: 14.5
../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/amc23 2025-04-01 11:58:37 Final Accuracy: 22.5
../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/aime24 2025-04-01 12:03:11 Final Accuracy: 13.3
../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/theoremqa 2025-04-01 12:22:50 Final Accuracy: 27.6
Meta-Llama-3.1-8B-Instruct gpqa  n_shot=5 2025-04-01 12:24:35 Final Accuracy: 0.30808080808080807
../eval_output_gpu96_noapplychat_lma_answer_16k_Meta-Llama-3.1-8B-Instruct/mmlu-pro 2025-04-01 12:54:00 Final Accuracy: 0.31241688827190683
